diff --git "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" --- "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" +++ "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.575, "train/learning_rate": 2.3768408551068884e-05, "train/epoch": 5.04, "train/global_step": 4500, "_runtime": 29171, "_timestamp": 1646690410, "_step": 4502, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 80.0, 17.0, 11.0, 6.0, 1.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 29497.0, 639.0, 98.0, 53.0, 32.0, 8.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.03125, -59.52392578125, -58.0166015625, -56.50927734375, -55.001953125, -53.49462890625, -51.9873046875, -50.47998046875, -48.97265625, -47.46533203125, -45.9580078125, -44.45068359375, -42.943359375, -41.43603515625, -39.9287109375, -38.42138671875, -36.9140625, -35.40673828125, -33.8994140625, -32.39208984375, -30.884765625, -29.37744140625, -27.8701171875, -26.36279296875, -24.85546875, -23.34814453125, -21.8408203125, -20.33349609375, -18.826171875, -17.31884765625, -15.8115234375, -14.30419921875, -12.796875, -11.28955078125, -9.7822265625, -8.27490234375, -6.767578125, -5.26025390625, -3.7529296875, -2.24560546875, -0.73828125, 0.76904296875, 2.2763671875, 3.78369140625, 5.291015625, 6.79833984375, 8.3056640625, 9.81298828125, 11.3203125, 12.82763671875, 14.3349609375, 15.84228515625, 17.349609375, 18.85693359375, 20.3642578125, 21.87158203125, 23.37890625, 24.88623046875, 26.3935546875, 27.90087890625, 29.408203125, 30.91552734375, 32.4228515625, 33.93017578125, 35.4375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 2.0, 8.0, 14.0, 15.0, 7.0, 25.0, 15.0, 21.0, 22.0, 25.0, 34.0, 32.0, 29.0, 45.0, 37.0, 44.0, 49.0, 58.0, 50.0, 45.0, 54.0, 38.0, 47.0, 36.0, 45.0, 40.0, 28.0, 25.0, 21.0, 23.0, 17.0, 10.0, 7.0, 6.0, 10.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.9805793762207, -37.988128662109375, -36.99567794799805, -36.00322723388672, -35.010780334472656, -34.01832962036133, -33.02587890625, -32.03342819213867, -31.040977478027344, -30.048526763916016, -29.056076049804688, -28.063627243041992, -27.071176528930664, -26.078725814819336, -25.08627700805664, -24.093826293945312, -23.101375579833984, -22.108924865722656, -21.116474151611328, -20.124025344848633, -19.131574630737305, -18.139123916625977, -17.14667510986328, -16.154224395751953, -15.161773681640625, -14.169322967529297, -13.176873207092285, -12.184423446655273, -11.191972732543945, -10.199522018432617, -9.207072257995605, -8.214622497558594, -7.222169876098633, -6.229719638824463, -5.237269401550293, -4.244819164276123, -3.252368927001953, -2.259918689727783, -1.2674684524536133, -0.27501821517944336, 0.7174320220947266, 1.7098822593688965, 2.7023324966430664, 3.6947827339172363, 4.687232971191406, 5.679683208465576, 6.672133445739746, 7.664583683013916, 8.657033920288086, 9.649484634399414, 10.641934394836426, 11.634384155273438, 12.626834869384766, 13.619285583496094, 14.611735343933105, 15.604185104370117, 16.596635818481445, 17.589086532592773, 18.58153533935547, 19.573986053466797, 20.566436767578125, 21.558887481689453, 22.55133819580078, 23.543787002563477, 24.536237716674805]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 1.0, 5.0, 10.0, 11.0, 13.0, 10.0, 14.0, 15.0, 21.0, 23.0, 26.0, 26.0, 39.0, 27.0, 39.0, 32.0, 39.0, 43.0, 53.0, 47.0, 35.0, 46.0, 46.0, 36.0, 45.0, 44.0, 38.0, 33.0, 27.0, 24.0, 17.0, 22.0, 22.0, 17.0, 9.0, 11.0, 10.0, 5.0, 4.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.333877563476562, -27.439260482788086, -26.544641494750977, -25.6500244140625, -24.75540542602539, -23.860788345336914, -22.966171264648438, -22.071552276611328, -21.17693519592285, -20.282318115234375, -19.387699127197266, -18.49308204650879, -17.598464965820312, -16.703845977783203, -15.809228897094727, -14.914610862731934, -14.01999282836914, -13.125374794006348, -12.230756759643555, -11.336139678955078, -10.441521644592285, -9.546903610229492, -8.652286529541016, -7.757668495178223, -6.86305046081543, -5.968432426452637, -5.073814868927002, -4.179197311401367, -3.284579277038574, -2.3899612426757812, -1.4953436851501465, -0.6007261276245117, 0.29389381408691406, 1.188511610031128, 2.083129405975342, 2.9777472019195557, 3.8723649978637695, 4.7669830322265625, 5.661600589752197, 6.556218147277832, 7.450836181640625, 8.345454216003418, 9.240072250366211, 10.134689331054688, 11.02930736541748, 11.923925399780273, 12.81854248046875, 13.713160514831543, 14.607778549194336, 15.502396583557129, 16.397014617919922, 17.2916316986084, 18.186248779296875, 19.080867767333984, 19.97548484802246, 20.870101928710938, 21.764720916748047, 22.659337997436523, 23.553956985473633, 24.44857406616211, 25.34319305419922, 26.237810134887695, 27.132427215576172, 28.02704620361328, 28.921663284301758]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 16.0, 17.0, 33.0, 53.0, 76.0, 112.0, 165.0, 295.0, 420.0, 688.0, 1049.0, 1526.0, 2226.0, 3212.0, 4844.0, 7050.0, 9968.0, 13904.0, 19144.0, 25851.0, 34149.0, 43572.0, 54784.0, 67079.0, 79821.0, 97823.0, 120191.0, 96406.0, 78474.0, 65956.0, 54261.0, 43449.0, 33233.0, 25292.0, 18909.0, 13531.0, 9772.0, 6745.0, 4792.0, 3165.0, 2268.0, 1441.0, 1012.0, 645.0, 400.0, 267.0, 179.0, 112.0, 75.0, 42.0, 29.0, 18.0, 5.0, 9.0, 6.0, 2.0, 1.0, 2.0], "bins": [-61.9375, -60.02978515625, -58.1220703125, -56.21435546875, -54.306640625, -52.39892578125, -50.4912109375, -48.58349609375, -46.67578125, -44.76806640625, -42.8603515625, -40.95263671875, -39.044921875, -37.13720703125, -35.2294921875, -33.32177734375, -31.4140625, -29.50634765625, -27.5986328125, -25.69091796875, -23.783203125, -21.87548828125, -19.9677734375, -18.06005859375, -16.15234375, -14.24462890625, -12.3369140625, -10.42919921875, -8.521484375, -6.61376953125, -4.7060546875, -2.79833984375, -0.890625, 1.01708984375, 2.9248046875, 4.83251953125, 6.740234375, 8.64794921875, 10.5556640625, 12.46337890625, 14.37109375, 16.27880859375, 18.1865234375, 20.09423828125, 22.001953125, 23.90966796875, 25.8173828125, 27.72509765625, 29.6328125, 31.54052734375, 33.4482421875, 35.35595703125, 37.263671875, 39.17138671875, 41.0791015625, 42.98681640625, 44.89453125, 46.80224609375, 48.7099609375, 50.61767578125, 52.525390625, 54.43310546875, 56.3408203125, 58.24853515625, 60.15625]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 3.0, 5.0, 7.0, 8.0, 9.0, 10.0, 13.0, 14.0, 19.0, 20.0, 15.0, 18.0, 15.0, 22.0, 25.0, 25.0, 28.0, 45.0, 51.0, 41.0, 50.0, 39.0, 56.0, 53.0, 31.0, 46.0, 28.0, 35.0, 33.0, 27.0, 31.0, 26.0, 22.0, 13.0, 8.0, 17.0, 11.0, 17.0, 9.0, 8.0, 3.0, 8.0, 5.0, 3.0, 7.0, 3.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-27.046875, -26.14453125, -25.2421875, -24.33984375, -23.4375, -22.53515625, -21.6328125, -20.73046875, -19.828125, -18.92578125, -18.0234375, -17.12109375, -16.21875, -15.31640625, -14.4140625, -13.51171875, -12.609375, -11.70703125, -10.8046875, -9.90234375, -9.0, -8.09765625, -7.1953125, -6.29296875, -5.390625, -4.48828125, -3.5859375, -2.68359375, -1.78125, -0.87890625, 0.0234375, 0.92578125, 1.828125, 2.73046875, 3.6328125, 4.53515625, 5.4375, 6.33984375, 7.2421875, 8.14453125, 9.046875, 9.94921875, 10.8515625, 11.75390625, 12.65625, 13.55859375, 14.4609375, 15.36328125, 16.265625, 17.16796875, 18.0703125, 18.97265625, 19.875, 20.77734375, 21.6796875, 22.58203125, 23.484375, 24.38671875, 25.2890625, 26.19140625, 27.09375, 27.99609375, 28.8984375, 29.80078125, 30.703125]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 10.0, 4.0, 10.0, 9.0, 7.0, 21.0, 22.0, 19.0, 23.0, 23.0, 33.0, 33.0, 40.0, 48.0, 28.0, 49.0, 42.0, 49.0, 57.0, 40.0, 38.0, 39.0, 62.0, 32.0, 39.0, 30.0, 39.0, 30.0, 18.0, 14.0, 21.0, 18.0, 8.0, 5.0, 4.0, 7.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.536663055419922, -19.864686965942383, -19.192712783813477, -18.520736694335938, -17.84876251220703, -17.176786422729492, -16.504812240600586, -15.832836151123047, -15.16086196899414, -14.488886833190918, -13.816911697387695, -13.144936561584473, -12.47296142578125, -11.800986289978027, -11.129011154174805, -10.457035064697266, -9.785059928894043, -9.11308479309082, -8.441109657287598, -7.769134521484375, -7.097159385681152, -6.42518424987793, -5.753208637237549, -5.081233501434326, -4.4092583656311035, -3.737283229827881, -3.065308094024658, -2.3933327198028564, -1.7213575839996338, -1.0493824481964111, -0.3774070739746094, 0.2945680618286133, 0.9665431976318359, 1.6385183334350586, 2.3104934692382812, 2.982468843460083, 3.6544439792633057, 4.326418876647949, 4.99839448928833, 5.670369625091553, 6.342344760894775, 7.014319896697998, 7.686295032501221, 8.358270645141602, 9.030245780944824, 9.702220916748047, 10.37419605255127, 11.046171188354492, 11.718146324157715, 12.390121459960938, 13.06209659576416, 13.734071731567383, 14.406046867370605, 15.078022003173828, 15.749998092651367, 16.421972274780273, 17.093948364257812, 17.76592445373535, 18.437898635864258, 19.109874725341797, 19.781848907470703, 20.453824996948242, 21.12579917907715, 21.797775268554688, 22.469749450683594]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 11.0, 13.0, 18.0, 16.0, 20.0, 24.0, 28.0, 32.0, 27.0, 37.0, 36.0, 42.0, 49.0, 41.0, 53.0, 49.0, 34.0, 38.0, 48.0, 47.0, 37.0, 35.0, 38.0, 25.0, 27.0, 22.0, 16.0, 26.0, 21.0, 16.0, 13.0, 6.0, 11.0, 3.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.259138107299805, -20.608158111572266, -19.95718002319336, -19.30620002746582, -18.65522003173828, -18.004241943359375, -17.353261947631836, -16.702281951904297, -16.05130386352539, -15.400324821472168, -14.749344825744629, -14.098365783691406, -13.447385787963867, -12.796406745910645, -12.145427703857422, -11.494447708129883, -10.843467712402344, -10.192488670349121, -9.541508674621582, -8.89052963256836, -8.23954963684082, -7.588570594787598, -6.937591552734375, -6.286612033843994, -5.635632514953613, -4.984652996063232, -4.333673477172852, -3.682694435119629, -3.031714916229248, -2.380735397338867, -1.7297561168670654, -1.0787768363952637, -0.4277992248535156, 0.22318017482757568, 0.874159574508667, 1.5251389741897583, 2.1761183738708496, 2.8270978927612305, 3.4780771732330322, 4.129056453704834, 4.780035972595215, 5.431015491485596, 6.081995010375977, 6.732974052429199, 7.38395357131958, 8.034933090209961, 8.685912132263184, 9.336891174316406, 9.987871170043945, 10.638850212097168, 11.289830207824707, 11.94080924987793, 12.591789245605469, 13.242768287658691, 13.893747329711914, 14.544727325439453, 15.195706367492676, 15.846685409545898, 16.497665405273438, 17.148645401000977, 17.799623489379883, 18.450603485107422, 19.10158348083496, 19.752561569213867, 20.403541564941406]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 6.0, 20.0, 17.0, 25.0, 42.0, 50.0, 87.0, 131.0, 218.0, 294.0, 538.0, 797.0, 1389.0, 2245.0, 3887.0, 6489.0, 11267.0, 19824.0, 35066.0, 61816.0, 109436.0, 191100.0, 323787.0, 514932.0, 702790.0, 733593.0, 576174.0, 375318.0, 224305.0, 129706.0, 73403.0, 41147.0, 23169.0, 13133.0, 7461.0, 4253.0, 2507.0, 1513.0, 869.0, 537.0, 365.0, 203.0, 135.0, 101.0, 47.0, 27.0, 27.0, 10.0, 10.0, 11.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-23.09375, -22.39697265625, -21.7001953125, -21.00341796875, -20.306640625, -19.60986328125, -18.9130859375, -18.21630859375, -17.51953125, -16.82275390625, -16.1259765625, -15.42919921875, -14.732421875, -14.03564453125, -13.3388671875, -12.64208984375, -11.9453125, -11.24853515625, -10.5517578125, -9.85498046875, -9.158203125, -8.46142578125, -7.7646484375, -7.06787109375, -6.37109375, -5.67431640625, -4.9775390625, -4.28076171875, -3.583984375, -2.88720703125, -2.1904296875, -1.49365234375, -0.796875, -0.10009765625, 0.5966796875, 1.29345703125, 1.990234375, 2.68701171875, 3.3837890625, 4.08056640625, 4.77734375, 5.47412109375, 6.1708984375, 6.86767578125, 7.564453125, 8.26123046875, 8.9580078125, 9.65478515625, 10.3515625, 11.04833984375, 11.7451171875, 12.44189453125, 13.138671875, 13.83544921875, 14.5322265625, 15.22900390625, 15.92578125, 16.62255859375, 17.3193359375, 18.01611328125, 18.712890625, 19.40966796875, 20.1064453125, 20.80322265625, 21.5]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 7.0, 4.0, 7.0, 11.0, 7.0, 15.0, 12.0, 17.0, 21.0, 22.0, 25.0, 20.0, 28.0, 39.0, 31.0, 31.0, 42.0, 45.0, 41.0, 51.0, 43.0, 45.0, 48.0, 44.0, 42.0, 32.0, 38.0, 26.0, 30.0, 25.0, 20.0, 24.0, 21.0, 24.0, 16.0, 15.0, 13.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.8260498046875, -14.355224609375, -13.8843994140625, -13.41357421875, -12.9427490234375, -12.471923828125, -12.0010986328125, -11.5302734375, -11.0594482421875, -10.588623046875, -10.1177978515625, -9.64697265625, -9.1761474609375, -8.705322265625, -8.2344970703125, -7.763671875, -7.2928466796875, -6.822021484375, -6.3511962890625, -5.88037109375, -5.4095458984375, -4.938720703125, -4.4678955078125, -3.9970703125, -3.5262451171875, -3.055419921875, -2.5845947265625, -2.11376953125, -1.6429443359375, -1.172119140625, -0.7012939453125, -0.23046875, 0.2403564453125, 0.711181640625, 1.1820068359375, 1.65283203125, 2.1236572265625, 2.594482421875, 3.0653076171875, 3.5361328125, 4.0069580078125, 4.477783203125, 4.9486083984375, 5.41943359375, 5.8902587890625, 6.361083984375, 6.8319091796875, 7.302734375, 7.7735595703125, 8.244384765625, 8.7152099609375, 9.18603515625, 9.6568603515625, 10.127685546875, 10.5985107421875, 11.0693359375, 11.5401611328125, 12.010986328125, 12.4818115234375, 12.95263671875, 13.4234619140625, 13.894287109375, 14.3651123046875, 14.8359375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 22.0, 26.0, 57.0, 95.0, 165.0, 312.0, 531.0, 938.0, 1650.0, 2751.0, 4885.0, 8658.0, 14777.0, 25628.0, 43270.0, 72783.0, 119442.0, 186944.0, 280334.0, 392445.0, 501492.0, 567422.0, 545115.0, 456980.0, 341490.0, 236681.0, 153440.0, 96635.0, 58651.0, 33813.0, 19933.0, 11359.0, 6712.0, 3757.0, 2147.0, 1250.0, 711.0, 412.0, 244.0, 133.0, 74.0, 51.0, 29.0, 12.0, 9.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.75, -16.222900390625, -15.69580078125, -15.168701171875, -14.6416015625, -14.114501953125, -13.58740234375, -13.060302734375, -12.533203125, -12.006103515625, -11.47900390625, -10.951904296875, -10.4248046875, -9.897705078125, -9.37060546875, -8.843505859375, -8.31640625, -7.789306640625, -7.26220703125, -6.735107421875, -6.2080078125, -5.680908203125, -5.15380859375, -4.626708984375, -4.099609375, -3.572509765625, -3.04541015625, -2.518310546875, -1.9912109375, -1.464111328125, -0.93701171875, -0.409912109375, 0.1171875, 0.644287109375, 1.17138671875, 1.698486328125, 2.2255859375, 2.752685546875, 3.27978515625, 3.806884765625, 4.333984375, 4.861083984375, 5.38818359375, 5.915283203125, 6.4423828125, 6.969482421875, 7.49658203125, 8.023681640625, 8.55078125, 9.077880859375, 9.60498046875, 10.132080078125, 10.6591796875, 11.186279296875, 11.71337890625, 12.240478515625, 12.767578125, 13.294677734375, 13.82177734375, 14.348876953125, 14.8759765625, 15.403076171875, 15.93017578125, 16.457275390625, 16.984375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 3.0, 8.0, 9.0, 8.0, 13.0, 12.0, 14.0, 27.0, 28.0, 30.0, 42.0, 48.0, 45.0, 70.0, 83.0, 101.0, 106.0, 152.0, 138.0, 146.0, 181.0, 193.0, 178.0, 207.0, 199.0, 189.0, 192.0, 210.0, 180.0, 171.0, 146.0, 140.0, 122.0, 114.0, 86.0, 84.0, 61.0, 54.0, 59.0, 49.0, 31.0, 27.0, 26.0, 18.0, 25.0, 16.0, 8.0, 9.0, 4.0, 3.0, 3.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.39453125, -5.197998046875, -5.00146484375, -4.804931640625, -4.6083984375, -4.411865234375, -4.21533203125, -4.018798828125, -3.822265625, -3.625732421875, -3.42919921875, -3.232666015625, -3.0361328125, -2.839599609375, -2.64306640625, -2.446533203125, -2.25, -2.053466796875, -1.85693359375, -1.660400390625, -1.4638671875, -1.267333984375, -1.07080078125, -0.874267578125, -0.677734375, -0.481201171875, -0.28466796875, -0.088134765625, 0.1083984375, 0.304931640625, 0.50146484375, 0.697998046875, 0.89453125, 1.091064453125, 1.28759765625, 1.484130859375, 1.6806640625, 1.877197265625, 2.07373046875, 2.270263671875, 2.466796875, 2.663330078125, 2.85986328125, 3.056396484375, 3.2529296875, 3.449462890625, 3.64599609375, 3.842529296875, 4.0390625, 4.235595703125, 4.43212890625, 4.628662109375, 4.8251953125, 5.021728515625, 5.21826171875, 5.414794921875, 5.611328125, 5.807861328125, 6.00439453125, 6.200927734375, 6.3974609375, 6.593994140625, 6.79052734375, 6.987060546875, 7.18359375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 7.0, 17.0, 9.0, 19.0, 32.0, 27.0, 26.0, 38.0, 41.0, 46.0, 42.0, 46.0, 63.0, 57.0, 51.0, 53.0, 49.0, 43.0, 46.0, 44.0, 29.0, 40.0, 23.0, 22.0, 22.0, 20.0, 17.0, 13.0, 14.0, 10.0, 10.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.262739181518555, -21.616479873657227, -20.9702205657959, -20.32396125793457, -19.677703857421875, -19.031444549560547, -18.38518524169922, -17.73892593383789, -17.092666625976562, -16.446407318115234, -15.800148010253906, -15.153889656066895, -14.507630348205566, -13.861371040344238, -13.215112686157227, -12.568853378295898, -11.92259407043457, -11.276334762573242, -10.630075454711914, -9.983817100524902, -9.337557792663574, -8.691298484802246, -8.045040130615234, -7.398780822753906, -6.752521514892578, -6.10626220703125, -5.46000337600708, -4.81374454498291, -4.167485237121582, -3.521226167678833, -2.874967098236084, -2.228708267211914, -1.582448959350586, -0.9361898899078369, -0.2899308204650879, 0.35632824897766113, 1.0025873184204102, 1.6488463878631592, 2.295105457305908, 2.941364288330078, 3.5876235961914062, 4.233882904052734, 4.880141735076904, 5.526400566101074, 6.172659873962402, 6.8189191818237305, 7.4651780128479, 8.11143684387207, 8.757696151733398, 9.403955459594727, 10.050214767456055, 10.696473121643066, 11.342732429504395, 11.988991737365723, 12.635250091552734, 13.281509399414062, 13.92776870727539, 14.574028015136719, 15.220287322998047, 15.866545677185059, 16.512805938720703, 17.1590633392334, 17.805322647094727, 18.451581954956055, 19.097841262817383]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 7.0, 4.0, 3.0, 5.0, 2.0, 7.0, 11.0, 10.0, 13.0, 14.0, 18.0, 15.0, 24.0, 18.0, 35.0, 29.0, 38.0, 31.0, 47.0, 39.0, 38.0, 32.0, 40.0, 38.0, 44.0, 38.0, 40.0, 41.0, 40.0, 34.0, 30.0, 32.0, 32.0, 30.0, 25.0, 21.0, 16.0, 12.0, 13.0, 5.0, 13.0, 2.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.441852569580078, -14.933212280273438, -14.42457103729248, -13.91593074798584, -13.407289505004883, -12.898649215698242, -12.390008926391602, -11.881368637084961, -11.372727394104004, -10.864087104797363, -10.355445861816406, -9.846805572509766, -9.338165283203125, -8.829524040222168, -8.320883750915527, -7.8122429847717285, -7.30360221862793, -6.794961452484131, -6.286320686340332, -5.777680397033691, -5.269039630889893, -4.760398864746094, -4.251758575439453, -3.7431178092956543, -3.2344770431518555, -2.7258362770080566, -2.217195749282837, -1.7085551023483276, -1.1999144554138184, -0.6912736892700195, -0.1826331615447998, 0.3260073661804199, 0.8346481323242188, 1.343288779258728, 1.8519294261932373, 2.360569953918457, 2.869210720062256, 3.3778514862060547, 3.8864920139312744, 4.395132541656494, 4.903773307800293, 5.412414073944092, 5.921054840087891, 6.429695129394531, 6.93833589553833, 7.446976661682129, 7.9556169509887695, 8.464258193969727, 8.972898483276367, 9.481538772583008, 9.990180015563965, 10.498820304870605, 11.007461547851562, 11.516101837158203, 12.024742126464844, 12.533382415771484, 13.042023658752441, 13.550663948059082, 14.059305191040039, 14.56794548034668, 15.07658576965332, 15.585227012634277, 16.093868255615234, 16.602508544921875, 17.111148834228516]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 8.0, 23.0, 26.0, 42.0, 76.0, 143.0, 194.0, 297.0, 461.0, 601.0, 1000.0, 1503.0, 2283.0, 3368.0, 5158.0, 7444.0, 11054.0, 16163.0, 23374.0, 34634.0, 51588.0, 75700.0, 107618.0, 138430.0, 148397.0, 126377.0, 93180.0, 64477.0, 43554.0, 29505.0, 20133.0, 13615.0, 9107.0, 6298.0, 4240.0, 2844.0, 1857.0, 1327.0, 845.0, 539.0, 360.0, 263.0, 173.0, 99.0, 51.0, 54.0, 33.0, 15.0, 11.0, 2.0, 4.0, 4.0, 2.0, 1.0], "bins": [-22.03125, -21.388671875, -20.74609375, -20.103515625, -19.4609375, -18.818359375, -18.17578125, -17.533203125, -16.890625, -16.248046875, -15.60546875, -14.962890625, -14.3203125, -13.677734375, -13.03515625, -12.392578125, -11.75, -11.107421875, -10.46484375, -9.822265625, -9.1796875, -8.537109375, -7.89453125, -7.251953125, -6.609375, -5.966796875, -5.32421875, -4.681640625, -4.0390625, -3.396484375, -2.75390625, -2.111328125, -1.46875, -0.826171875, -0.18359375, 0.458984375, 1.1015625, 1.744140625, 2.38671875, 3.029296875, 3.671875, 4.314453125, 4.95703125, 5.599609375, 6.2421875, 6.884765625, 7.52734375, 8.169921875, 8.8125, 9.455078125, 10.09765625, 10.740234375, 11.3828125, 12.025390625, 12.66796875, 13.310546875, 13.953125, 14.595703125, 15.23828125, 15.880859375, 16.5234375, 17.166015625, 17.80859375, 18.451171875, 19.09375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 5.0, 6.0, 9.0, 5.0, 5.0, 6.0, 17.0, 13.0, 24.0, 20.0, 25.0, 24.0, 28.0, 34.0, 41.0, 28.0, 20.0, 40.0, 38.0, 40.0, 44.0, 28.0, 38.0, 41.0, 49.0, 43.0, 32.0, 29.0, 20.0, 36.0, 35.0, 21.0, 24.0, 20.0, 18.0, 16.0, 22.0, 8.0, 12.0, 7.0, 6.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.9296875, -13.47509765625, -13.0205078125, -12.56591796875, -12.111328125, -11.65673828125, -11.2021484375, -10.74755859375, -10.29296875, -9.83837890625, -9.3837890625, -8.92919921875, -8.474609375, -8.02001953125, -7.5654296875, -7.11083984375, -6.65625, -6.20166015625, -5.7470703125, -5.29248046875, -4.837890625, -4.38330078125, -3.9287109375, -3.47412109375, -3.01953125, -2.56494140625, -2.1103515625, -1.65576171875, -1.201171875, -0.74658203125, -0.2919921875, 0.16259765625, 0.6171875, 1.07177734375, 1.5263671875, 1.98095703125, 2.435546875, 2.89013671875, 3.3447265625, 3.79931640625, 4.25390625, 4.70849609375, 5.1630859375, 5.61767578125, 6.072265625, 6.52685546875, 6.9814453125, 7.43603515625, 7.890625, 8.34521484375, 8.7998046875, 9.25439453125, 9.708984375, 10.16357421875, 10.6181640625, 11.07275390625, 11.52734375, 11.98193359375, 12.4365234375, 12.89111328125, 13.345703125, 13.80029296875, 14.2548828125, 14.70947265625, 15.1640625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 4.0, 9.0, 8.0, 29.0, 28.0, 47.0, 71.0, 121.0, 149.0, 210.0, 312.0, 526.0, 783.0, 1178.0, 1876.0, 2754.0, 4275.0, 6752.0, 10788.0, 18015.0, 30425.0, 53482.0, 97465.0, 171847.0, 230015.0, 177701.0, 101910.0, 55967.0, 31724.0, 18747.0, 11487.0, 7036.0, 4507.0, 2853.0, 1888.0, 1236.0, 738.0, 516.0, 347.0, 248.0, 170.0, 98.0, 88.0, 41.0, 22.0, 24.0, 14.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.65625, -21.914306640625, -21.17236328125, -20.430419921875, -19.6884765625, -18.946533203125, -18.20458984375, -17.462646484375, -16.720703125, -15.978759765625, -15.23681640625, -14.494873046875, -13.7529296875, -13.010986328125, -12.26904296875, -11.527099609375, -10.78515625, -10.043212890625, -9.30126953125, -8.559326171875, -7.8173828125, -7.075439453125, -6.33349609375, -5.591552734375, -4.849609375, -4.107666015625, -3.36572265625, -2.623779296875, -1.8818359375, -1.139892578125, -0.39794921875, 0.343994140625, 1.0859375, 1.827880859375, 2.56982421875, 3.311767578125, 4.0537109375, 4.795654296875, 5.53759765625, 6.279541015625, 7.021484375, 7.763427734375, 8.50537109375, 9.247314453125, 9.9892578125, 10.731201171875, 11.47314453125, 12.215087890625, 12.95703125, 13.698974609375, 14.44091796875, 15.182861328125, 15.9248046875, 16.666748046875, 17.40869140625, 18.150634765625, 18.892578125, 19.634521484375, 20.37646484375, 21.118408203125, 21.8603515625, 22.602294921875, 23.34423828125, 24.086181640625, 24.828125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 10.0, 6.0, 4.0, 5.0, 12.0, 14.0, 10.0, 16.0, 26.0, 30.0, 30.0, 31.0, 27.0, 35.0, 39.0, 51.0, 54.0, 38.0, 50.0, 34.0, 43.0, 40.0, 45.0, 41.0, 34.0, 38.0, 37.0, 35.0, 31.0, 34.0, 21.0, 15.0, 17.0, 11.0, 7.0, 10.0, 6.0, 9.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.40625, -13.0489501953125, -12.691650390625, -12.3343505859375, -11.97705078125, -11.6197509765625, -11.262451171875, -10.9051513671875, -10.5478515625, -10.1905517578125, -9.833251953125, -9.4759521484375, -9.11865234375, -8.7613525390625, -8.404052734375, -8.0467529296875, -7.689453125, -7.3321533203125, -6.974853515625, -6.6175537109375, -6.26025390625, -5.9029541015625, -5.545654296875, -5.1883544921875, -4.8310546875, -4.4737548828125, -4.116455078125, -3.7591552734375, -3.40185546875, -3.0445556640625, -2.687255859375, -2.3299560546875, -1.97265625, -1.6153564453125, -1.258056640625, -0.9007568359375, -0.54345703125, -0.1861572265625, 0.171142578125, 0.5284423828125, 0.8857421875, 1.2430419921875, 1.600341796875, 1.9576416015625, 2.31494140625, 2.6722412109375, 3.029541015625, 3.3868408203125, 3.744140625, 4.1014404296875, 4.458740234375, 4.8160400390625, 5.17333984375, 5.5306396484375, 5.887939453125, 6.2452392578125, 6.6025390625, 6.9598388671875, 7.317138671875, 7.6744384765625, 8.03173828125, 8.3890380859375, 8.746337890625, 9.1036376953125, 9.4609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 7.0, 22.0, 20.0, 20.0, 47.0, 69.0, 104.0, 157.0, 225.0, 404.0, 650.0, 1116.0, 1883.0, 3216.0, 6064.0, 11887.0, 26365.0, 64331.0, 179406.0, 391830.0, 221115.0, 78593.0, 31136.0, 14013.0, 7071.0, 3566.0, 2059.0, 1205.0, 727.0, 441.0, 276.0, 164.0, 128.0, 67.0, 61.0, 37.0, 21.0, 9.0, 16.0, 9.0, 0.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.40625, -24.650146484375, -23.89404296875, -23.137939453125, -22.3818359375, -21.625732421875, -20.86962890625, -20.113525390625, -19.357421875, -18.601318359375, -17.84521484375, -17.089111328125, -16.3330078125, -15.576904296875, -14.82080078125, -14.064697265625, -13.30859375, -12.552490234375, -11.79638671875, -11.040283203125, -10.2841796875, -9.528076171875, -8.77197265625, -8.015869140625, -7.259765625, -6.503662109375, -5.74755859375, -4.991455078125, -4.2353515625, -3.479248046875, -2.72314453125, -1.967041015625, -1.2109375, -0.454833984375, 0.30126953125, 1.057373046875, 1.8134765625, 2.569580078125, 3.32568359375, 4.081787109375, 4.837890625, 5.593994140625, 6.35009765625, 7.106201171875, 7.8623046875, 8.618408203125, 9.37451171875, 10.130615234375, 10.88671875, 11.642822265625, 12.39892578125, 13.155029296875, 13.9111328125, 14.667236328125, 15.42333984375, 16.179443359375, 16.935546875, 17.691650390625, 18.44775390625, 19.203857421875, 19.9599609375, 20.716064453125, 21.47216796875, 22.228271484375, 22.984375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 11.0, 17.0, 24.0, 42.0, 65.0, 93.0, 154.0, 216.0, 144.0, 63.0, 46.0, 36.0, 23.0, 14.0, 11.0, 5.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003326416015625, -0.0032374560832977295, -0.003148496150970459, -0.0030595362186431885, -0.002970576286315918, -0.0028816163539886475, -0.002792656421661377, -0.0027036964893341064, -0.002614736557006836, -0.0025257766246795654, -0.002436816692352295, -0.0023478567600250244, -0.002258896827697754, -0.0021699368953704834, -0.002080976963043213, -0.0019920170307159424, -0.0019030570983886719, -0.0018140971660614014, -0.0017251372337341309, -0.0016361773014068604, -0.0015472173690795898, -0.0014582574367523193, -0.0013692975044250488, -0.0012803375720977783, -0.0011913776397705078, -0.0011024177074432373, -0.0010134577751159668, -0.0009244978427886963, -0.0008355379104614258, -0.0007465779781341553, -0.0006576180458068848, -0.0005686581134796143, -0.00047969818115234375, -0.00039073824882507324, -0.00030177831649780273, -0.00021281838417053223, -0.00012385845184326172, -3.489851951599121e-05, 5.40614128112793e-05, 0.0001430213451385498, 0.0002319812774658203, 0.0003209412097930908, 0.00040990114212036133, 0.0004988610744476318, 0.0005878210067749023, 0.0006767809391021729, 0.0007657408714294434, 0.0008547008037567139, 0.0009436607360839844, 0.0010326206684112549, 0.0011215806007385254, 0.001210540533065796, 0.0012995004653930664, 0.001388460397720337, 0.0014774203300476074, 0.001566380262374878, 0.0016553401947021484, 0.001744300127029419, 0.0018332600593566895, 0.00192221999168396, 0.0020111799240112305, 0.002100139856338501, 0.0021890997886657715, 0.002278059720993042, 0.0023670196533203125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 17.0, 21.0, 29.0, 49.0, 70.0, 88.0, 119.0, 183.0, 229.0, 369.0, 514.0, 792.0, 1138.0, 1822.0, 2757.0, 4577.0, 8046.0, 14943.0, 27852.0, 54969.0, 108646.0, 205049.0, 262843.0, 169153.0, 87224.0, 44508.0, 22724.0, 12135.0, 6664.0, 3806.0, 2380.0, 1647.0, 977.0, 647.0, 491.0, 339.0, 211.0, 152.0, 106.0, 70.0, 71.0, 34.0, 24.0, 12.0, 18.0, 8.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-21.984375, -21.324951171875, -20.66552734375, -20.006103515625, -19.3466796875, -18.687255859375, -18.02783203125, -17.368408203125, -16.708984375, -16.049560546875, -15.39013671875, -14.730712890625, -14.0712890625, -13.411865234375, -12.75244140625, -12.093017578125, -11.43359375, -10.774169921875, -10.11474609375, -9.455322265625, -8.7958984375, -8.136474609375, -7.47705078125, -6.817626953125, -6.158203125, -5.498779296875, -4.83935546875, -4.179931640625, -3.5205078125, -2.861083984375, -2.20166015625, -1.542236328125, -0.8828125, -0.223388671875, 0.43603515625, 1.095458984375, 1.7548828125, 2.414306640625, 3.07373046875, 3.733154296875, 4.392578125, 5.052001953125, 5.71142578125, 6.370849609375, 7.0302734375, 7.689697265625, 8.34912109375, 9.008544921875, 9.66796875, 10.327392578125, 10.98681640625, 11.646240234375, 12.3056640625, 12.965087890625, 13.62451171875, 14.283935546875, 14.943359375, 15.602783203125, 16.26220703125, 16.921630859375, 17.5810546875, 18.240478515625, 18.89990234375, 19.559326171875, 20.21875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 7.0, 3.0, 6.0, 6.0, 12.0, 15.0, 13.0, 18.0, 29.0, 30.0, 22.0, 28.0, 36.0, 40.0, 44.0, 55.0, 55.0, 57.0, 75.0, 79.0, 65.0, 52.0, 38.0, 34.0, 44.0, 23.0, 16.0, 20.0, 22.0, 10.0, 8.0, 9.0, 10.0, 3.0, 6.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.6942138671875, -4.532958984375, -4.3717041015625, -4.21044921875, -4.0491943359375, -3.887939453125, -3.7266845703125, -3.5654296875, -3.4041748046875, -3.242919921875, -3.0816650390625, -2.92041015625, -2.7591552734375, -2.597900390625, -2.4366455078125, -2.275390625, -2.1141357421875, -1.952880859375, -1.7916259765625, -1.63037109375, -1.4691162109375, -1.307861328125, -1.1466064453125, -0.9853515625, -0.8240966796875, -0.662841796875, -0.5015869140625, -0.34033203125, -0.1790771484375, -0.017822265625, 0.1434326171875, 0.3046875, 0.4659423828125, 0.627197265625, 0.7884521484375, 0.94970703125, 1.1109619140625, 1.272216796875, 1.4334716796875, 1.5947265625, 1.7559814453125, 1.917236328125, 2.0784912109375, 2.23974609375, 2.4010009765625, 2.562255859375, 2.7235107421875, 2.884765625, 3.0460205078125, 3.207275390625, 3.3685302734375, 3.52978515625, 3.6910400390625, 3.852294921875, 4.0135498046875, 4.1748046875, 4.3360595703125, 4.497314453125, 4.6585693359375, 4.81982421875, 4.9810791015625, 5.142333984375, 5.3035888671875, 5.46484375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 11.0, 9.0, 11.0, 12.0, 16.0, 14.0, 15.0, 25.0, 33.0, 27.0, 40.0, 25.0, 49.0, 42.0, 57.0, 44.0, 35.0, 51.0, 55.0, 57.0, 49.0, 40.0, 40.0, 22.0, 23.0, 32.0, 18.0, 30.0, 28.0, 16.0, 10.0, 12.0, 7.0, 9.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.09552001953125, -15.579512596130371, -15.063505172729492, -14.547497749328613, -14.031490325927734, -13.515483856201172, -12.999476432800293, -12.483469009399414, -11.967461585998535, -11.451454162597656, -10.935446739196777, -10.419439315795898, -9.903432846069336, -9.38742446899414, -8.871417999267578, -8.3554105758667, -7.83940315246582, -7.323395729064941, -6.8073883056640625, -6.291381359100342, -5.775373935699463, -5.259366512298584, -4.743359565734863, -4.227352142333984, -3.7113447189331055, -3.1953372955322266, -2.6793301105499268, -2.163322925567627, -1.647315502166748, -1.1313080787658691, -0.6153008937835693, -0.09929370880126953, 0.41671180725097656, 0.9327191114425659, 1.4487264156341553, 1.9647337198257446, 2.480741024017334, 2.996748447418213, 3.5127556324005127, 4.0287628173828125, 4.544770240783691, 5.06077766418457, 5.576785087585449, 6.09279203414917, 6.608799457550049, 7.124806880950928, 7.640813827514648, 8.156821250915527, 8.672828674316406, 9.188836097717285, 9.704843521118164, 10.220850944519043, 10.736858367919922, 11.252864837646484, 11.768872261047363, 12.284879684448242, 12.800887107849121, 13.31689453125, 13.832901954650879, 14.348909378051758, 14.86491584777832, 15.380924224853516, 15.896930694580078, 16.41293716430664, 16.928945541381836]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 6.0, 6.0, 2.0, 7.0, 6.0, 10.0, 15.0, 15.0, 10.0, 19.0, 21.0, 18.0, 26.0, 33.0, 37.0, 32.0, 44.0, 34.0, 37.0, 35.0, 38.0, 42.0, 37.0, 35.0, 41.0, 40.0, 41.0, 41.0, 36.0, 37.0, 29.0, 24.0, 26.0, 26.0, 20.0, 13.0, 10.0, 13.0, 7.0, 9.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.952642440795898, -13.499324798583984, -13.046008110046387, -12.592690467834473, -12.139372825622559, -11.686056137084961, -11.232738494873047, -10.779420852661133, -10.326103210449219, -9.872785568237305, -9.419468879699707, -8.966151237487793, -8.512833595275879, -8.059516906738281, -7.606199264526367, -7.152881622314453, -6.6995649337768555, -6.2462477684021, -5.7929301261901855, -5.33961296081543, -4.886295318603516, -4.43297815322876, -3.979660987854004, -3.526343584060669, -3.073026180267334, -2.619708776473999, -2.166391372680664, -1.7130742073059082, -1.2597568035125732, -0.8064393997192383, -0.3531222343444824, 0.10019516944885254, 0.5535135269165039, 1.0068309307098389, 1.4601482152938843, 1.9134654998779297, 2.3667829036712646, 2.8201003074645996, 3.2734174728393555, 3.7267348766326904, 4.180052280426025, 4.633369445800781, 5.086687088012695, 5.540004253387451, 5.993321418762207, 6.446639060974121, 6.899956226348877, 7.353273391723633, 7.806591033935547, 8.259908676147461, 8.713225364685059, 9.166543006896973, 9.619860649108887, 10.073177337646484, 10.526494979858398, 10.979812622070312, 11.433130264282227, 11.88644790649414, 12.339764595031738, 12.793082237243652, 13.246399879455566, 13.699716567993164, 14.153034210205078, 14.606351852416992, 15.05966854095459]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 9.0, 19.0, 22.0, 39.0, 62.0, 92.0, 175.0, 256.0, 397.0, 644.0, 973.0, 1574.0, 2273.0, 3475.0, 5285.0, 7899.0, 12141.0, 17453.0, 25131.0, 35556.0, 47829.0, 62482.0, 77710.0, 90574.0, 99334.0, 101233.0, 97204.0, 86832.0, 72143.0, 57100.0, 43216.0, 31285.0, 22294.0, 15237.0, 10461.0, 6948.0, 4629.0, 2974.0, 2004.0, 1275.0, 836.0, 534.0, 354.0, 218.0, 137.0, 76.0, 66.0, 29.0, 22.0, 17.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-12.1015625, -11.7152099609375, -11.328857421875, -10.9425048828125, -10.55615234375, -10.1697998046875, -9.783447265625, -9.3970947265625, -9.0107421875, -8.6243896484375, -8.238037109375, -7.8516845703125, -7.46533203125, -7.0789794921875, -6.692626953125, -6.3062744140625, -5.919921875, -5.5335693359375, -5.147216796875, -4.7608642578125, -4.37451171875, -3.9881591796875, -3.601806640625, -3.2154541015625, -2.8291015625, -2.4427490234375, -2.056396484375, -1.6700439453125, -1.28369140625, -0.8973388671875, -0.510986328125, -0.1246337890625, 0.26171875, 0.6480712890625, 1.034423828125, 1.4207763671875, 1.80712890625, 2.1934814453125, 2.579833984375, 2.9661865234375, 3.3525390625, 3.7388916015625, 4.125244140625, 4.5115966796875, 4.89794921875, 5.2843017578125, 5.670654296875, 6.0570068359375, 6.443359375, 6.8297119140625, 7.216064453125, 7.6024169921875, 7.98876953125, 8.3751220703125, 8.761474609375, 9.1478271484375, 9.5341796875, 9.9205322265625, 10.306884765625, 10.6932373046875, 11.07958984375, 11.4659423828125, 11.852294921875, 12.2386474609375, 12.625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 10.0, 4.0, 6.0, 5.0, 10.0, 14.0, 18.0, 16.0, 19.0, 28.0, 24.0, 24.0, 23.0, 33.0, 35.0, 27.0, 43.0, 35.0, 45.0, 42.0, 36.0, 45.0, 37.0, 38.0, 29.0, 32.0, 37.0, 37.0, 27.0, 29.0, 26.0, 24.0, 16.0, 30.0, 13.0, 12.0, 18.0, 19.0, 1.0, 8.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.6484375, -12.205322265625, -11.76220703125, -11.319091796875, -10.8759765625, -10.432861328125, -9.98974609375, -9.546630859375, -9.103515625, -8.660400390625, -8.21728515625, -7.774169921875, -7.3310546875, -6.887939453125, -6.44482421875, -6.001708984375, -5.55859375, -5.115478515625, -4.67236328125, -4.229248046875, -3.7861328125, -3.343017578125, -2.89990234375, -2.456787109375, -2.013671875, -1.570556640625, -1.12744140625, -0.684326171875, -0.2412109375, 0.201904296875, 0.64501953125, 1.088134765625, 1.53125, 1.974365234375, 2.41748046875, 2.860595703125, 3.3037109375, 3.746826171875, 4.18994140625, 4.633056640625, 5.076171875, 5.519287109375, 5.96240234375, 6.405517578125, 6.8486328125, 7.291748046875, 7.73486328125, 8.177978515625, 8.62109375, 9.064208984375, 9.50732421875, 9.950439453125, 10.3935546875, 10.836669921875, 11.27978515625, 11.722900390625, 12.166015625, 12.609130859375, 13.05224609375, 13.495361328125, 13.9384765625, 14.381591796875, 14.82470703125, 15.267822265625, 15.7109375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 6.0, 21.0, 28.0, 38.0, 68.0, 111.0, 159.0, 269.0, 391.0, 607.0, 964.0, 1537.0, 2281.0, 3403.0, 5362.0, 7932.0, 11793.0, 16897.0, 24198.0, 33251.0, 45020.0, 57825.0, 71790.0, 84357.0, 93920.0, 97650.0, 95779.0, 87022.0, 75300.0, 61790.0, 48304.0, 36251.0, 26418.0, 18807.0, 13016.0, 8952.0, 5861.0, 3954.0, 2585.0, 1619.0, 1076.0, 691.0, 430.0, 285.0, 210.0, 139.0, 68.0, 37.0, 25.0, 23.0, 18.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.890625, -11.5147705078125, -11.138916015625, -10.7630615234375, -10.38720703125, -10.0113525390625, -9.635498046875, -9.2596435546875, -8.8837890625, -8.5079345703125, -8.132080078125, -7.7562255859375, -7.38037109375, -7.0045166015625, -6.628662109375, -6.2528076171875, -5.876953125, -5.5010986328125, -5.125244140625, -4.7493896484375, -4.37353515625, -3.9976806640625, -3.621826171875, -3.2459716796875, -2.8701171875, -2.4942626953125, -2.118408203125, -1.7425537109375, -1.36669921875, -0.9908447265625, -0.614990234375, -0.2391357421875, 0.13671875, 0.5125732421875, 0.888427734375, 1.2642822265625, 1.64013671875, 2.0159912109375, 2.391845703125, 2.7677001953125, 3.1435546875, 3.5194091796875, 3.895263671875, 4.2711181640625, 4.64697265625, 5.0228271484375, 5.398681640625, 5.7745361328125, 6.150390625, 6.5262451171875, 6.902099609375, 7.2779541015625, 7.65380859375, 8.0296630859375, 8.405517578125, 8.7813720703125, 9.1572265625, 9.5330810546875, 9.908935546875, 10.2847900390625, 10.66064453125, 11.0364990234375, 11.412353515625, 11.7882080078125, 12.1640625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 11.0, 12.0, 5.0, 12.0, 19.0, 13.0, 19.0, 18.0, 22.0, 32.0, 38.0, 30.0, 40.0, 30.0, 41.0, 42.0, 52.0, 52.0, 47.0, 36.0, 53.0, 45.0, 49.0, 34.0, 34.0, 29.0, 34.0, 35.0, 25.0, 20.0, 17.0, 7.0, 11.0, 16.0, 13.0, 1.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.336181640625, -9.99267578125, -9.649169921875, -9.3056640625, -8.962158203125, -8.61865234375, -8.275146484375, -7.931640625, -7.588134765625, -7.24462890625, -6.901123046875, -6.5576171875, -6.214111328125, -5.87060546875, -5.527099609375, -5.18359375, -4.840087890625, -4.49658203125, -4.153076171875, -3.8095703125, -3.466064453125, -3.12255859375, -2.779052734375, -2.435546875, -2.092041015625, -1.74853515625, -1.405029296875, -1.0615234375, -0.718017578125, -0.37451171875, -0.031005859375, 0.3125, 0.656005859375, 0.99951171875, 1.343017578125, 1.6865234375, 2.030029296875, 2.37353515625, 2.717041015625, 3.060546875, 3.404052734375, 3.74755859375, 4.091064453125, 4.4345703125, 4.778076171875, 5.12158203125, 5.465087890625, 5.80859375, 6.152099609375, 6.49560546875, 6.839111328125, 7.1826171875, 7.526123046875, 7.86962890625, 8.213134765625, 8.556640625, 8.900146484375, 9.24365234375, 9.587158203125, 9.9306640625, 10.274169921875, 10.61767578125, 10.961181640625, 11.3046875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 10.0, 17.0, 24.0, 32.0, 38.0, 35.0, 63.0, 72.0, 87.0, 141.0, 164.0, 216.0, 286.0, 380.0, 543.0, 880.0, 1257.0, 2014.0, 3517.0, 6968.0, 14027.0, 29623.0, 61003.0, 116063.0, 184287.0, 218175.0, 179990.0, 112069.0, 58449.0, 28563.0, 13416.0, 6635.0, 3472.0, 1897.0, 1203.0, 821.0, 545.0, 401.0, 268.0, 217.0, 165.0, 124.0, 86.0, 75.0, 51.0, 56.0, 45.0, 23.0, 19.0, 12.0, 7.0, 6.0, 5.0, 5.0, 7.0, 3.0], "bins": [-10.9453125, -10.6182861328125, -10.291259765625, -9.9642333984375, -9.63720703125, -9.3101806640625, -8.983154296875, -8.6561279296875, -8.3291015625, -8.0020751953125, -7.675048828125, -7.3480224609375, -7.02099609375, -6.6939697265625, -6.366943359375, -6.0399169921875, -5.712890625, -5.3858642578125, -5.058837890625, -4.7318115234375, -4.40478515625, -4.0777587890625, -3.750732421875, -3.4237060546875, -3.0966796875, -2.7696533203125, -2.442626953125, -2.1156005859375, -1.78857421875, -1.4615478515625, -1.134521484375, -0.8074951171875, -0.48046875, -0.1534423828125, 0.173583984375, 0.5006103515625, 0.82763671875, 1.1546630859375, 1.481689453125, 1.8087158203125, 2.1357421875, 2.4627685546875, 2.789794921875, 3.1168212890625, 3.44384765625, 3.7708740234375, 4.097900390625, 4.4249267578125, 4.751953125, 5.0789794921875, 5.406005859375, 5.7330322265625, 6.06005859375, 6.3870849609375, 6.714111328125, 7.0411376953125, 7.3681640625, 7.6951904296875, 8.022216796875, 8.3492431640625, 8.67626953125, 9.0032958984375, 9.330322265625, 9.6573486328125, 9.984375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 13.0, 13.0, 13.0, 13.0, 18.0, 23.0, 31.0, 44.0, 38.0, 43.0, 52.0, 53.0, 62.0, 52.0, 68.0, 58.0, 54.0, 54.0, 43.0, 50.0, 40.0, 38.0, 28.0, 23.0, 12.0, 17.0, 11.0, 4.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009183883666992188, -0.0008923634886741638, -0.0008663386106491089, -0.000840313732624054, -0.000814288854598999, -0.0007882639765739441, -0.0007622390985488892, -0.0007362142205238342, -0.0007101893424987793, -0.0006841644644737244, -0.0006581395864486694, -0.0006321147084236145, -0.0006060898303985596, -0.0005800649523735046, -0.0005540400743484497, -0.0005280151963233948, -0.0005019903182983398, -0.0004759654402732849, -0.00044994056224823, -0.00042391568422317505, -0.0003978908061981201, -0.0003718659281730652, -0.00034584105014801025, -0.0003198161721229553, -0.0002937912940979004, -0.00026776641607284546, -0.00024174153804779053, -0.0002157166600227356, -0.00018969178199768066, -0.00016366690397262573, -0.0001376420259475708, -0.00011161714792251587, -8.559226989746094e-05, -5.9567391872406006e-05, -3.3542513847351074e-05, -7.517635822296143e-06, 1.850724220275879e-05, 4.453212022781372e-05, 7.055699825286865e-05, 9.658187627792358e-05, 0.00012260675430297852, 0.00014863163232803345, 0.00017465651035308838, 0.0002006813883781433, 0.00022670626640319824, 0.0002527311444282532, 0.0002787560224533081, 0.00030478090047836304, 0.00033080577850341797, 0.0003568306565284729, 0.00038285553455352783, 0.00040888041257858276, 0.0004349052906036377, 0.0004609301686286926, 0.00048695504665374756, 0.0005129799246788025, 0.0005390048027038574, 0.0005650296807289124, 0.0005910545587539673, 0.0006170794367790222, 0.0006431043148040771, 0.0006691291928291321, 0.000695154070854187, 0.0007211789488792419, 0.0007472038269042969]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 8.0, 15.0, 13.0, 32.0, 39.0, 46.0, 77.0, 100.0, 134.0, 182.0, 258.0, 391.0, 536.0, 747.0, 1174.0, 1964.0, 3357.0, 6497.0, 13682.0, 29485.0, 61482.0, 116600.0, 184190.0, 216533.0, 180988.0, 113641.0, 59414.0, 28526.0, 13192.0, 6234.0, 3330.0, 1883.0, 1221.0, 735.0, 537.0, 397.0, 251.0, 168.0, 121.0, 109.0, 83.0, 61.0, 32.0, 27.0, 20.0, 7.0, 12.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.561279296875, -9.24755859375, -8.933837890625, -8.6201171875, -8.306396484375, -7.99267578125, -7.678955078125, -7.365234375, -7.051513671875, -6.73779296875, -6.424072265625, -6.1103515625, -5.796630859375, -5.48291015625, -5.169189453125, -4.85546875, -4.541748046875, -4.22802734375, -3.914306640625, -3.6005859375, -3.286865234375, -2.97314453125, -2.659423828125, -2.345703125, -2.031982421875, -1.71826171875, -1.404541015625, -1.0908203125, -0.777099609375, -0.46337890625, -0.149658203125, 0.1640625, 0.477783203125, 0.79150390625, 1.105224609375, 1.4189453125, 1.732666015625, 2.04638671875, 2.360107421875, 2.673828125, 2.987548828125, 3.30126953125, 3.614990234375, 3.9287109375, 4.242431640625, 4.55615234375, 4.869873046875, 5.18359375, 5.497314453125, 5.81103515625, 6.124755859375, 6.4384765625, 6.752197265625, 7.06591796875, 7.379638671875, 7.693359375, 8.007080078125, 8.32080078125, 8.634521484375, 8.9482421875, 9.261962890625, 9.57568359375, 9.889404296875, 10.203125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 9.0, 7.0, 13.0, 10.0, 10.0, 17.0, 27.0, 44.0, 40.0, 58.0, 63.0, 71.0, 57.0, 72.0, 69.0, 70.0, 67.0, 61.0, 42.0, 41.0, 36.0, 24.0, 26.0, 12.0, 10.0, 8.0, 8.0, 2.0, 8.0, 2.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.0831298828125, -2.982666015625, -2.8822021484375, -2.78173828125, -2.6812744140625, -2.580810546875, -2.4803466796875, -2.3798828125, -2.2794189453125, -2.178955078125, -2.0784912109375, -1.97802734375, -1.8775634765625, -1.777099609375, -1.6766357421875, -1.576171875, -1.4757080078125, -1.375244140625, -1.2747802734375, -1.17431640625, -1.0738525390625, -0.973388671875, -0.8729248046875, -0.7724609375, -0.6719970703125, -0.571533203125, -0.4710693359375, -0.37060546875, -0.2701416015625, -0.169677734375, -0.0692138671875, 0.03125, 0.1317138671875, 0.232177734375, 0.3326416015625, 0.43310546875, 0.5335693359375, 0.634033203125, 0.7344970703125, 0.8349609375, 0.9354248046875, 1.035888671875, 1.1363525390625, 1.23681640625, 1.3372802734375, 1.437744140625, 1.5382080078125, 1.638671875, 1.7391357421875, 1.839599609375, 1.9400634765625, 2.04052734375, 2.1409912109375, 2.241455078125, 2.3419189453125, 2.4423828125, 2.5428466796875, 2.643310546875, 2.7437744140625, 2.84423828125, 2.9447021484375, 3.045166015625, 3.1456298828125, 3.24609375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 2.0, 8.0, 10.0, 9.0, 12.0, 16.0, 14.0, 26.0, 33.0, 21.0, 28.0, 48.0, 42.0, 58.0, 44.0, 35.0, 56.0, 64.0, 57.0, 59.0, 56.0, 40.0, 38.0, 32.0, 27.0, 38.0, 26.0, 17.0, 21.0, 10.0, 13.0, 7.0, 6.0, 6.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.244752883911133, -17.66324806213379, -17.081741333007812, -16.50023651123047, -15.918730735778809, -15.337224960327148, -14.755720138549805, -14.174214363098145, -13.592708587646484, -13.011202812194824, -12.42969799041748, -11.84819221496582, -11.26668643951416, -10.6851806640625, -10.103675842285156, -9.522170066833496, -8.940665245056152, -8.359159469604492, -7.77765417098999, -7.196148872375488, -6.614643096923828, -6.033137798309326, -5.451632499694824, -4.870126724243164, -4.288621425628662, -3.707115888595581, -3.1256103515625, -2.544105052947998, -1.962599515914917, -1.381093978881836, -0.799588680267334, -0.21808290481567383, 0.3634223937988281, 0.9449278712272644, 1.5264333486557007, 2.107938766479492, 2.6894443035125732, 3.2709498405456543, 3.8524551391601562, 4.433960914611816, 5.015466213226318, 5.59697151184082, 6.1784772872924805, 6.759982585906982, 7.341487884521484, 7.9229936599731445, 8.504499435424805, 9.086004257202148, 9.667510032653809, 10.249015808105469, 10.830520629882812, 11.412026405334473, 11.993532180786133, 12.575037002563477, 13.156542778015137, 13.738048553466797, 14.31955337524414, 14.9010591506958, 15.482563972473145, 16.064069747924805, 16.64557456970215, 17.227081298828125, 17.80858612060547, 18.390090942382812, 18.97159767150879]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 6.0, 9.0, 9.0, 6.0, 8.0, 18.0, 14.0, 18.0, 24.0, 26.0, 31.0, 25.0, 31.0, 27.0, 45.0, 32.0, 49.0, 39.0, 29.0, 36.0, 42.0, 43.0, 30.0, 46.0, 37.0, 36.0, 42.0, 31.0, 31.0, 35.0, 17.0, 20.0, 12.0, 16.0, 16.0, 9.0, 10.0, 10.0, 7.0, 5.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.138433456420898, -12.680917739868164, -12.22340202331543, -11.765886306762695, -11.308371543884277, -10.850855827331543, -10.393340110778809, -9.935824394226074, -9.478309631347656, -9.020793914794922, -8.563278198242188, -8.105762481689453, -7.648247718811035, -7.190732002258301, -6.733216285705566, -6.275700569152832, -5.818184852600098, -5.360669136047363, -4.903153896331787, -4.445638179779053, -3.9881227016448975, -3.530607223510742, -3.073091506958008, -2.6155760288238525, -2.1580605506896973, -1.700545072555542, -1.2430294752120972, -0.7855138778686523, -0.32799839973449707, 0.1295170783996582, 0.5870327949523926, 1.0445482730865479, 1.5020637512207031, 1.9595792293548584, 2.4170947074890137, 2.874610424041748, 3.3321259021759033, 3.7896413803100586, 4.247157096862793, 4.704672813415527, 5.1621880531311035, 5.619703769683838, 6.077219009399414, 6.534734725952148, 6.992250442504883, 7.449765682220459, 7.907281398773193, 8.36479663848877, 8.822312355041504, 9.279828071594238, 9.737343788146973, 10.19485855102539, 10.652374267578125, 11.10988998413086, 11.567405700683594, 12.024921417236328, 12.482437133789062, 12.939952850341797, 13.397468566894531, 13.854984283447266, 14.312499046325684, 14.770014762878418, 15.227530479431152, 15.685046195983887, 16.142560958862305]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 7.0, 16.0, 42.0, 48.0, 65.0, 84.0, 125.0, 210.0, 357.0, 556.0, 820.0, 1328.0, 1984.0, 3214.0, 4926.0, 7815.0, 12436.0, 19354.0, 30612.0, 49219.0, 77883.0, 122332.0, 189632.0, 287167.0, 410395.0, 528018.0, 584879.0, 543116.0, 434057.0, 310689.0, 208451.0, 134616.0, 85880.0, 53642.0, 33764.0, 21111.0, 13227.0, 8231.0, 5101.0, 3298.0, 2009.0, 1301.0, 810.0, 528.0, 330.0, 228.0, 148.0, 85.0, 54.0, 24.0, 20.0, 21.0, 10.0, 9.0, 2.0, 1.0, 4.0, 3.0], "bins": [-14.2265625, -13.7900390625, -13.353515625, -12.9169921875, -12.48046875, -12.0439453125, -11.607421875, -11.1708984375, -10.734375, -10.2978515625, -9.861328125, -9.4248046875, -8.98828125, -8.5517578125, -8.115234375, -7.6787109375, -7.2421875, -6.8056640625, -6.369140625, -5.9326171875, -5.49609375, -5.0595703125, -4.623046875, -4.1865234375, -3.75, -3.3134765625, -2.876953125, -2.4404296875, -2.00390625, -1.5673828125, -1.130859375, -0.6943359375, -0.2578125, 0.1787109375, 0.615234375, 1.0517578125, 1.48828125, 1.9248046875, 2.361328125, 2.7978515625, 3.234375, 3.6708984375, 4.107421875, 4.5439453125, 4.98046875, 5.4169921875, 5.853515625, 6.2900390625, 6.7265625, 7.1630859375, 7.599609375, 8.0361328125, 8.47265625, 8.9091796875, 9.345703125, 9.7822265625, 10.21875, 10.6552734375, 11.091796875, 11.5283203125, 11.96484375, 12.4013671875, 12.837890625, 13.2744140625, 13.7109375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 6.0, 5.0, 10.0, 7.0, 7.0, 8.0, 14.0, 14.0, 21.0, 22.0, 18.0, 18.0, 28.0, 26.0, 29.0, 23.0, 31.0, 56.0, 24.0, 43.0, 42.0, 38.0, 41.0, 33.0, 45.0, 38.0, 36.0, 39.0, 34.0, 24.0, 33.0, 20.0, 25.0, 18.0, 24.0, 14.0, 14.0, 16.0, 7.0, 11.0, 7.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.0, -10.6644287109375, -10.328857421875, -9.9932861328125, -9.65771484375, -9.3221435546875, -8.986572265625, -8.6510009765625, -8.3154296875, -7.9798583984375, -7.644287109375, -7.3087158203125, -6.97314453125, -6.6375732421875, -6.302001953125, -5.9664306640625, -5.630859375, -5.2952880859375, -4.959716796875, -4.6241455078125, -4.28857421875, -3.9530029296875, -3.617431640625, -3.2818603515625, -2.9462890625, -2.6107177734375, -2.275146484375, -1.9395751953125, -1.60400390625, -1.2684326171875, -0.932861328125, -0.5972900390625, -0.26171875, 0.0738525390625, 0.409423828125, 0.7449951171875, 1.08056640625, 1.4161376953125, 1.751708984375, 2.0872802734375, 2.4228515625, 2.7584228515625, 3.093994140625, 3.4295654296875, 3.76513671875, 4.1007080078125, 4.436279296875, 4.7718505859375, 5.107421875, 5.4429931640625, 5.778564453125, 6.1141357421875, 6.44970703125, 6.7852783203125, 7.120849609375, 7.4564208984375, 7.7919921875, 8.1275634765625, 8.463134765625, 8.7987060546875, 9.13427734375, 9.4698486328125, 9.805419921875, 10.1409912109375, 10.4765625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 16.0, 25.0, 40.0, 58.0, 128.0, 189.0, 349.0, 589.0, 964.0, 1659.0, 2805.0, 4791.0, 8255.0, 14045.0, 23367.0, 38938.0, 64335.0, 103107.0, 162183.0, 242559.0, 341786.0, 445607.0, 520355.0, 536264.0, 484148.0, 389136.0, 286153.0, 194898.0, 126454.0, 80054.0, 48986.0, 29531.0, 17549.0, 10510.0, 6110.0, 3473.0, 2022.0, 1169.0, 724.0, 380.0, 241.0, 127.0, 73.0, 40.0, 31.0, 34.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.3359375, -12.9088134765625, -12.481689453125, -12.0545654296875, -11.62744140625, -11.2003173828125, -10.773193359375, -10.3460693359375, -9.9189453125, -9.4918212890625, -9.064697265625, -8.6375732421875, -8.21044921875, -7.7833251953125, -7.356201171875, -6.9290771484375, -6.501953125, -6.0748291015625, -5.647705078125, -5.2205810546875, -4.79345703125, -4.3663330078125, -3.939208984375, -3.5120849609375, -3.0849609375, -2.6578369140625, -2.230712890625, -1.8035888671875, -1.37646484375, -0.9493408203125, -0.522216796875, -0.0950927734375, 0.33203125, 0.7591552734375, 1.186279296875, 1.6134033203125, 2.04052734375, 2.4676513671875, 2.894775390625, 3.3218994140625, 3.7490234375, 4.1761474609375, 4.603271484375, 5.0303955078125, 5.45751953125, 5.8846435546875, 6.311767578125, 6.7388916015625, 7.166015625, 7.5931396484375, 8.020263671875, 8.4473876953125, 8.87451171875, 9.3016357421875, 9.728759765625, 10.1558837890625, 10.5830078125, 11.0101318359375, 11.437255859375, 11.8643798828125, 12.29150390625, 12.7186279296875, 13.145751953125, 13.5728759765625, 14.0]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 12.0, 9.0, 14.0, 19.0, 20.0, 26.0, 35.0, 35.0, 39.0, 55.0, 63.0, 73.0, 108.0, 115.0, 105.0, 126.0, 163.0, 186.0, 168.0, 207.0, 191.0, 207.0, 206.0, 198.0, 213.0, 191.0, 173.0, 172.0, 148.0, 119.0, 117.0, 89.0, 83.0, 73.0, 51.0, 66.0, 39.0, 30.0, 32.0, 12.0, 19.0, 18.0, 14.0, 11.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0], "bins": [-6.17578125, -5.999267578125, -5.82275390625, -5.646240234375, -5.4697265625, -5.293212890625, -5.11669921875, -4.940185546875, -4.763671875, -4.587158203125, -4.41064453125, -4.234130859375, -4.0576171875, -3.881103515625, -3.70458984375, -3.528076171875, -3.3515625, -3.175048828125, -2.99853515625, -2.822021484375, -2.6455078125, -2.468994140625, -2.29248046875, -2.115966796875, -1.939453125, -1.762939453125, -1.58642578125, -1.409912109375, -1.2333984375, -1.056884765625, -0.88037109375, -0.703857421875, -0.52734375, -0.350830078125, -0.17431640625, 0.002197265625, 0.1787109375, 0.355224609375, 0.53173828125, 0.708251953125, 0.884765625, 1.061279296875, 1.23779296875, 1.414306640625, 1.5908203125, 1.767333984375, 1.94384765625, 2.120361328125, 2.296875, 2.473388671875, 2.64990234375, 2.826416015625, 3.0029296875, 3.179443359375, 3.35595703125, 3.532470703125, 3.708984375, 3.885498046875, 4.06201171875, 4.238525390625, 4.4150390625, 4.591552734375, 4.76806640625, 4.944580078125, 5.12109375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 3.0, 8.0, 7.0, 5.0, 16.0, 14.0, 14.0, 22.0, 22.0, 32.0, 34.0, 41.0, 44.0, 44.0, 63.0, 56.0, 47.0, 60.0, 46.0, 43.0, 45.0, 55.0, 45.0, 37.0, 30.0, 26.0, 29.0, 26.0, 20.0, 20.0, 11.0, 8.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-20.975299835205078, -20.428804397583008, -19.882308959960938, -19.335811614990234, -18.789316177368164, -18.242820739746094, -17.69632339477539, -17.14982795715332, -16.60333251953125, -16.05683708190918, -15.510340690612793, -14.963844299316406, -14.417348861694336, -13.870853424072266, -13.324357032775879, -12.777860641479492, -12.231365203857422, -11.684869766235352, -11.138373374938965, -10.591876983642578, -10.045381546020508, -9.498886108398438, -8.95238971710205, -8.405893325805664, -7.859397888183594, -7.312901973724365, -6.766406059265137, -6.219910144805908, -5.67341423034668, -5.126918315887451, -4.580422401428223, -4.033926486968994, -3.4874324798583984, -2.94093656539917, -2.3944406509399414, -1.847944736480713, -1.3014488220214844, -0.7549529075622559, -0.20845699310302734, 0.33803892135620117, 0.8845348358154297, 1.4310307502746582, 1.9775266647338867, 2.5240225791931152, 3.0705184936523438, 3.6170144081115723, 4.163510322570801, 4.710006237030029, 5.256502151489258, 5.802998065948486, 6.349493980407715, 6.895989894866943, 7.442485809326172, 7.9889817237854, 8.535477638244629, 9.081974029541016, 9.628469467163086, 10.174964904785156, 10.721461296081543, 11.26795768737793, 11.814453125, 12.36094856262207, 12.907444953918457, 13.453941345214844, 14.000436782836914]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 8.0, 2.0, 2.0, 8.0, 10.0, 9.0, 8.0, 19.0, 15.0, 14.0, 23.0, 21.0, 28.0, 27.0, 35.0, 36.0, 25.0, 37.0, 38.0, 35.0, 46.0, 33.0, 47.0, 40.0, 34.0, 31.0, 45.0, 39.0, 35.0, 29.0, 27.0, 25.0, 25.0, 22.0, 20.0, 20.0, 17.0, 12.0, 14.0, 14.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.884172439575195, -13.466789245605469, -13.049405097961426, -12.6320219039917, -12.214637756347656, -11.79725456237793, -11.379871368408203, -10.96248722076416, -10.545103073120117, -10.12771987915039, -9.710335731506348, -9.292952537536621, -8.875568389892578, -8.458185195922852, -8.040802001953125, -7.623417854309082, -7.2060346603393555, -6.788650989532471, -6.371267318725586, -5.953884124755859, -5.536499977111816, -5.11911678314209, -4.701733112335205, -4.28434944152832, -3.8669657707214355, -3.449582099914551, -3.032198429107666, -2.6148149967193604, -2.1974313259124756, -1.7800476551055908, -1.3626642227172852, -0.9452805519104004, -0.5278959274291992, -0.11051231622695923, 0.30687129497528076, 0.724254846572876, 1.1416385173797607, 1.5590221881866455, 1.9764056205749512, 2.393789291381836, 2.8111729621887207, 3.2285566329956055, 3.6459403038024902, 4.063323974609375, 4.480707168579102, 4.8980913162231445, 5.315474510192871, 5.732858180999756, 6.150241851806641, 6.567625522613525, 6.98500919342041, 7.402392387390137, 7.81977653503418, 8.237159729003906, 8.654542922973633, 9.071927070617676, 9.489311218261719, 9.906694412231445, 10.324078559875488, 10.741461753845215, 11.158845901489258, 11.576229095458984, 11.993612289428711, 12.410996437072754, 12.82837963104248]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 16.0, 16.0, 21.0, 43.0, 47.0, 105.0, 169.0, 215.0, 315.0, 530.0, 788.0, 1181.0, 1954.0, 2954.0, 4736.0, 7380.0, 11715.0, 18508.0, 28700.0, 43320.0, 63115.0, 88371.0, 113595.0, 132281.0, 133636.0, 114799.0, 90018.0, 64541.0, 44099.0, 29312.0, 18745.0, 12268.0, 7590.0, 4853.0, 3040.0, 2007.0, 1246.0, 812.0, 516.0, 327.0, 244.0, 142.0, 84.0, 76.0, 45.0, 22.0, 20.0, 15.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-25.90625, -25.097412109375, -24.28857421875, -23.479736328125, -22.6708984375, -21.862060546875, -21.05322265625, -20.244384765625, -19.435546875, -18.626708984375, -17.81787109375, -17.009033203125, -16.2001953125, -15.391357421875, -14.58251953125, -13.773681640625, -12.96484375, -12.156005859375, -11.34716796875, -10.538330078125, -9.7294921875, -8.920654296875, -8.11181640625, -7.302978515625, -6.494140625, -5.685302734375, -4.87646484375, -4.067626953125, -3.2587890625, -2.449951171875, -1.64111328125, -0.832275390625, -0.0234375, 0.785400390625, 1.59423828125, 2.403076171875, 3.2119140625, 4.020751953125, 4.82958984375, 5.638427734375, 6.447265625, 7.256103515625, 8.06494140625, 8.873779296875, 9.6826171875, 10.491455078125, 11.30029296875, 12.109130859375, 12.91796875, 13.726806640625, 14.53564453125, 15.344482421875, 16.1533203125, 16.962158203125, 17.77099609375, 18.579833984375, 19.388671875, 20.197509765625, 21.00634765625, 21.815185546875, 22.6240234375, 23.432861328125, 24.24169921875, 25.050537109375, 25.859375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 10.0, 6.0, 7.0, 9.0, 12.0, 10.0, 14.0, 21.0, 21.0, 26.0, 30.0, 32.0, 33.0, 34.0, 29.0, 46.0, 42.0, 39.0, 42.0, 41.0, 39.0, 34.0, 43.0, 41.0, 46.0, 43.0, 33.0, 26.0, 34.0, 26.0, 22.0, 20.0, 13.0, 14.0, 15.0, 15.0, 8.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.765625, -13.3812255859375, -12.996826171875, -12.6124267578125, -12.22802734375, -11.8436279296875, -11.459228515625, -11.0748291015625, -10.6904296875, -10.3060302734375, -9.921630859375, -9.5372314453125, -9.15283203125, -8.7684326171875, -8.384033203125, -7.9996337890625, -7.615234375, -7.2308349609375, -6.846435546875, -6.4620361328125, -6.07763671875, -5.6932373046875, -5.308837890625, -4.9244384765625, -4.5400390625, -4.1556396484375, -3.771240234375, -3.3868408203125, -3.00244140625, -2.6180419921875, -2.233642578125, -1.8492431640625, -1.46484375, -1.0804443359375, -0.696044921875, -0.3116455078125, 0.07275390625, 0.4571533203125, 0.841552734375, 1.2259521484375, 1.6103515625, 1.9947509765625, 2.379150390625, 2.7635498046875, 3.14794921875, 3.5323486328125, 3.916748046875, 4.3011474609375, 4.685546875, 5.0699462890625, 5.454345703125, 5.8387451171875, 6.22314453125, 6.6075439453125, 6.991943359375, 7.3763427734375, 7.7607421875, 8.1451416015625, 8.529541015625, 8.9139404296875, 9.29833984375, 9.6827392578125, 10.067138671875, 10.4515380859375, 10.8359375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 19.0, 17.0, 21.0, 40.0, 41.0, 78.0, 107.0, 163.0, 236.0, 368.0, 594.0, 793.0, 1343.0, 1988.0, 3042.0, 4708.0, 7688.0, 12111.0, 19245.0, 31756.0, 53017.0, 88258.0, 141540.0, 190333.0, 177708.0, 121777.0, 74616.0, 44897.0, 27058.0, 16522.0, 10287.0, 6493.0, 4011.0, 2566.0, 1764.0, 1110.0, 722.0, 486.0, 329.0, 227.0, 165.0, 113.0, 68.0, 37.0, 29.0, 21.0, 9.0, 10.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0], "bins": [-27.796875, -26.9501953125, -26.103515625, -25.2568359375, -24.41015625, -23.5634765625, -22.716796875, -21.8701171875, -21.0234375, -20.1767578125, -19.330078125, -18.4833984375, -17.63671875, -16.7900390625, -15.943359375, -15.0966796875, -14.25, -13.4033203125, -12.556640625, -11.7099609375, -10.86328125, -10.0166015625, -9.169921875, -8.3232421875, -7.4765625, -6.6298828125, -5.783203125, -4.9365234375, -4.08984375, -3.2431640625, -2.396484375, -1.5498046875, -0.703125, 0.1435546875, 0.990234375, 1.8369140625, 2.68359375, 3.5302734375, 4.376953125, 5.2236328125, 6.0703125, 6.9169921875, 7.763671875, 8.6103515625, 9.45703125, 10.3037109375, 11.150390625, 11.9970703125, 12.84375, 13.6904296875, 14.537109375, 15.3837890625, 16.23046875, 17.0771484375, 17.923828125, 18.7705078125, 19.6171875, 20.4638671875, 21.310546875, 22.1572265625, 23.00390625, 23.8505859375, 24.697265625, 25.5439453125, 26.390625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 5.0, 15.0, 16.0, 16.0, 17.0, 27.0, 27.0, 27.0, 26.0, 27.0, 36.0, 38.0, 46.0, 31.0, 41.0, 42.0, 41.0, 37.0, 40.0, 38.0, 53.0, 34.0, 38.0, 38.0, 30.0, 25.0, 28.0, 17.0, 16.0, 16.0, 20.0, 14.0, 11.0, 8.0, 5.0, 5.0, 7.0, 0.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-8.6953125, -8.4195556640625, -8.143798828125, -7.8680419921875, -7.59228515625, -7.3165283203125, -7.040771484375, -6.7650146484375, -6.4892578125, -6.2135009765625, -5.937744140625, -5.6619873046875, -5.38623046875, -5.1104736328125, -4.834716796875, -4.5589599609375, -4.283203125, -4.0074462890625, -3.731689453125, -3.4559326171875, -3.18017578125, -2.9044189453125, -2.628662109375, -2.3529052734375, -2.0771484375, -1.8013916015625, -1.525634765625, -1.2498779296875, -0.97412109375, -0.6983642578125, -0.422607421875, -0.1468505859375, 0.12890625, 0.4046630859375, 0.680419921875, 0.9561767578125, 1.23193359375, 1.5076904296875, 1.783447265625, 2.0592041015625, 2.3349609375, 2.6107177734375, 2.886474609375, 3.1622314453125, 3.43798828125, 3.7137451171875, 3.989501953125, 4.2652587890625, 4.541015625, 4.8167724609375, 5.092529296875, 5.3682861328125, 5.64404296875, 5.9197998046875, 6.195556640625, 6.4713134765625, 6.7470703125, 7.0228271484375, 7.298583984375, 7.5743408203125, 7.85009765625, 8.1258544921875, 8.401611328125, 8.6773681640625, 8.953125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 1.0, 4.0, 8.0, 10.0, 14.0, 14.0, 23.0, 38.0, 78.0, 87.0, 171.0, 227.0, 348.0, 527.0, 857.0, 1293.0, 2060.0, 3468.0, 5846.0, 10794.0, 21462.0, 52023.0, 198685.0, 550550.0, 122181.0, 38349.0, 17388.0, 9040.0, 5067.0, 2978.0, 1786.0, 1116.0, 721.0, 467.0, 269.0, 205.0, 120.0, 90.0, 59.0, 40.0, 30.0, 22.0, 9.0, 12.0, 6.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-84.875, -82.330078125, -79.78515625, -77.240234375, -74.6953125, -72.150390625, -69.60546875, -67.060546875, -64.515625, -61.970703125, -59.42578125, -56.880859375, -54.3359375, -51.791015625, -49.24609375, -46.701171875, -44.15625, -41.611328125, -39.06640625, -36.521484375, -33.9765625, -31.431640625, -28.88671875, -26.341796875, -23.796875, -21.251953125, -18.70703125, -16.162109375, -13.6171875, -11.072265625, -8.52734375, -5.982421875, -3.4375, -0.892578125, 1.65234375, 4.197265625, 6.7421875, 9.287109375, 11.83203125, 14.376953125, 16.921875, 19.466796875, 22.01171875, 24.556640625, 27.1015625, 29.646484375, 32.19140625, 34.736328125, 37.28125, 39.826171875, 42.37109375, 44.916015625, 47.4609375, 50.005859375, 52.55078125, 55.095703125, 57.640625, 60.185546875, 62.73046875, 65.275390625, 67.8203125, 70.365234375, 72.91015625, 75.455078125, 78.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 7.0, 8.0, 11.0, 11.0, 22.0, 19.0, 22.0, 51.0, 99.0, 190.0, 223.0, 119.0, 59.0, 43.0, 25.0, 17.0, 15.0, 13.0, 15.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00933837890625, -0.009047269821166992, -0.008756160736083984, -0.008465051651000977, -0.008173942565917969, -0.007882833480834961, -0.007591724395751953, -0.007300615310668945, -0.0070095062255859375, -0.00671839714050293, -0.006427288055419922, -0.006136178970336914, -0.005845069885253906, -0.0055539608001708984, -0.005262851715087891, -0.004971742630004883, -0.004680633544921875, -0.004389524459838867, -0.004098415374755859, -0.0038073062896728516, -0.0035161972045898438, -0.003225088119506836, -0.002933979034423828, -0.0026428699493408203, -0.0023517608642578125, -0.0020606517791748047, -0.0017695426940917969, -0.001478433609008789, -0.0011873245239257812, -0.0008962154388427734, -0.0006051063537597656, -0.0003139972686767578, -2.288818359375e-05, 0.0002682209014892578, 0.0005593299865722656, 0.0008504390716552734, 0.0011415481567382812, 0.001432657241821289, 0.0017237663269042969, 0.0020148754119873047, 0.0023059844970703125, 0.0025970935821533203, 0.002888202667236328, 0.003179311752319336, 0.0034704208374023438, 0.0037615299224853516, 0.004052639007568359, 0.004343748092651367, 0.004634857177734375, 0.004925966262817383, 0.005217075347900391, 0.0055081844329833984, 0.005799293518066406, 0.006090402603149414, 0.006381511688232422, 0.00667262077331543, 0.0069637298583984375, 0.007254838943481445, 0.007545948028564453, 0.007837057113647461, 0.008128166198730469, 0.008419275283813477, 0.008710384368896484, 0.009001493453979492, 0.0092926025390625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 4.0, 14.0, 20.0, 24.0, 26.0, 49.0, 57.0, 111.0, 132.0, 259.0, 318.0, 557.0, 922.0, 1543.0, 2787.0, 5071.0, 9519.0, 20219.0, 50645.0, 195090.0, 494728.0, 178548.0, 47696.0, 19424.0, 9312.0, 4832.0, 2698.0, 1509.0, 921.0, 530.0, 337.0, 199.0, 140.0, 100.0, 65.0, 51.0, 29.0, 19.0, 14.0, 15.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.0, -49.1435546875, -47.287109375, -45.4306640625, -43.57421875, -41.7177734375, -39.861328125, -38.0048828125, -36.1484375, -34.2919921875, -32.435546875, -30.5791015625, -28.72265625, -26.8662109375, -25.009765625, -23.1533203125, -21.296875, -19.4404296875, -17.583984375, -15.7275390625, -13.87109375, -12.0146484375, -10.158203125, -8.3017578125, -6.4453125, -4.5888671875, -2.732421875, -0.8759765625, 0.98046875, 2.8369140625, 4.693359375, 6.5498046875, 8.40625, 10.2626953125, 12.119140625, 13.9755859375, 15.83203125, 17.6884765625, 19.544921875, 21.4013671875, 23.2578125, 25.1142578125, 26.970703125, 28.8271484375, 30.68359375, 32.5400390625, 34.396484375, 36.2529296875, 38.109375, 39.9658203125, 41.822265625, 43.6787109375, 45.53515625, 47.3916015625, 49.248046875, 51.1044921875, 52.9609375, 54.8173828125, 56.673828125, 58.5302734375, 60.38671875, 62.2431640625, 64.099609375, 65.9560546875, 67.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 10.0, 13.0, 19.0, 13.0, 17.0, 34.0, 67.0, 94.0, 142.0, 130.0, 140.0, 93.0, 52.0, 38.0, 29.0, 23.0, 14.0, 9.0, 5.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.375, -14.88818359375, -14.4013671875, -13.91455078125, -13.427734375, -12.94091796875, -12.4541015625, -11.96728515625, -11.48046875, -10.99365234375, -10.5068359375, -10.02001953125, -9.533203125, -9.04638671875, -8.5595703125, -8.07275390625, -7.5859375, -7.09912109375, -6.6123046875, -6.12548828125, -5.638671875, -5.15185546875, -4.6650390625, -4.17822265625, -3.69140625, -3.20458984375, -2.7177734375, -2.23095703125, -1.744140625, -1.25732421875, -0.7705078125, -0.28369140625, 0.203125, 0.68994140625, 1.1767578125, 1.66357421875, 2.150390625, 2.63720703125, 3.1240234375, 3.61083984375, 4.09765625, 4.58447265625, 5.0712890625, 5.55810546875, 6.044921875, 6.53173828125, 7.0185546875, 7.50537109375, 7.9921875, 8.47900390625, 8.9658203125, 9.45263671875, 9.939453125, 10.42626953125, 10.9130859375, 11.39990234375, 11.88671875, 12.37353515625, 12.8603515625, 13.34716796875, 13.833984375, 14.32080078125, 14.8076171875, 15.29443359375, 15.78125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 5.0, 3.0, 6.0, 16.0, 21.0, 16.0, 24.0, 20.0, 28.0, 48.0, 45.0, 44.0, 51.0, 56.0, 57.0, 48.0, 50.0, 59.0, 53.0, 54.0, 40.0, 44.0, 33.0, 33.0, 25.0, 28.0, 10.0, 12.0, 5.0, 10.0, 10.0, 8.0, 2.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.071081161499023, -17.462955474853516, -16.85483169555664, -16.246706008911133, -15.638582229614258, -15.03045654296875, -14.422331809997559, -13.814207077026367, -13.206082344055176, -12.597957611083984, -11.989832878112793, -11.381708145141602, -10.773582458496094, -10.165458679199219, -9.557332992553711, -8.94920825958252, -8.341083526611328, -7.732958793640137, -7.124834060668945, -6.516708850860596, -5.908584117889404, -5.300459384918213, -4.692334175109863, -4.084209442138672, -3.4760847091674805, -2.867959976196289, -2.2598350048065186, -1.6517101526260376, -1.0435853004455566, -0.43546056747436523, 0.17266440391540527, 0.7807893753051758, 1.3889141082763672, 1.9970389604568481, 2.605163812637329, 3.2132887840270996, 3.821413516998291, 4.429538249969482, 5.037663459777832, 5.645788192749023, 6.253912925720215, 6.862037658691406, 7.470162391662598, 8.078287124633789, 8.686412811279297, 9.294536590576172, 9.90266227722168, 10.510787010192871, 11.118911743164062, 11.727036476135254, 12.335161209106445, 12.943285942077637, 13.551410675048828, 14.159536361694336, 14.767661094665527, 15.375785827636719, 15.98391056060791, 16.5920352935791, 17.20016098022461, 17.808284759521484, 18.416410446166992, 19.024534225463867, 19.632659912109375, 20.24078369140625, 20.848909378051758]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 3.0, 5.0, 7.0, 7.0, 4.0, 6.0, 12.0, 11.0, 16.0, 22.0, 22.0, 22.0, 20.0, 31.0, 22.0, 31.0, 33.0, 46.0, 41.0, 41.0, 34.0, 39.0, 28.0, 35.0, 39.0, 36.0, 35.0, 36.0, 33.0, 30.0, 29.0, 25.0, 27.0, 18.0, 24.0, 18.0, 17.0, 16.0, 13.0, 10.0, 9.0, 8.0, 12.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.740565299987793, -12.29871654510498, -11.856867790222168, -11.415019035339355, -10.97317123413086, -10.531322479248047, -10.089473724365234, -9.647624969482422, -9.20577621459961, -8.763927459716797, -8.322078704833984, -7.88023042678833, -7.438381671905518, -6.996532917022705, -6.554684638977051, -6.112835884094238, -5.670987129211426, -5.229138374328613, -4.787289619445801, -4.3454413414001465, -3.903592586517334, -3.4617438316345215, -3.019895315170288, -2.5780467987060547, -2.136198043823242, -1.6943494081497192, -1.2525007724761963, -0.8106521368026733, -0.3688035011291504, 0.07304525375366211, 0.5148937702178955, 0.9567422866821289, 1.3985919952392578, 1.8404406309127808, 2.2822892665863037, 2.724137783050537, 3.1659865379333496, 3.607835292816162, 4.049683570861816, 4.491532325744629, 4.933381080627441, 5.375229835510254, 5.817078590393066, 6.258926868438721, 6.700775623321533, 7.142624378204346, 7.58447265625, 8.026321411132812, 8.468170166015625, 8.910018920898438, 9.35186767578125, 9.793716430664062, 10.235565185546875, 10.677413940429688, 11.119261741638184, 11.561110496520996, 12.002959251403809, 12.444808006286621, 12.886656761169434, 13.328505516052246, 13.770353317260742, 14.212202072143555, 14.654050827026367, 15.09589958190918, 15.537748336791992]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 10.0, 14.0, 16.0, 28.0, 30.0, 35.0, 81.0, 98.0, 150.0, 204.0, 275.0, 469.0, 641.0, 1044.0, 1581.0, 2638.0, 3935.0, 6727.0, 10983.0, 18707.0, 32006.0, 53409.0, 85479.0, 126046.0, 158708.0, 163373.0, 135618.0, 95433.0, 60449.0, 36274.0, 21360.0, 12529.0, 7551.0, 4625.0, 2813.0, 1824.0, 1114.0, 781.0, 430.0, 323.0, 205.0, 153.0, 126.0, 86.0, 49.0, 34.0, 26.0, 30.0, 18.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-22.796875, -22.108642578125, -21.42041015625, -20.732177734375, -20.0439453125, -19.355712890625, -18.66748046875, -17.979248046875, -17.291015625, -16.602783203125, -15.91455078125, -15.226318359375, -14.5380859375, -13.849853515625, -13.16162109375, -12.473388671875, -11.78515625, -11.096923828125, -10.40869140625, -9.720458984375, -9.0322265625, -8.343994140625, -7.65576171875, -6.967529296875, -6.279296875, -5.591064453125, -4.90283203125, -4.214599609375, -3.5263671875, -2.838134765625, -2.14990234375, -1.461669921875, -0.7734375, -0.085205078125, 0.60302734375, 1.291259765625, 1.9794921875, 2.667724609375, 3.35595703125, 4.044189453125, 4.732421875, 5.420654296875, 6.10888671875, 6.797119140625, 7.4853515625, 8.173583984375, 8.86181640625, 9.550048828125, 10.23828125, 10.926513671875, 11.61474609375, 12.302978515625, 12.9912109375, 13.679443359375, 14.36767578125, 15.055908203125, 15.744140625, 16.432373046875, 17.12060546875, 17.808837890625, 18.4970703125, 19.185302734375, 19.87353515625, 20.561767578125, 21.25]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 6.0, 1.0, 5.0, 7.0, 1.0, 5.0, 9.0, 7.0, 14.0, 11.0, 8.0, 15.0, 19.0, 20.0, 15.0, 30.0, 28.0, 28.0, 44.0, 30.0, 41.0, 44.0, 36.0, 37.0, 39.0, 44.0, 34.0, 39.0, 28.0, 35.0, 39.0, 45.0, 24.0, 26.0, 21.0, 25.0, 24.0, 24.0, 21.0, 14.0, 8.0, 7.0, 11.0, 9.0, 5.0, 5.0, 10.0, 1.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.578125, -12.147216796875, -11.71630859375, -11.285400390625, -10.8544921875, -10.423583984375, -9.99267578125, -9.561767578125, -9.130859375, -8.699951171875, -8.26904296875, -7.838134765625, -7.4072265625, -6.976318359375, -6.54541015625, -6.114501953125, -5.68359375, -5.252685546875, -4.82177734375, -4.390869140625, -3.9599609375, -3.529052734375, -3.09814453125, -2.667236328125, -2.236328125, -1.805419921875, -1.37451171875, -0.943603515625, -0.5126953125, -0.081787109375, 0.34912109375, 0.780029296875, 1.2109375, 1.641845703125, 2.07275390625, 2.503662109375, 2.9345703125, 3.365478515625, 3.79638671875, 4.227294921875, 4.658203125, 5.089111328125, 5.52001953125, 5.950927734375, 6.3818359375, 6.812744140625, 7.24365234375, 7.674560546875, 8.10546875, 8.536376953125, 8.96728515625, 9.398193359375, 9.8291015625, 10.260009765625, 10.69091796875, 11.121826171875, 11.552734375, 11.983642578125, 12.41455078125, 12.845458984375, 13.2763671875, 13.707275390625, 14.13818359375, 14.569091796875, 15.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 5.0, 24.0, 17.0, 25.0, 41.0, 84.0, 108.0, 163.0, 262.0, 373.0, 632.0, 1113.0, 1758.0, 3127.0, 5446.0, 9664.0, 17666.0, 32348.0, 58525.0, 100302.0, 153719.0, 189500.0, 175633.0, 125578.0, 76356.0, 42674.0, 23467.0, 12863.0, 7112.0, 4068.0, 2364.0, 1329.0, 830.0, 505.0, 296.0, 190.0, 111.0, 87.0, 58.0, 34.0, 17.0, 21.0, 18.0, 15.0, 7.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-26.0625, -25.266357421875, -24.47021484375, -23.674072265625, -22.8779296875, -22.081787109375, -21.28564453125, -20.489501953125, -19.693359375, -18.897216796875, -18.10107421875, -17.304931640625, -16.5087890625, -15.712646484375, -14.91650390625, -14.120361328125, -13.32421875, -12.528076171875, -11.73193359375, -10.935791015625, -10.1396484375, -9.343505859375, -8.54736328125, -7.751220703125, -6.955078125, -6.158935546875, -5.36279296875, -4.566650390625, -3.7705078125, -2.974365234375, -2.17822265625, -1.382080078125, -0.5859375, 0.210205078125, 1.00634765625, 1.802490234375, 2.5986328125, 3.394775390625, 4.19091796875, 4.987060546875, 5.783203125, 6.579345703125, 7.37548828125, 8.171630859375, 8.9677734375, 9.763916015625, 10.56005859375, 11.356201171875, 12.15234375, 12.948486328125, 13.74462890625, 14.540771484375, 15.3369140625, 16.133056640625, 16.92919921875, 17.725341796875, 18.521484375, 19.317626953125, 20.11376953125, 20.909912109375, 21.7060546875, 22.502197265625, 23.29833984375, 24.094482421875, 24.890625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 5.0, 4.0, 12.0, 17.0, 19.0, 21.0, 25.0, 31.0, 27.0, 20.0, 47.0, 46.0, 47.0, 45.0, 42.0, 38.0, 51.0, 58.0, 46.0, 46.0, 52.0, 44.0, 44.0, 39.0, 35.0, 33.0, 20.0, 21.0, 15.0, 11.0, 7.0, 9.0, 4.0, 2.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.7734375, -14.3316650390625, -13.889892578125, -13.4481201171875, -13.00634765625, -12.5645751953125, -12.122802734375, -11.6810302734375, -11.2392578125, -10.7974853515625, -10.355712890625, -9.9139404296875, -9.47216796875, -9.0303955078125, -8.588623046875, -8.1468505859375, -7.705078125, -7.2633056640625, -6.821533203125, -6.3797607421875, -5.93798828125, -5.4962158203125, -5.054443359375, -4.6126708984375, -4.1708984375, -3.7291259765625, -3.287353515625, -2.8455810546875, -2.40380859375, -1.9620361328125, -1.520263671875, -1.0784912109375, -0.63671875, -0.1949462890625, 0.246826171875, 0.6885986328125, 1.13037109375, 1.5721435546875, 2.013916015625, 2.4556884765625, 2.8974609375, 3.3392333984375, 3.781005859375, 4.2227783203125, 4.66455078125, 5.1063232421875, 5.548095703125, 5.9898681640625, 6.431640625, 6.8734130859375, 7.315185546875, 7.7569580078125, 8.19873046875, 8.6405029296875, 9.082275390625, 9.5240478515625, 9.9658203125, 10.4075927734375, 10.849365234375, 11.2911376953125, 11.73291015625, 12.1746826171875, 12.616455078125, 13.0582275390625, 13.5]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 10.0, 7.0, 6.0, 16.0, 15.0, 27.0, 36.0, 42.0, 49.0, 62.0, 125.0, 141.0, 223.0, 323.0, 438.0, 690.0, 1002.0, 1482.0, 2179.0, 3523.0, 5494.0, 9122.0, 15720.0, 28199.0, 55333.0, 118164.0, 245989.0, 273412.0, 142247.0, 65800.0, 33005.0, 17816.0, 10309.0, 6176.0, 3909.0, 2408.0, 1596.0, 1061.0, 718.0, 508.0, 349.0, 229.0, 166.0, 126.0, 94.0, 48.0, 42.0, 29.0, 24.0, 27.0, 19.0, 3.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0], "bins": [-31.109375, -30.109619140625, -29.10986328125, -28.110107421875, -27.1103515625, -26.110595703125, -25.11083984375, -24.111083984375, -23.111328125, -22.111572265625, -21.11181640625, -20.112060546875, -19.1123046875, -18.112548828125, -17.11279296875, -16.113037109375, -15.11328125, -14.113525390625, -13.11376953125, -12.114013671875, -11.1142578125, -10.114501953125, -9.11474609375, -8.114990234375, -7.115234375, -6.115478515625, -5.11572265625, -4.115966796875, -3.1162109375, -2.116455078125, -1.11669921875, -0.116943359375, 0.8828125, 1.882568359375, 2.88232421875, 3.882080078125, 4.8818359375, 5.881591796875, 6.88134765625, 7.881103515625, 8.880859375, 9.880615234375, 10.88037109375, 11.880126953125, 12.8798828125, 13.879638671875, 14.87939453125, 15.879150390625, 16.87890625, 17.878662109375, 18.87841796875, 19.878173828125, 20.8779296875, 21.877685546875, 22.87744140625, 23.877197265625, 24.876953125, 25.876708984375, 26.87646484375, 27.876220703125, 28.8759765625, 29.875732421875, 30.87548828125, 31.875244140625, 32.875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 1.0, 1.0, 6.0, 14.0, 5.0, 9.0, 10.0, 20.0, 19.0, 18.0, 27.0, 40.0, 45.0, 41.0, 50.0, 85.0, 82.0, 97.0, 74.0, 78.0, 53.0, 43.0, 35.0, 27.0, 24.0, 23.0, 14.0, 14.0, 6.0, 12.0, 4.0, 6.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002758026123046875, -0.0026730895042419434, -0.0025881528854370117, -0.00250321626663208, -0.0024182796478271484, -0.002333343029022217, -0.002248406410217285, -0.0021634697914123535, -0.002078533172607422, -0.0019935965538024902, -0.0019086599349975586, -0.001823723316192627, -0.0017387866973876953, -0.0016538500785827637, -0.001568913459777832, -0.0014839768409729004, -0.0013990402221679688, -0.0013141036033630371, -0.0012291669845581055, -0.0011442303657531738, -0.0010592937469482422, -0.0009743571281433105, -0.0008894205093383789, -0.0008044838905334473, -0.0007195472717285156, -0.000634610652923584, -0.0005496740341186523, -0.0004647374153137207, -0.00037980079650878906, -0.0002948641777038574, -0.00020992755889892578, -0.00012499094009399414, -4.00543212890625e-05, 4.488229751586914e-05, 0.00012981891632080078, 0.00021475553512573242, 0.00029969215393066406, 0.0003846287727355957, 0.00046956539154052734, 0.000554502010345459, 0.0006394386291503906, 0.0007243752479553223, 0.0008093118667602539, 0.0008942484855651855, 0.0009791851043701172, 0.0010641217231750488, 0.0011490583419799805, 0.0012339949607849121, 0.0013189315795898438, 0.0014038681983947754, 0.001488804817199707, 0.0015737414360046387, 0.0016586780548095703, 0.001743614673614502, 0.0018285512924194336, 0.0019134879112243652, 0.001998424530029297, 0.0020833611488342285, 0.00216829776763916, 0.002253234386444092, 0.0023381710052490234, 0.002423107624053955, 0.0025080442428588867, 0.0025929808616638184, 0.00267791748046875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 10.0, 15.0, 27.0, 50.0, 61.0, 109.0, 158.0, 246.0, 397.0, 626.0, 1042.0, 1751.0, 2882.0, 4967.0, 8946.0, 17014.0, 35991.0, 87977.0, 231949.0, 343645.0, 181064.0, 68045.0, 29476.0, 13996.0, 7467.0, 4194.0, 2505.0, 1473.0, 956.0, 549.0, 341.0, 217.0, 134.0, 99.0, 59.0, 39.0, 23.0, 16.0, 11.0, 8.0, 5.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.09375, -30.9208984375, -29.748046875, -28.5751953125, -27.40234375, -26.2294921875, -25.056640625, -23.8837890625, -22.7109375, -21.5380859375, -20.365234375, -19.1923828125, -18.01953125, -16.8466796875, -15.673828125, -14.5009765625, -13.328125, -12.1552734375, -10.982421875, -9.8095703125, -8.63671875, -7.4638671875, -6.291015625, -5.1181640625, -3.9453125, -2.7724609375, -1.599609375, -0.4267578125, 0.74609375, 1.9189453125, 3.091796875, 4.2646484375, 5.4375, 6.6103515625, 7.783203125, 8.9560546875, 10.12890625, 11.3017578125, 12.474609375, 13.6474609375, 14.8203125, 15.9931640625, 17.166015625, 18.3388671875, 19.51171875, 20.6845703125, 21.857421875, 23.0302734375, 24.203125, 25.3759765625, 26.548828125, 27.7216796875, 28.89453125, 30.0673828125, 31.240234375, 32.4130859375, 33.5859375, 34.7587890625, 35.931640625, 37.1044921875, 38.27734375, 39.4501953125, 40.623046875, 41.7958984375, 42.96875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 9.0, 6.0, 10.0, 6.0, 13.0, 23.0, 22.0, 15.0, 31.0, 40.0, 40.0, 48.0, 52.0, 69.0, 71.0, 76.0, 73.0, 65.0, 46.0, 45.0, 36.0, 28.0, 25.0, 20.0, 23.0, 15.0, 14.0, 10.0, 9.0, 5.0, 5.0, 10.0, 8.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.53125, -8.2652587890625, -7.999267578125, -7.7332763671875, -7.46728515625, -7.2012939453125, -6.935302734375, -6.6693115234375, -6.4033203125, -6.1373291015625, -5.871337890625, -5.6053466796875, -5.33935546875, -5.0733642578125, -4.807373046875, -4.5413818359375, -4.275390625, -4.0093994140625, -3.743408203125, -3.4774169921875, -3.21142578125, -2.9454345703125, -2.679443359375, -2.4134521484375, -2.1474609375, -1.8814697265625, -1.615478515625, -1.3494873046875, -1.08349609375, -0.8175048828125, -0.551513671875, -0.2855224609375, -0.01953125, 0.2464599609375, 0.512451171875, 0.7784423828125, 1.04443359375, 1.3104248046875, 1.576416015625, 1.8424072265625, 2.1083984375, 2.3743896484375, 2.640380859375, 2.9063720703125, 3.17236328125, 3.4383544921875, 3.704345703125, 3.9703369140625, 4.236328125, 4.5023193359375, 4.768310546875, 5.0343017578125, 5.30029296875, 5.5662841796875, 5.832275390625, 6.0982666015625, 6.3642578125, 6.6302490234375, 6.896240234375, 7.1622314453125, 7.42822265625, 7.6942138671875, 7.960205078125, 8.2261962890625, 8.4921875]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 4.0, 10.0, 13.0, 18.0, 20.0, 16.0, 23.0, 19.0, 28.0, 33.0, 32.0, 42.0, 55.0, 62.0, 57.0, 55.0, 45.0, 51.0, 47.0, 46.0, 39.0, 38.0, 36.0, 31.0, 19.0, 25.0, 19.0, 17.0, 19.0, 18.0, 11.0, 5.0, 13.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.966279983520508, -17.36782455444336, -16.769371032714844, -16.170915603637695, -15.57246208190918, -14.974006652832031, -14.3755521774292, -13.777097702026367, -13.178643226623535, -12.580188751220703, -11.981734275817871, -11.383279800415039, -10.78482437133789, -10.186370849609375, -9.587915420532227, -8.989460945129395, -8.391006469726562, -7.7925519943237305, -7.194097518920898, -6.595642566680908, -5.997188091278076, -5.398733615875244, -4.800278663635254, -4.201824188232422, -3.60336971282959, -3.004915237426758, -2.4064605236053467, -1.808005928993225, -1.2095513343811035, -0.6110968589782715, -0.012642145156860352, 0.5858125686645508, 1.1842689514160156, 1.7827235460281372, 2.381178140640259, 2.97963285446167, 3.578087329864502, 4.176541805267334, 4.774996757507324, 5.373451232910156, 5.971905708312988, 6.57036018371582, 7.168814659118652, 7.767269611358643, 8.365724563598633, 8.964178085327148, 9.562633514404297, 10.161087989807129, 10.759542465209961, 11.357996940612793, 11.956451416015625, 12.554905891418457, 13.153360366821289, 13.751815795898438, 14.35027027130127, 14.948724746704102, 15.547179222106934, 16.145633697509766, 16.744089126586914, 17.34254264831543, 17.940998077392578, 18.539451599121094, 19.137907028198242, 19.73636245727539, 20.334815979003906]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 4.0, 6.0, 6.0, 7.0, 8.0, 13.0, 17.0, 14.0, 15.0, 17.0, 23.0, 24.0, 28.0, 33.0, 34.0, 28.0, 34.0, 31.0, 37.0, 49.0, 45.0, 35.0, 37.0, 30.0, 42.0, 40.0, 33.0, 30.0, 31.0, 34.0, 28.0, 27.0, 15.0, 11.0, 26.0, 18.0, 13.0, 17.0, 14.0, 11.0, 7.0, 7.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.088459014892578, -14.612427711486816, -14.136395454406738, -13.660364151000977, -13.184332847595215, -12.708300590515137, -12.232269287109375, -11.756237030029297, -11.280205726623535, -10.804174423217773, -10.328142166137695, -9.852110862731934, -9.376079559326172, -8.900047302246094, -8.424015998840332, -7.947984218597412, -7.47195291519165, -6.9959211349487305, -6.519889831542969, -6.043858051300049, -5.567826271057129, -5.091794967651367, -4.615763187408447, -4.139731407165527, -3.6636998653411865, -3.1876683235168457, -2.711636543273926, -2.235605001449585, -1.7595733404159546, -1.2835416793823242, -0.8075101375579834, -0.3314783573150635, 0.14455318450927734, 0.6205848455429077, 1.096616506576538, 1.572648048400879, 2.048679828643799, 2.5247113704681396, 3.0007429122924805, 3.4767746925354004, 3.952806234359741, 4.428837776184082, 4.904869556427002, 5.380901336669922, 5.856932640075684, 6.3329644203186035, 6.808996200561523, 7.285027503967285, 7.761059284210205, 8.237091064453125, 8.713122367858887, 9.189153671264648, 9.665185928344727, 10.141217231750488, 10.61724853515625, 11.093280792236328, 11.56931209564209, 12.045343399047852, 12.52137565612793, 12.997406959533691, 13.473438262939453, 13.949470520019531, 14.425501823425293, 14.901533126831055, 15.377565383911133]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 6.0, 6.0, 9.0, 8.0, 18.0, 20.0, 26.0, 46.0, 80.0, 104.0, 124.0, 214.0, 264.0, 509.0, 713.0, 1090.0, 1672.0, 2571.0, 4288.0, 6871.0, 11464.0, 19817.0, 34503.0, 61147.0, 110427.0, 196683.0, 338291.0, 527357.0, 688560.0, 709050.0, 571691.0, 380666.0, 227079.0, 128356.0, 72225.0, 40411.0, 23101.0, 13807.0, 8040.0, 4773.0, 2969.0, 1856.0, 1196.0, 763.0, 459.0, 330.0, 208.0, 132.0, 86.0, 61.0, 43.0, 41.0, 20.0, 14.0, 7.0, 7.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-14.6328125, -14.1627197265625, -13.692626953125, -13.2225341796875, -12.75244140625, -12.2823486328125, -11.812255859375, -11.3421630859375, -10.8720703125, -10.4019775390625, -9.931884765625, -9.4617919921875, -8.99169921875, -8.5216064453125, -8.051513671875, -7.5814208984375, -7.111328125, -6.6412353515625, -6.171142578125, -5.7010498046875, -5.23095703125, -4.7608642578125, -4.290771484375, -3.8206787109375, -3.3505859375, -2.8804931640625, -2.410400390625, -1.9403076171875, -1.47021484375, -1.0001220703125, -0.530029296875, -0.0599365234375, 0.41015625, 0.8802490234375, 1.350341796875, 1.8204345703125, 2.29052734375, 2.7606201171875, 3.230712890625, 3.7008056640625, 4.1708984375, 4.6409912109375, 5.111083984375, 5.5811767578125, 6.05126953125, 6.5213623046875, 6.991455078125, 7.4615478515625, 7.931640625, 8.4017333984375, 8.871826171875, 9.3419189453125, 9.81201171875, 10.2821044921875, 10.752197265625, 11.2222900390625, 11.6923828125, 12.1624755859375, 12.632568359375, 13.1026611328125, 13.57275390625, 14.0428466796875, 14.512939453125, 14.9830322265625, 15.453125]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 1.0, 6.0, 6.0, 6.0, 7.0, 9.0, 7.0, 13.0, 14.0, 22.0, 18.0, 19.0, 29.0, 20.0, 28.0, 30.0, 33.0, 30.0, 28.0, 40.0, 36.0, 39.0, 41.0, 36.0, 34.0, 38.0, 42.0, 35.0, 36.0, 36.0, 24.0, 27.0, 17.0, 22.0, 26.0, 21.0, 17.0, 22.0, 17.0, 13.0, 13.0, 8.0, 8.0, 9.0, 4.0, 2.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1015625, -9.759033203125, -9.41650390625, -9.073974609375, -8.7314453125, -8.388916015625, -8.04638671875, -7.703857421875, -7.361328125, -7.018798828125, -6.67626953125, -6.333740234375, -5.9912109375, -5.648681640625, -5.30615234375, -4.963623046875, -4.62109375, -4.278564453125, -3.93603515625, -3.593505859375, -3.2509765625, -2.908447265625, -2.56591796875, -2.223388671875, -1.880859375, -1.538330078125, -1.19580078125, -0.853271484375, -0.5107421875, -0.168212890625, 0.17431640625, 0.516845703125, 0.859375, 1.201904296875, 1.54443359375, 1.886962890625, 2.2294921875, 2.572021484375, 2.91455078125, 3.257080078125, 3.599609375, 3.942138671875, 4.28466796875, 4.627197265625, 4.9697265625, 5.312255859375, 5.65478515625, 5.997314453125, 6.33984375, 6.682373046875, 7.02490234375, 7.367431640625, 7.7099609375, 8.052490234375, 8.39501953125, 8.737548828125, 9.080078125, 9.422607421875, 9.76513671875, 10.107666015625, 10.4501953125, 10.792724609375, 11.13525390625, 11.477783203125, 11.8203125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 13.0, 5.0, 20.0, 39.0, 46.0, 66.0, 127.0, 211.0, 314.0, 528.0, 825.0, 1355.0, 2288.0, 3861.0, 6880.0, 12535.0, 23707.0, 46777.0, 95898.0, 194476.0, 377247.0, 641719.0, 850800.0, 796578.0, 540581.0, 296890.0, 149245.0, 72529.0, 36493.0, 18363.0, 10132.0, 5520.0, 3293.0, 1879.0, 1134.0, 680.0, 454.0, 279.0, 166.0, 129.0, 72.0, 40.0, 29.0, 27.0, 12.0, 7.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.484375, -19.860107421875, -19.23583984375, -18.611572265625, -17.9873046875, -17.363037109375, -16.73876953125, -16.114501953125, -15.490234375, -14.865966796875, -14.24169921875, -13.617431640625, -12.9931640625, -12.368896484375, -11.74462890625, -11.120361328125, -10.49609375, -9.871826171875, -9.24755859375, -8.623291015625, -7.9990234375, -7.374755859375, -6.75048828125, -6.126220703125, -5.501953125, -4.877685546875, -4.25341796875, -3.629150390625, -3.0048828125, -2.380615234375, -1.75634765625, -1.132080078125, -0.5078125, 0.116455078125, 0.74072265625, 1.364990234375, 1.9892578125, 2.613525390625, 3.23779296875, 3.862060546875, 4.486328125, 5.110595703125, 5.73486328125, 6.359130859375, 6.9833984375, 7.607666015625, 8.23193359375, 8.856201171875, 9.48046875, 10.104736328125, 10.72900390625, 11.353271484375, 11.9775390625, 12.601806640625, 13.22607421875, 13.850341796875, 14.474609375, 15.098876953125, 15.72314453125, 16.347412109375, 16.9716796875, 17.595947265625, 18.22021484375, 18.844482421875, 19.46875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 2.0, 11.0, 17.0, 12.0, 19.0, 19.0, 32.0, 39.0, 48.0, 51.0, 60.0, 85.0, 111.0, 124.0, 129.0, 178.0, 199.0, 203.0, 224.0, 268.0, 246.0, 267.0, 224.0, 225.0, 206.0, 199.0, 192.0, 153.0, 116.0, 90.0, 75.0, 68.0, 40.0, 33.0, 25.0, 24.0, 15.0, 13.0, 6.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-7.12109375, -6.922119140625, -6.72314453125, -6.524169921875, -6.3251953125, -6.126220703125, -5.92724609375, -5.728271484375, -5.529296875, -5.330322265625, -5.13134765625, -4.932373046875, -4.7333984375, -4.534423828125, -4.33544921875, -4.136474609375, -3.9375, -3.738525390625, -3.53955078125, -3.340576171875, -3.1416015625, -2.942626953125, -2.74365234375, -2.544677734375, -2.345703125, -2.146728515625, -1.94775390625, -1.748779296875, -1.5498046875, -1.350830078125, -1.15185546875, -0.952880859375, -0.75390625, -0.554931640625, -0.35595703125, -0.156982421875, 0.0419921875, 0.240966796875, 0.43994140625, 0.638916015625, 0.837890625, 1.036865234375, 1.23583984375, 1.434814453125, 1.6337890625, 1.832763671875, 2.03173828125, 2.230712890625, 2.4296875, 2.628662109375, 2.82763671875, 3.026611328125, 3.2255859375, 3.424560546875, 3.62353515625, 3.822509765625, 4.021484375, 4.220458984375, 4.41943359375, 4.618408203125, 4.8173828125, 5.016357421875, 5.21533203125, 5.414306640625, 5.61328125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 6.0, 16.0, 18.0, 16.0, 25.0, 32.0, 29.0, 41.0, 61.0, 56.0, 64.0, 60.0, 70.0, 68.0, 66.0, 59.0, 45.0, 49.0, 38.0, 29.0, 32.0, 27.0, 25.0, 15.0, 14.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.96455192565918, -24.27136993408203, -23.578187942504883, -22.885005950927734, -22.191823959350586, -21.498641967773438, -20.80545997619629, -20.11227798461914, -19.419095993041992, -18.725914001464844, -18.032732009887695, -17.339550018310547, -16.6463680267334, -15.95318603515625, -15.260004043579102, -14.566822052001953, -13.873640060424805, -13.180458068847656, -12.487276077270508, -11.79409408569336, -11.100912094116211, -10.407730102539062, -9.714548110961914, -9.021366119384766, -8.328184127807617, -7.635002136230469, -6.94182014465332, -6.248638153076172, -5.555456161499023, -4.862274169921875, -4.169092178344727, -3.475910186767578, -2.782726287841797, -2.0895442962646484, -1.3963623046875, -0.7031803131103516, -0.009998321533203125, 0.6831836700439453, 1.3763656616210938, 2.069547653198242, 2.7627296447753906, 3.455911636352539, 4.1490936279296875, 4.842275619506836, 5.535457611083984, 6.228639602661133, 6.921821594238281, 7.61500358581543, 8.308185577392578, 9.001367568969727, 9.694549560546875, 10.387731552124023, 11.080913543701172, 11.77409553527832, 12.467277526855469, 13.160459518432617, 13.853641510009766, 14.546823501586914, 15.240005493164062, 15.933187484741211, 16.62636947631836, 17.319551467895508, 18.012733459472656, 18.705915451049805, 19.399097442626953]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 5.0, 8.0, 8.0, 8.0, 14.0, 19.0, 5.0, 28.0, 29.0, 33.0, 39.0, 35.0, 41.0, 24.0, 47.0, 39.0, 41.0, 47.0, 43.0, 60.0, 40.0, 56.0, 44.0, 32.0, 32.0, 39.0, 41.0, 25.0, 22.0, 14.0, 17.0, 12.0, 9.0, 14.0, 6.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.160979270935059, -13.660107612609863, -13.159235000610352, -12.658363342285156, -12.157491683959961, -11.656620025634766, -11.155747413635254, -10.654875755310059, -10.154003143310547, -9.653131484985352, -9.15225887298584, -8.651387214660645, -8.15051555633545, -7.649643421173096, -7.148771286010742, -6.647899627685547, -6.147027969360352, -5.646155834197998, -5.145284175872803, -4.644412040710449, -4.143540382385254, -3.6426682472229004, -3.141796112060547, -2.6409242153167725, -2.140052318572998, -1.6391804218292236, -1.1383084058761597, -0.6374363899230957, -0.1365644931793213, 0.3643074035644531, 0.8651795387268066, 1.366051435470581, 1.8669242858886719, 2.3677961826324463, 2.8686680793762207, 3.369540214538574, 3.8704121112823486, 4.371284008026123, 4.872156143188477, 5.373027801513672, 5.873899936676025, 6.374772071838379, 6.875643730163574, 7.376515865325928, 7.877388000488281, 8.378259658813477, 8.879131317138672, 9.380003929138184, 9.880875587463379, 10.381747245788574, 10.882619857788086, 11.383491516113281, 11.884363174438477, 12.385234832763672, 12.886107444763184, 13.386979103088379, 13.88785171508789, 14.388723373413086, 14.889595985412598, 15.390467643737793, 15.891339302062988, 16.3922119140625, 16.893083572387695, 17.39395523071289, 17.894826889038086]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 14.0, 19.0, 27.0, 42.0, 72.0, 90.0, 166.0, 243.0, 402.0, 601.0, 900.0, 1527.0, 2328.0, 3871.0, 6139.0, 9870.0, 15886.0, 25953.0, 41002.0, 66054.0, 102504.0, 148632.0, 175002.0, 153601.0, 108552.0, 69451.0, 43465.0, 27397.0, 16807.0, 10461.0, 6536.0, 4056.0, 2515.0, 1570.0, 1026.0, 631.0, 435.0, 262.0, 146.0, 106.0, 72.0, 40.0, 23.0, 21.0, 13.0, 8.0, 6.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.765625, -30.819091796875, -29.87255859375, -28.926025390625, -27.9794921875, -27.032958984375, -26.08642578125, -25.139892578125, -24.193359375, -23.246826171875, -22.30029296875, -21.353759765625, -20.4072265625, -19.460693359375, -18.51416015625, -17.567626953125, -16.62109375, -15.674560546875, -14.72802734375, -13.781494140625, -12.8349609375, -11.888427734375, -10.94189453125, -9.995361328125, -9.048828125, -8.102294921875, -7.15576171875, -6.209228515625, -5.2626953125, -4.316162109375, -3.36962890625, -2.423095703125, -1.4765625, -0.530029296875, 0.41650390625, 1.363037109375, 2.3095703125, 3.256103515625, 4.20263671875, 5.149169921875, 6.095703125, 7.042236328125, 7.98876953125, 8.935302734375, 9.8818359375, 10.828369140625, 11.77490234375, 12.721435546875, 13.66796875, 14.614501953125, 15.56103515625, 16.507568359375, 17.4541015625, 18.400634765625, 19.34716796875, 20.293701171875, 21.240234375, 22.186767578125, 23.13330078125, 24.079833984375, 25.0263671875, 25.972900390625, 26.91943359375, 27.865966796875, 28.8125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 10.0, 13.0, 10.0, 10.0, 20.0, 22.0, 27.0, 40.0, 32.0, 40.0, 27.0, 48.0, 39.0, 33.0, 42.0, 43.0, 56.0, 54.0, 48.0, 40.0, 37.0, 41.0, 27.0, 38.0, 43.0, 12.0, 35.0, 23.0, 15.0, 14.0, 15.0, 11.0, 8.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.671875, -13.187255859375, -12.70263671875, -12.218017578125, -11.7333984375, -11.248779296875, -10.76416015625, -10.279541015625, -9.794921875, -9.310302734375, -8.82568359375, -8.341064453125, -7.8564453125, -7.371826171875, -6.88720703125, -6.402587890625, -5.91796875, -5.433349609375, -4.94873046875, -4.464111328125, -3.9794921875, -3.494873046875, -3.01025390625, -2.525634765625, -2.041015625, -1.556396484375, -1.07177734375, -0.587158203125, -0.1025390625, 0.382080078125, 0.86669921875, 1.351318359375, 1.8359375, 2.320556640625, 2.80517578125, 3.289794921875, 3.7744140625, 4.259033203125, 4.74365234375, 5.228271484375, 5.712890625, 6.197509765625, 6.68212890625, 7.166748046875, 7.6513671875, 8.135986328125, 8.62060546875, 9.105224609375, 9.58984375, 10.074462890625, 10.55908203125, 11.043701171875, 11.5283203125, 12.012939453125, 12.49755859375, 12.982177734375, 13.466796875, 13.951416015625, 14.43603515625, 14.920654296875, 15.4052734375, 15.889892578125, 16.37451171875, 16.859130859375, 17.34375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 11.0, 24.0, 24.0, 31.0, 47.0, 74.0, 108.0, 138.0, 198.0, 350.0, 533.0, 868.0, 1379.0, 2280.0, 3713.0, 6196.0, 10932.0, 19717.0, 36710.0, 69588.0, 134712.0, 228754.0, 233764.0, 139593.0, 72929.0, 37902.0, 20398.0, 11222.0, 6295.0, 3860.0, 2275.0, 1419.0, 838.0, 566.0, 379.0, 220.0, 166.0, 97.0, 65.0, 59.0, 37.0, 26.0, 18.0, 15.0, 5.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.5, -34.3916015625, -33.283203125, -32.1748046875, -31.06640625, -29.9580078125, -28.849609375, -27.7412109375, -26.6328125, -25.5244140625, -24.416015625, -23.3076171875, -22.19921875, -21.0908203125, -19.982421875, -18.8740234375, -17.765625, -16.6572265625, -15.548828125, -14.4404296875, -13.33203125, -12.2236328125, -11.115234375, -10.0068359375, -8.8984375, -7.7900390625, -6.681640625, -5.5732421875, -4.46484375, -3.3564453125, -2.248046875, -1.1396484375, -0.03125, 1.0771484375, 2.185546875, 3.2939453125, 4.40234375, 5.5107421875, 6.619140625, 7.7275390625, 8.8359375, 9.9443359375, 11.052734375, 12.1611328125, 13.26953125, 14.3779296875, 15.486328125, 16.5947265625, 17.703125, 18.8115234375, 19.919921875, 21.0283203125, 22.13671875, 23.2451171875, 24.353515625, 25.4619140625, 26.5703125, 27.6787109375, 28.787109375, 29.8955078125, 31.00390625, 32.1123046875, 33.220703125, 34.3291015625, 35.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 7.0, 2.0, 17.0, 14.0, 21.0, 22.0, 19.0, 23.0, 36.0, 44.0, 42.0, 58.0, 50.0, 58.0, 48.0, 65.0, 56.0, 55.0, 40.0, 55.0, 54.0, 33.0, 35.0, 22.0, 25.0, 23.0, 17.0, 18.0, 10.0, 12.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.125, -14.7047119140625, -14.284423828125, -13.8641357421875, -13.44384765625, -13.0235595703125, -12.603271484375, -12.1829833984375, -11.7626953125, -11.3424072265625, -10.922119140625, -10.5018310546875, -10.08154296875, -9.6612548828125, -9.240966796875, -8.8206787109375, -8.400390625, -7.9801025390625, -7.559814453125, -7.1395263671875, -6.71923828125, -6.2989501953125, -5.878662109375, -5.4583740234375, -5.0380859375, -4.6177978515625, -4.197509765625, -3.7772216796875, -3.35693359375, -2.9366455078125, -2.516357421875, -2.0960693359375, -1.67578125, -1.2554931640625, -0.835205078125, -0.4149169921875, 0.00537109375, 0.4256591796875, 0.845947265625, 1.2662353515625, 1.6865234375, 2.1068115234375, 2.527099609375, 2.9473876953125, 3.36767578125, 3.7879638671875, 4.208251953125, 4.6285400390625, 5.048828125, 5.4691162109375, 5.889404296875, 6.3096923828125, 6.72998046875, 7.1502685546875, 7.570556640625, 7.9908447265625, 8.4111328125, 8.8314208984375, 9.251708984375, 9.6719970703125, 10.09228515625, 10.5125732421875, 10.932861328125, 11.3531494140625, 11.7734375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 8.0, 6.0, 12.0, 5.0, 10.0, 19.0, 21.0, 24.0, 50.0, 59.0, 102.0, 101.0, 134.0, 204.0, 311.0, 405.0, 598.0, 1012.0, 1524.0, 2591.0, 4483.0, 8421.0, 18173.0, 47025.0, 241386.0, 593509.0, 77280.0, 25807.0, 11050.0, 5598.0, 3159.0, 1875.0, 1139.0, 790.0, 515.0, 323.0, 231.0, 183.0, 119.0, 86.0, 69.0, 42.0, 33.0, 25.0, 15.0, 7.0, 7.0, 11.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.0625, -87.17578125, -84.2890625, -81.40234375, -78.515625, -75.62890625, -72.7421875, -69.85546875, -66.96875, -64.08203125, -61.1953125, -58.30859375, -55.421875, -52.53515625, -49.6484375, -46.76171875, -43.875, -40.98828125, -38.1015625, -35.21484375, -32.328125, -29.44140625, -26.5546875, -23.66796875, -20.78125, -17.89453125, -15.0078125, -12.12109375, -9.234375, -6.34765625, -3.4609375, -0.57421875, 2.3125, 5.19921875, 8.0859375, 10.97265625, 13.859375, 16.74609375, 19.6328125, 22.51953125, 25.40625, 28.29296875, 31.1796875, 34.06640625, 36.953125, 39.83984375, 42.7265625, 45.61328125, 48.5, 51.38671875, 54.2734375, 57.16015625, 60.046875, 62.93359375, 65.8203125, 68.70703125, 71.59375, 74.48046875, 77.3671875, 80.25390625, 83.140625, 86.02734375, 88.9140625, 91.80078125, 94.6875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 2.0, 3.0, 10.0, 7.0, 10.0, 12.0, 14.0, 27.0, 35.0, 90.0, 223.0, 258.0, 110.0, 56.0, 21.0, 18.0, 16.0, 13.0, 12.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0094451904296875, -0.009151577949523926, -0.008857965469360352, -0.008564352989196777, -0.008270740509033203, -0.007977128028869629, -0.007683515548706055, -0.0073899030685424805, -0.007096290588378906, -0.006802678108215332, -0.006509065628051758, -0.006215453147888184, -0.005921840667724609, -0.005628228187561035, -0.005334615707397461, -0.005041003227233887, -0.0047473907470703125, -0.004453778266906738, -0.004160165786743164, -0.00386655330657959, -0.0035729408264160156, -0.0032793283462524414, -0.002985715866088867, -0.002692103385925293, -0.0023984909057617188, -0.0021048784255981445, -0.0018112659454345703, -0.001517653465270996, -0.0012240409851074219, -0.0009304285049438477, -0.0006368160247802734, -0.0003432035446166992, -4.9591064453125e-05, 0.00024402141571044922, 0.0005376338958740234, 0.0008312463760375977, 0.0011248588562011719, 0.001418471336364746, 0.0017120838165283203, 0.0020056962966918945, 0.0022993087768554688, 0.002592921257019043, 0.002886533737182617, 0.0031801462173461914, 0.0034737586975097656, 0.00376737117767334, 0.004060983657836914, 0.004354596138000488, 0.0046482086181640625, 0.004941821098327637, 0.005235433578491211, 0.005529046058654785, 0.005822658538818359, 0.006116271018981934, 0.006409883499145508, 0.006703495979309082, 0.006997108459472656, 0.0072907209396362305, 0.007584333419799805, 0.007877945899963379, 0.008171558380126953, 0.008465170860290527, 0.008758783340454102, 0.009052395820617676, 0.00934600830078125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 7.0, 14.0, 18.0, 20.0, 22.0, 33.0, 49.0, 77.0, 92.0, 165.0, 237.0, 317.0, 437.0, 599.0, 752.0, 1124.0, 1621.0, 2490.0, 4091.0, 7233.0, 13885.0, 32709.0, 100487.0, 420494.0, 326591.0, 78063.0, 27377.0, 12063.0, 6297.0, 3716.0, 2297.0, 1508.0, 1072.0, 730.0, 537.0, 364.0, 248.0, 200.0, 156.0, 94.0, 83.0, 60.0, 43.0, 26.0, 18.0, 14.0, 10.0, 8.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-60.75, -59.00927734375, -57.2685546875, -55.52783203125, -53.787109375, -52.04638671875, -50.3056640625, -48.56494140625, -46.82421875, -45.08349609375, -43.3427734375, -41.60205078125, -39.861328125, -38.12060546875, -36.3798828125, -34.63916015625, -32.8984375, -31.15771484375, -29.4169921875, -27.67626953125, -25.935546875, -24.19482421875, -22.4541015625, -20.71337890625, -18.97265625, -17.23193359375, -15.4912109375, -13.75048828125, -12.009765625, -10.26904296875, -8.5283203125, -6.78759765625, -5.046875, -3.30615234375, -1.5654296875, 0.17529296875, 1.916015625, 3.65673828125, 5.3974609375, 7.13818359375, 8.87890625, 10.61962890625, 12.3603515625, 14.10107421875, 15.841796875, 17.58251953125, 19.3232421875, 21.06396484375, 22.8046875, 24.54541015625, 26.2861328125, 28.02685546875, 29.767578125, 31.50830078125, 33.2490234375, 34.98974609375, 36.73046875, 38.47119140625, 40.2119140625, 41.95263671875, 43.693359375, 45.43408203125, 47.1748046875, 48.91552734375, 50.65625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 9.0, 6.0, 17.0, 18.0, 19.0, 32.0, 53.0, 57.0, 94.0, 144.0, 146.0, 117.0, 75.0, 51.0, 38.0, 19.0, 18.0, 14.0, 15.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.203125, -19.660400390625, -19.11767578125, -18.574951171875, -18.0322265625, -17.489501953125, -16.94677734375, -16.404052734375, -15.861328125, -15.318603515625, -14.77587890625, -14.233154296875, -13.6904296875, -13.147705078125, -12.60498046875, -12.062255859375, -11.51953125, -10.976806640625, -10.43408203125, -9.891357421875, -9.3486328125, -8.805908203125, -8.26318359375, -7.720458984375, -7.177734375, -6.635009765625, -6.09228515625, -5.549560546875, -5.0068359375, -4.464111328125, -3.92138671875, -3.378662109375, -2.8359375, -2.293212890625, -1.75048828125, -1.207763671875, -0.6650390625, -0.122314453125, 0.42041015625, 0.963134765625, 1.505859375, 2.048583984375, 2.59130859375, 3.134033203125, 3.6767578125, 4.219482421875, 4.76220703125, 5.304931640625, 5.84765625, 6.390380859375, 6.93310546875, 7.475830078125, 8.0185546875, 8.561279296875, 9.10400390625, 9.646728515625, 10.189453125, 10.732177734375, 11.27490234375, 11.817626953125, 12.3603515625, 12.903076171875, 13.44580078125, 13.988525390625, 14.53125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 1.0, 3.0, 8.0, 9.0, 5.0, 12.0, 26.0, 16.0, 28.0, 39.0, 37.0, 39.0, 50.0, 47.0, 53.0, 71.0, 78.0, 70.0, 69.0, 66.0, 54.0, 35.0, 40.0, 35.0, 23.0, 23.0, 12.0, 15.0, 7.0, 8.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.788639068603516, -30.958770751953125, -30.128902435302734, -29.299034118652344, -28.46916389465332, -27.63929557800293, -26.80942726135254, -25.97955894470215, -25.149688720703125, -24.319820404052734, -23.489952087402344, -22.660083770751953, -21.83021354675293, -21.00034523010254, -20.17047691345215, -19.340608596801758, -18.510740280151367, -17.680871963500977, -16.851003646850586, -16.021133422851562, -15.191265106201172, -14.361396789550781, -13.53152847290039, -12.70166015625, -11.871790885925293, -11.041922569274902, -10.212053298950195, -9.382184982299805, -8.552316665649414, -7.722447395324707, -6.892579078674316, -6.062710285186768, -5.232839584350586, -4.402970790863037, -3.5731022357940674, -2.7432336807250977, -1.9133648872375488, -1.08349609375, -0.2536277770996094, 0.5762410163879395, 1.4061098098754883, 2.235978603363037, 3.065847158432007, 3.8957157135009766, 4.725584506988525, 5.555453300476074, 6.385321617126465, 7.215190410614014, 8.045059204101562, 8.874927520751953, 9.70479679107666, 10.53466510772705, 11.364534378051758, 12.194402694702148, 13.024271011352539, 13.85413932800293, 14.684008598327637, 15.513876914978027, 16.343746185302734, 17.173614501953125, 18.003482818603516, 18.833351135253906, 19.663219451904297, 20.49308967590332, 21.32295799255371]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 10.0, 8.0, 13.0, 14.0, 16.0, 19.0, 27.0, 24.0, 22.0, 26.0, 23.0, 27.0, 29.0, 31.0, 48.0, 25.0, 44.0, 44.0, 38.0, 49.0, 36.0, 34.0, 27.0, 40.0, 30.0, 36.0, 29.0, 28.0, 30.0, 23.0, 18.0, 14.0, 18.0, 10.0, 13.0, 10.0, 11.0, 9.0, 11.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-18.461637496948242, -17.9154052734375, -17.369173049926758, -16.82294273376465, -16.276710510253906, -15.730478286743164, -15.184246063232422, -14.63801383972168, -14.091782569885254, -13.545550346374512, -12.999319076538086, -12.453086853027344, -11.906854629516602, -11.360623359680176, -10.814391136169434, -10.268159866333008, -9.721927642822266, -9.175695419311523, -8.629464149475098, -8.083231925964355, -7.5370001792907715, -6.9907684326171875, -6.444536209106445, -5.898304462432861, -5.352072715759277, -4.805840969085693, -4.259609222412109, -3.713376998901367, -3.167145252227783, -2.620913505554199, -2.074681520462036, -1.528449535369873, -0.9822158813476562, -0.4359840154647827, 0.11024785041809082, 0.6564797163009644, 1.202711582183838, 1.7489433288574219, 2.295175313949585, 2.841407299041748, 3.387639045715332, 3.933870792388916, 4.4801025390625, 5.026334762573242, 5.572566509246826, 6.11879825592041, 6.665030479431152, 7.211262226104736, 7.75749397277832, 8.303726196289062, 8.849957466125488, 9.39618968963623, 9.942420959472656, 10.488653182983398, 11.03488540649414, 11.581117630004883, 12.127348899841309, 12.67358112335205, 13.219812393188477, 13.766044616699219, 14.312276840209961, 14.858508110046387, 15.404740333557129, 15.950971603393555, 16.497203826904297]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 8.0, 15.0, 12.0, 22.0, 28.0, 40.0, 69.0, 106.0, 108.0, 178.0, 281.0, 372.0, 556.0, 880.0, 1399.0, 2443.0, 4198.0, 7764.0, 15473.0, 33477.0, 79629.0, 186128.0, 302131.0, 227552.0, 102128.0, 42517.0, 19198.0, 9323.0, 4968.0, 2741.0, 1749.0, 1034.0, 639.0, 425.0, 291.0, 213.0, 127.0, 89.0, 61.0, 60.0, 28.0, 22.0, 22.0, 10.0, 13.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-44.46875, -43.1064453125, -41.744140625, -40.3818359375, -39.01953125, -37.6572265625, -36.294921875, -34.9326171875, -33.5703125, -32.2080078125, -30.845703125, -29.4833984375, -28.12109375, -26.7587890625, -25.396484375, -24.0341796875, -22.671875, -21.3095703125, -19.947265625, -18.5849609375, -17.22265625, -15.8603515625, -14.498046875, -13.1357421875, -11.7734375, -10.4111328125, -9.048828125, -7.6865234375, -6.32421875, -4.9619140625, -3.599609375, -2.2373046875, -0.875, 0.4873046875, 1.849609375, 3.2119140625, 4.57421875, 5.9365234375, 7.298828125, 8.6611328125, 10.0234375, 11.3857421875, 12.748046875, 14.1103515625, 15.47265625, 16.8349609375, 18.197265625, 19.5595703125, 20.921875, 22.2841796875, 23.646484375, 25.0087890625, 26.37109375, 27.7333984375, 29.095703125, 30.4580078125, 31.8203125, 33.1826171875, 34.544921875, 35.9072265625, 37.26953125, 38.6318359375, 39.994140625, 41.3564453125, 42.71875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 7.0, 5.0, 15.0, 9.0, 13.0, 19.0, 15.0, 22.0, 22.0, 30.0, 23.0, 28.0, 34.0, 44.0, 28.0, 38.0, 46.0, 41.0, 46.0, 40.0, 35.0, 47.0, 34.0, 41.0, 40.0, 34.0, 41.0, 30.0, 22.0, 21.0, 26.0, 19.0, 14.0, 11.0, 11.0, 8.0, 10.0, 6.0, 1.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.0, -18.427734375, -17.85546875, -17.283203125, -16.7109375, -16.138671875, -15.56640625, -14.994140625, -14.421875, -13.849609375, -13.27734375, -12.705078125, -12.1328125, -11.560546875, -10.98828125, -10.416015625, -9.84375, -9.271484375, -8.69921875, -8.126953125, -7.5546875, -6.982421875, -6.41015625, -5.837890625, -5.265625, -4.693359375, -4.12109375, -3.548828125, -2.9765625, -2.404296875, -1.83203125, -1.259765625, -0.6875, -0.115234375, 0.45703125, 1.029296875, 1.6015625, 2.173828125, 2.74609375, 3.318359375, 3.890625, 4.462890625, 5.03515625, 5.607421875, 6.1796875, 6.751953125, 7.32421875, 7.896484375, 8.46875, 9.041015625, 9.61328125, 10.185546875, 10.7578125, 11.330078125, 11.90234375, 12.474609375, 13.046875, 13.619140625, 14.19140625, 14.763671875, 15.3359375, 15.908203125, 16.48046875, 17.052734375, 17.625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 10.0, 7.0, 11.0, 24.0, 29.0, 50.0, 54.0, 84.0, 150.0, 194.0, 265.0, 435.0, 597.0, 935.0, 1351.0, 2063.0, 3224.0, 5145.0, 8020.0, 13416.0, 22655.0, 40656.0, 75546.0, 141471.0, 220604.0, 214317.0, 133096.0, 70405.0, 37837.0, 21515.0, 12681.0, 7770.0, 4908.0, 3092.0, 1954.0, 1318.0, 864.0, 584.0, 389.0, 254.0, 184.0, 120.0, 76.0, 70.0, 33.0, 31.0, 23.0, 8.0, 9.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-30.984375, -29.983154296875, -28.98193359375, -27.980712890625, -26.9794921875, -25.978271484375, -24.97705078125, -23.975830078125, -22.974609375, -21.973388671875, -20.97216796875, -19.970947265625, -18.9697265625, -17.968505859375, -16.96728515625, -15.966064453125, -14.96484375, -13.963623046875, -12.96240234375, -11.961181640625, -10.9599609375, -9.958740234375, -8.95751953125, -7.956298828125, -6.955078125, -5.953857421875, -4.95263671875, -3.951416015625, -2.9501953125, -1.948974609375, -0.94775390625, 0.053466796875, 1.0546875, 2.055908203125, 3.05712890625, 4.058349609375, 5.0595703125, 6.060791015625, 7.06201171875, 8.063232421875, 9.064453125, 10.065673828125, 11.06689453125, 12.068115234375, 13.0693359375, 14.070556640625, 15.07177734375, 16.072998046875, 17.07421875, 18.075439453125, 19.07666015625, 20.077880859375, 21.0791015625, 22.080322265625, 23.08154296875, 24.082763671875, 25.083984375, 26.085205078125, 27.08642578125, 28.087646484375, 29.0888671875, 30.090087890625, 31.09130859375, 32.092529296875, 33.09375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 0.0, 8.0, 1.0, 2.0, 6.0, 6.0, 9.0, 7.0, 10.0, 15.0, 19.0, 16.0, 13.0, 17.0, 19.0, 22.0, 16.0, 27.0, 27.0, 39.0, 27.0, 29.0, 32.0, 46.0, 33.0, 44.0, 32.0, 40.0, 33.0, 24.0, 29.0, 32.0, 37.0, 32.0, 37.0, 26.0, 34.0, 23.0, 17.0, 19.0, 9.0, 7.0, 15.0, 10.0, 13.0, 12.0, 8.0, 7.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.6640625, -12.2310791015625, -11.798095703125, -11.3651123046875, -10.93212890625, -10.4991455078125, -10.066162109375, -9.6331787109375, -9.2001953125, -8.7672119140625, -8.334228515625, -7.9012451171875, -7.46826171875, -7.0352783203125, -6.602294921875, -6.1693115234375, -5.736328125, -5.3033447265625, -4.870361328125, -4.4373779296875, -4.00439453125, -3.5714111328125, -3.138427734375, -2.7054443359375, -2.2724609375, -1.8394775390625, -1.406494140625, -0.9735107421875, -0.54052734375, -0.1075439453125, 0.325439453125, 0.7584228515625, 1.19140625, 1.6243896484375, 2.057373046875, 2.4903564453125, 2.92333984375, 3.3563232421875, 3.789306640625, 4.2222900390625, 4.6552734375, 5.0882568359375, 5.521240234375, 5.9542236328125, 6.38720703125, 6.8201904296875, 7.253173828125, 7.6861572265625, 8.119140625, 8.5521240234375, 8.985107421875, 9.4180908203125, 9.85107421875, 10.2840576171875, 10.717041015625, 11.1500244140625, 11.5830078125, 12.0159912109375, 12.448974609375, 12.8819580078125, 13.31494140625, 13.7479248046875, 14.180908203125, 14.6138916015625, 15.046875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 9.0, 12.0, 13.0, 11.0, 13.0, 22.0, 36.0, 45.0, 62.0, 74.0, 116.0, 148.0, 203.0, 275.0, 377.0, 482.0, 708.0, 1099.0, 1625.0, 2371.0, 3703.0, 6067.0, 10351.0, 18977.0, 37951.0, 91102.0, 262486.0, 359521.0, 138654.0, 53168.0, 24857.0, 12990.0, 7454.0, 4477.0, 2866.0, 1939.0, 1262.0, 850.0, 566.0, 473.0, 308.0, 198.0, 186.0, 115.0, 90.0, 79.0, 43.0, 30.0, 25.0, 25.0, 6.0, 15.0, 12.0, 6.0, 4.0, 0.0, 3.0, 3.0], "bins": [-61.21875, -59.375, -57.53125, -55.6875, -53.84375, -52.0, -50.15625, -48.3125, -46.46875, -44.625, -42.78125, -40.9375, -39.09375, -37.25, -35.40625, -33.5625, -31.71875, -29.875, -28.03125, -26.1875, -24.34375, -22.5, -20.65625, -18.8125, -16.96875, -15.125, -13.28125, -11.4375, -9.59375, -7.75, -5.90625, -4.0625, -2.21875, -0.375, 1.46875, 3.3125, 5.15625, 7.0, 8.84375, 10.6875, 12.53125, 14.375, 16.21875, 18.0625, 19.90625, 21.75, 23.59375, 25.4375, 27.28125, 29.125, 30.96875, 32.8125, 34.65625, 36.5, 38.34375, 40.1875, 42.03125, 43.875, 45.71875, 47.5625, 49.40625, 51.25, 53.09375, 54.9375, 56.78125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 5.0, 7.0, 6.0, 14.0, 12.0, 25.0, 44.0, 57.0, 67.0, 107.0, 145.0, 128.0, 104.0, 81.0, 59.0, 36.0, 23.0, 14.0, 17.0, 11.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005161285400390625, -0.004983842372894287, -0.004806399345397949, -0.004628956317901611, -0.0044515132904052734, -0.0042740702629089355, -0.004096627235412598, -0.00391918420791626, -0.003741741180419922, -0.003564298152923584, -0.003386855125427246, -0.003209412097930908, -0.0030319690704345703, -0.0028545260429382324, -0.0026770830154418945, -0.0024996399879455566, -0.0023221969604492188, -0.002144753932952881, -0.001967310905456543, -0.001789867877960205, -0.0016124248504638672, -0.0014349818229675293, -0.0012575387954711914, -0.0010800957679748535, -0.0009026527404785156, -0.0007252097129821777, -0.0005477666854858398, -0.00037032365798950195, -0.00019288063049316406, -1.5437602996826172e-05, 0.00016200542449951172, 0.0003394484519958496, 0.0005168914794921875, 0.0006943345069885254, 0.0008717775344848633, 0.0010492205619812012, 0.001226663589477539, 0.001404106616973877, 0.0015815496444702148, 0.0017589926719665527, 0.0019364356994628906, 0.0021138787269592285, 0.0022913217544555664, 0.0024687647819519043, 0.002646207809448242, 0.00282365083694458, 0.003001093864440918, 0.003178536891937256, 0.0033559799194335938, 0.0035334229469299316, 0.0037108659744262695, 0.0038883090019226074, 0.004065752029418945, 0.004243195056915283, 0.004420638084411621, 0.004598081111907959, 0.004775524139404297, 0.004952967166900635, 0.005130410194396973, 0.0053078532218933105, 0.0054852962493896484, 0.005662739276885986, 0.005840182304382324, 0.006017625331878662, 0.006195068359375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 10.0, 4.0, 8.0, 9.0, 10.0, 20.0, 28.0, 25.0, 33.0, 60.0, 50.0, 88.0, 104.0, 143.0, 174.0, 249.0, 346.0, 497.0, 732.0, 1058.0, 1680.0, 2881.0, 5376.0, 10425.0, 24858.0, 71642.0, 255669.0, 434636.0, 155413.0, 45859.0, 17354.0, 7980.0, 4253.0, 2340.0, 1325.0, 946.0, 664.0, 415.0, 302.0, 219.0, 162.0, 128.0, 76.0, 85.0, 58.0, 39.0, 35.0, 22.0, 15.0, 18.0, 10.0, 9.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-59.90625, -57.99267578125, -56.0791015625, -54.16552734375, -52.251953125, -50.33837890625, -48.4248046875, -46.51123046875, -44.59765625, -42.68408203125, -40.7705078125, -38.85693359375, -36.943359375, -35.02978515625, -33.1162109375, -31.20263671875, -29.2890625, -27.37548828125, -25.4619140625, -23.54833984375, -21.634765625, -19.72119140625, -17.8076171875, -15.89404296875, -13.98046875, -12.06689453125, -10.1533203125, -8.23974609375, -6.326171875, -4.41259765625, -2.4990234375, -0.58544921875, 1.328125, 3.24169921875, 5.1552734375, 7.06884765625, 8.982421875, 10.89599609375, 12.8095703125, 14.72314453125, 16.63671875, 18.55029296875, 20.4638671875, 22.37744140625, 24.291015625, 26.20458984375, 28.1181640625, 30.03173828125, 31.9453125, 33.85888671875, 35.7724609375, 37.68603515625, 39.599609375, 41.51318359375, 43.4267578125, 45.34033203125, 47.25390625, 49.16748046875, 51.0810546875, 52.99462890625, 54.908203125, 56.82177734375, 58.7353515625, 60.64892578125, 62.5625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 7.0, 9.0, 7.0, 9.0, 14.0, 16.0, 21.0, 37.0, 40.0, 48.0, 68.0, 80.0, 91.0, 91.0, 75.0, 84.0, 64.0, 42.0, 34.0, 40.0, 29.0, 20.0, 20.0, 6.0, 7.0, 3.0, 6.0, 5.0, 5.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.015625, -17.5037841796875, -16.991943359375, -16.4801025390625, -15.96826171875, -15.4564208984375, -14.944580078125, -14.4327392578125, -13.9208984375, -13.4090576171875, -12.897216796875, -12.3853759765625, -11.87353515625, -11.3616943359375, -10.849853515625, -10.3380126953125, -9.826171875, -9.3143310546875, -8.802490234375, -8.2906494140625, -7.77880859375, -7.2669677734375, -6.755126953125, -6.2432861328125, -5.7314453125, -5.2196044921875, -4.707763671875, -4.1959228515625, -3.68408203125, -3.1722412109375, -2.660400390625, -2.1485595703125, -1.63671875, -1.1248779296875, -0.613037109375, -0.1011962890625, 0.41064453125, 0.9224853515625, 1.434326171875, 1.9461669921875, 2.4580078125, 2.9698486328125, 3.481689453125, 3.9935302734375, 4.50537109375, 5.0172119140625, 5.529052734375, 6.0408935546875, 6.552734375, 7.0645751953125, 7.576416015625, 8.0882568359375, 8.60009765625, 9.1119384765625, 9.623779296875, 10.1356201171875, 10.6474609375, 11.1593017578125, 11.671142578125, 12.1829833984375, 12.69482421875, 13.2066650390625, 13.718505859375, 14.2303466796875, 14.7421875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 10.0, 13.0, 17.0, 25.0, 33.0, 40.0, 41.0, 68.0, 62.0, 71.0, 79.0, 80.0, 74.0, 82.0, 49.0, 52.0, 46.0, 38.0, 23.0, 17.0, 23.0, 10.0, 18.0, 4.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.158958435058594, -34.048431396484375, -32.937904357910156, -31.827377319335938, -30.71685028076172, -29.6063232421875, -28.49579620361328, -27.385269165039062, -26.274742126464844, -25.164215087890625, -24.053688049316406, -22.943161010742188, -21.83263397216797, -20.72210693359375, -19.61157989501953, -18.501052856445312, -17.39052391052246, -16.279996871948242, -15.169469833374023, -14.058942794799805, -12.948415756225586, -11.837888717651367, -10.727360725402832, -9.616833686828613, -8.506306648254395, -7.395779609680176, -6.285252571105957, -5.17472505569458, -4.064198017120361, -2.9536709785461426, -1.8431434631347656, -0.7326164245605469, 0.3779106140136719, 1.4884377717971802, 2.5989649295806885, 3.7094922065734863, 4.820019245147705, 5.930546283721924, 7.041073799133301, 8.15160083770752, 9.262127876281738, 10.372654914855957, 11.483181953430176, 12.593709945678711, 13.70423698425293, 14.814764022827148, 15.925291061401367, 17.035818099975586, 18.146345138549805, 19.256872177124023, 20.367399215698242, 21.47792625427246, 22.58845329284668, 23.6989803314209, 24.80950927734375, 25.92003631591797, 27.030563354492188, 28.141090393066406, 29.251617431640625, 30.362144470214844, 31.472671508789062, 32.58319854736328, 33.6937255859375, 34.80425262451172, 35.91477966308594]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 9.0, 11.0, 10.0, 13.0, 14.0, 24.0, 19.0, 23.0, 23.0, 27.0, 34.0, 42.0, 41.0, 30.0, 44.0, 44.0, 43.0, 56.0, 64.0, 31.0, 46.0, 40.0, 35.0, 34.0, 36.0, 25.0, 21.0, 26.0, 12.0, 18.0, 22.0, 20.0, 8.0, 11.0, 10.0, 6.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0], "bins": [-25.682144165039062, -25.01441764831543, -24.34669303894043, -23.678966522216797, -23.011241912841797, -22.343515396118164, -21.675790786743164, -21.00806427001953, -20.34033966064453, -19.6726131439209, -19.0048885345459, -18.337162017822266, -17.669437408447266, -17.001710891723633, -16.333986282348633, -15.666259765625, -14.998534202575684, -14.330808639526367, -13.66308307647705, -12.995357513427734, -12.327631950378418, -11.659906387329102, -10.992179870605469, -10.324455261230469, -9.656728744506836, -8.98900318145752, -8.321277618408203, -7.653552055358887, -6.98582649230957, -6.318100929260254, -5.650374889373779, -4.982649326324463, -4.314924240112305, -3.6471986770629883, -2.979473114013672, -2.3117473125457764, -1.64402174949646, -0.9762961864471436, -0.30857038497924805, 0.35915517807006836, 1.0268807411193848, 1.6946063041687012, 2.3623318672180176, 3.030057668685913, 3.6977832317352295, 4.365509033203125, 5.033234596252441, 5.700960159301758, 6.368685722351074, 7.036411285400391, 7.704136848449707, 8.371862411499023, 9.03958797454834, 9.707313537597656, 10.375040054321289, 11.042764663696289, 11.710491180419922, 12.378216743469238, 13.045942306518555, 13.713667869567871, 14.381393432617188, 15.049118995666504, 15.71684455871582, 16.384571075439453, 17.052295684814453]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 0.0, 1.0, 10.0, 3.0, 8.0, 15.0, 19.0, 26.0, 29.0, 53.0, 59.0, 107.0, 130.0, 208.0, 274.0, 400.0, 563.0, 849.0, 1321.0, 1987.0, 3256.0, 5486.0, 9728.0, 18277.0, 36465.0, 78318.0, 189110.0, 481992.0, 1012605.0, 1180428.0, 680732.0, 276891.0, 111198.0, 49675.0, 23701.0, 12540.0, 6947.0, 3995.0, 2328.0, 1504.0, 954.0, 635.0, 448.0, 272.0, 217.0, 169.0, 111.0, 78.0, 44.0, 43.0, 29.0, 15.0, 15.0, 4.0, 7.0, 11.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-26.171875, -25.359130859375, -24.54638671875, -23.733642578125, -22.9208984375, -22.108154296875, -21.29541015625, -20.482666015625, -19.669921875, -18.857177734375, -18.04443359375, -17.231689453125, -16.4189453125, -15.606201171875, -14.79345703125, -13.980712890625, -13.16796875, -12.355224609375, -11.54248046875, -10.729736328125, -9.9169921875, -9.104248046875, -8.29150390625, -7.478759765625, -6.666015625, -5.853271484375, -5.04052734375, -4.227783203125, -3.4150390625, -2.602294921875, -1.78955078125, -0.976806640625, -0.1640625, 0.648681640625, 1.46142578125, 2.274169921875, 3.0869140625, 3.899658203125, 4.71240234375, 5.525146484375, 6.337890625, 7.150634765625, 7.96337890625, 8.776123046875, 9.5888671875, 10.401611328125, 11.21435546875, 12.027099609375, 12.83984375, 13.652587890625, 14.46533203125, 15.278076171875, 16.0908203125, 16.903564453125, 17.71630859375, 18.529052734375, 19.341796875, 20.154541015625, 20.96728515625, 21.780029296875, 22.5927734375, 23.405517578125, 24.21826171875, 25.031005859375, 25.84375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 6.0, 5.0, 11.0, 9.0, 9.0, 20.0, 17.0, 19.0, 28.0, 33.0, 38.0, 38.0, 42.0, 49.0, 36.0, 35.0, 53.0, 47.0, 52.0, 53.0, 33.0, 39.0, 36.0, 42.0, 36.0, 35.0, 24.0, 27.0, 21.0, 18.0, 14.0, 13.0, 11.0, 4.0, 13.0, 7.0, 10.0, 9.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.203125, -16.73779296875, -16.2724609375, -15.80712890625, -15.341796875, -14.87646484375, -14.4111328125, -13.94580078125, -13.48046875, -13.01513671875, -12.5498046875, -12.08447265625, -11.619140625, -11.15380859375, -10.6884765625, -10.22314453125, -9.7578125, -9.29248046875, -8.8271484375, -8.36181640625, -7.896484375, -7.43115234375, -6.9658203125, -6.50048828125, -6.03515625, -5.56982421875, -5.1044921875, -4.63916015625, -4.173828125, -3.70849609375, -3.2431640625, -2.77783203125, -2.3125, -1.84716796875, -1.3818359375, -0.91650390625, -0.451171875, 0.01416015625, 0.4794921875, 0.94482421875, 1.41015625, 1.87548828125, 2.3408203125, 2.80615234375, 3.271484375, 3.73681640625, 4.2021484375, 4.66748046875, 5.1328125, 5.59814453125, 6.0634765625, 6.52880859375, 6.994140625, 7.45947265625, 7.9248046875, 8.39013671875, 8.85546875, 9.32080078125, 9.7861328125, 10.25146484375, 10.716796875, 11.18212890625, 11.6474609375, 12.11279296875, 12.578125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 10.0, 2.0, 7.0, 18.0, 22.0, 30.0, 59.0, 91.0, 138.0, 225.0, 387.0, 639.0, 1103.0, 1928.0, 3652.0, 7004.0, 14974.0, 34399.0, 92583.0, 283054.0, 863133.0, 1504970.0, 915640.0, 304507.0, 98059.0, 36396.0, 15498.0, 7339.0, 3711.0, 1985.0, 1061.0, 603.0, 395.0, 238.0, 157.0, 95.0, 58.0, 45.0, 24.0, 10.0, 10.0, 11.0, 7.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.125, -31.037109375, -29.94921875, -28.861328125, -27.7734375, -26.685546875, -25.59765625, -24.509765625, -23.421875, -22.333984375, -21.24609375, -20.158203125, -19.0703125, -17.982421875, -16.89453125, -15.806640625, -14.71875, -13.630859375, -12.54296875, -11.455078125, -10.3671875, -9.279296875, -8.19140625, -7.103515625, -6.015625, -4.927734375, -3.83984375, -2.751953125, -1.6640625, -0.576171875, 0.51171875, 1.599609375, 2.6875, 3.775390625, 4.86328125, 5.951171875, 7.0390625, 8.126953125, 9.21484375, 10.302734375, 11.390625, 12.478515625, 13.56640625, 14.654296875, 15.7421875, 16.830078125, 17.91796875, 19.005859375, 20.09375, 21.181640625, 22.26953125, 23.357421875, 24.4453125, 25.533203125, 26.62109375, 27.708984375, 28.796875, 29.884765625, 30.97265625, 32.060546875, 33.1484375, 34.236328125, 35.32421875, 36.412109375, 37.5]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 3.0, 7.0, 10.0, 12.0, 19.0, 12.0, 24.0, 36.0, 50.0, 74.0, 66.0, 85.0, 113.0, 141.0, 176.0, 236.0, 237.0, 264.0, 289.0, 290.0, 269.0, 290.0, 264.0, 216.0, 168.0, 149.0, 118.0, 98.0, 79.0, 59.0, 45.0, 39.0, 31.0, 30.0, 9.0, 13.0, 18.0, 11.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.18359375, -6.93829345703125, -6.6929931640625, -6.44769287109375, -6.202392578125, -5.95709228515625, -5.7117919921875, -5.46649169921875, -5.22119140625, -4.97589111328125, -4.7305908203125, -4.48529052734375, -4.239990234375, -3.99468994140625, -3.7493896484375, -3.50408935546875, -3.2587890625, -3.01348876953125, -2.7681884765625, -2.52288818359375, -2.277587890625, -2.03228759765625, -1.7869873046875, -1.54168701171875, -1.29638671875, -1.05108642578125, -0.8057861328125, -0.56048583984375, -0.315185546875, -0.06988525390625, 0.1754150390625, 0.42071533203125, 0.666015625, 0.91131591796875, 1.1566162109375, 1.40191650390625, 1.647216796875, 1.89251708984375, 2.1378173828125, 2.38311767578125, 2.62841796875, 2.87371826171875, 3.1190185546875, 3.36431884765625, 3.609619140625, 3.85491943359375, 4.1002197265625, 4.34552001953125, 4.5908203125, 4.83612060546875, 5.0814208984375, 5.32672119140625, 5.572021484375, 5.81732177734375, 6.0626220703125, 6.30792236328125, 6.55322265625, 6.79852294921875, 7.0438232421875, 7.28912353515625, 7.534423828125, 7.77972412109375, 8.0250244140625, 8.27032470703125, 8.515625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 9.0, 9.0, 15.0, 18.0, 32.0, 22.0, 55.0, 59.0, 69.0, 91.0, 100.0, 106.0, 82.0, 101.0, 62.0, 45.0, 35.0, 25.0, 16.0, 17.0, 13.0, 9.0, 7.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.2837028503418, -36.24574279785156, -35.207786560058594, -34.16982650756836, -33.131866455078125, -32.093910217285156, -31.055950164794922, -30.01799201965332, -28.98003387451172, -27.942075729370117, -26.904115676879883, -25.86615753173828, -24.82819938659668, -23.790241241455078, -22.752281188964844, -21.714323043823242, -20.676362991333008, -19.638404846191406, -18.600444793701172, -17.56248664855957, -16.52452850341797, -15.48656940460205, -14.448610305786133, -13.410652160644531, -12.372693061828613, -11.334733963012695, -10.296775817871094, -9.258816719055176, -8.220857620239258, -7.182899475097656, -6.144940376281738, -5.1069817543029785, -4.069023132324219, -3.031064510345459, -1.9931056499481201, -0.9551467895507812, 0.08281183242797852, 1.1207704544067383, 2.1587295532226562, 3.196688175201416, 4.234646797180176, 5.2726054191589355, 6.310564041137695, 7.348523139953613, 8.386482238769531, 9.424440383911133, 10.46239948272705, 11.500358581542969, 12.53831672668457, 13.576275825500488, 14.61423397064209, 15.652193069458008, 16.69015121459961, 17.728111267089844, 18.766069412231445, 19.804027557373047, 20.84198760986328, 21.879945755004883, 22.917905807495117, 23.95586395263672, 24.99382209777832, 26.031780242919922, 27.069740295410156, 28.107698440551758, 29.14565658569336]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 10.0, 6.0, 13.0, 7.0, 14.0, 18.0, 25.0, 22.0, 25.0, 22.0, 38.0, 29.0, 29.0, 38.0, 50.0, 50.0, 40.0, 43.0, 38.0, 37.0, 45.0, 48.0, 37.0, 35.0, 32.0, 31.0, 25.0, 22.0, 24.0, 25.0, 23.0, 21.0, 9.0, 17.0, 6.0, 7.0, 5.0, 5.0, 7.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.662553787231445, -19.122377395629883, -18.58220100402832, -18.042022705078125, -17.501846313476562, -16.961669921875, -16.421493530273438, -15.881317138671875, -15.341140747070312, -14.80096435546875, -14.260787010192871, -13.720610618591309, -13.180434226989746, -12.640256881713867, -12.100080490112305, -11.559904098510742, -11.019726753234863, -10.4795503616333, -9.939373016357422, -9.39919662475586, -8.859020233154297, -8.318843841552734, -7.7786664962768555, -7.238490104675293, -6.698313236236572, -6.158136367797852, -5.617959976196289, -5.077783107757568, -4.537606239318848, -3.997429847717285, -3.4572529792785645, -2.917076349258423, -2.3768997192382812, -1.8367230892181396, -1.2965463399887085, -0.7563695907592773, -0.21619296073913574, 0.32398366928100586, 0.8641605377197266, 1.4043371677398682, 1.9445137977600098, 2.4846904277801514, 3.024867057800293, 3.5650439262390137, 4.105220794677734, 4.645397186279297, 5.185574054718018, 5.725750923156738, 6.265927314758301, 6.8061041831970215, 7.346280574798584, 7.886457443237305, 8.426633834838867, 8.96681022644043, 9.506987571716309, 10.047163963317871, 10.58734130859375, 11.127517700195312, 11.667695045471191, 12.207871437072754, 12.748047828674316, 13.288225173950195, 13.828401565551758, 14.36857795715332, 14.908754348754883]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 6.0, 6.0, 5.0, 10.0, 21.0, 22.0, 27.0, 36.0, 50.0, 75.0, 100.0, 130.0, 203.0, 278.0, 396.0, 582.0, 815.0, 1219.0, 1731.0, 2697.0, 4228.0, 6765.0, 11326.0, 19186.0, 33777.0, 62785.0, 123059.0, 228251.0, 246222.0, 140449.0, 71329.0, 37613.0, 21316.0, 12522.0, 7502.0, 4717.0, 2992.0, 1912.0, 1235.0, 877.0, 607.0, 442.0, 289.0, 187.0, 176.0, 113.0, 67.0, 76.0, 48.0, 25.0, 20.0, 15.0, 11.0, 7.0, 10.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.859375, -29.89794921875, -28.9365234375, -27.97509765625, -27.013671875, -26.05224609375, -25.0908203125, -24.12939453125, -23.16796875, -22.20654296875, -21.2451171875, -20.28369140625, -19.322265625, -18.36083984375, -17.3994140625, -16.43798828125, -15.4765625, -14.51513671875, -13.5537109375, -12.59228515625, -11.630859375, -10.66943359375, -9.7080078125, -8.74658203125, -7.78515625, -6.82373046875, -5.8623046875, -4.90087890625, -3.939453125, -2.97802734375, -2.0166015625, -1.05517578125, -0.09375, 0.86767578125, 1.8291015625, 2.79052734375, 3.751953125, 4.71337890625, 5.6748046875, 6.63623046875, 7.59765625, 8.55908203125, 9.5205078125, 10.48193359375, 11.443359375, 12.40478515625, 13.3662109375, 14.32763671875, 15.2890625, 16.25048828125, 17.2119140625, 18.17333984375, 19.134765625, 20.09619140625, 21.0576171875, 22.01904296875, 22.98046875, 23.94189453125, 24.9033203125, 25.86474609375, 26.826171875, 27.78759765625, 28.7490234375, 29.71044921875, 30.671875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 5.0, 5.0, 4.0, 10.0, 12.0, 13.0, 10.0, 16.0, 24.0, 30.0, 25.0, 24.0, 27.0, 29.0, 32.0, 46.0, 32.0, 37.0, 47.0, 49.0, 50.0, 44.0, 44.0, 34.0, 39.0, 29.0, 44.0, 23.0, 27.0, 23.0, 22.0, 17.0, 14.0, 20.0, 17.0, 16.0, 10.0, 15.0, 6.0, 7.0, 1.0, 4.0, 10.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-18.5625, -18.0382080078125, -17.513916015625, -16.9896240234375, -16.46533203125, -15.9410400390625, -15.416748046875, -14.8924560546875, -14.3681640625, -13.8438720703125, -13.319580078125, -12.7952880859375, -12.27099609375, -11.7467041015625, -11.222412109375, -10.6981201171875, -10.173828125, -9.6495361328125, -9.125244140625, -8.6009521484375, -8.07666015625, -7.5523681640625, -7.028076171875, -6.5037841796875, -5.9794921875, -5.4552001953125, -4.930908203125, -4.4066162109375, -3.88232421875, -3.3580322265625, -2.833740234375, -2.3094482421875, -1.78515625, -1.2608642578125, -0.736572265625, -0.2122802734375, 0.31201171875, 0.8363037109375, 1.360595703125, 1.8848876953125, 2.4091796875, 2.9334716796875, 3.457763671875, 3.9820556640625, 4.50634765625, 5.0306396484375, 5.554931640625, 6.0792236328125, 6.603515625, 7.1278076171875, 7.652099609375, 8.1763916015625, 8.70068359375, 9.2249755859375, 9.749267578125, 10.2735595703125, 10.7978515625, 11.3221435546875, 11.846435546875, 12.3707275390625, 12.89501953125, 13.4193115234375, 13.943603515625, 14.4678955078125, 14.9921875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 13.0, 18.0, 23.0, 38.0, 54.0, 82.0, 97.0, 161.0, 228.0, 375.0, 596.0, 962.0, 1520.0, 2698.0, 4725.0, 8208.0, 15908.0, 32888.0, 73997.0, 199742.0, 393212.0, 180466.0, 67856.0, 30835.0, 14949.0, 7986.0, 4433.0, 2462.0, 1429.0, 923.0, 587.0, 344.0, 231.0, 161.0, 94.0, 77.0, 46.0, 36.0, 29.0, 15.0, 7.0, 9.0, 8.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-45.25, -43.9365234375, -42.623046875, -41.3095703125, -39.99609375, -38.6826171875, -37.369140625, -36.0556640625, -34.7421875, -33.4287109375, -32.115234375, -30.8017578125, -29.48828125, -28.1748046875, -26.861328125, -25.5478515625, -24.234375, -22.9208984375, -21.607421875, -20.2939453125, -18.98046875, -17.6669921875, -16.353515625, -15.0400390625, -13.7265625, -12.4130859375, -11.099609375, -9.7861328125, -8.47265625, -7.1591796875, -5.845703125, -4.5322265625, -3.21875, -1.9052734375, -0.591796875, 0.7216796875, 2.03515625, 3.3486328125, 4.662109375, 5.9755859375, 7.2890625, 8.6025390625, 9.916015625, 11.2294921875, 12.54296875, 13.8564453125, 15.169921875, 16.4833984375, 17.796875, 19.1103515625, 20.423828125, 21.7373046875, 23.05078125, 24.3642578125, 25.677734375, 26.9912109375, 28.3046875, 29.6181640625, 30.931640625, 32.2451171875, 33.55859375, 34.8720703125, 36.185546875, 37.4990234375, 38.8125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 11.0, 12.0, 6.0, 10.0, 10.0, 12.0, 15.0, 22.0, 27.0, 28.0, 27.0, 22.0, 27.0, 35.0, 46.0, 43.0, 46.0, 49.0, 51.0, 43.0, 42.0, 63.0, 28.0, 33.0, 30.0, 34.0, 30.0, 29.0, 25.0, 26.0, 15.0, 21.0, 18.0, 15.0, 12.0, 8.0, 5.0, 3.0, 7.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.15625, -11.763916015625, -11.37158203125, -10.979248046875, -10.5869140625, -10.194580078125, -9.80224609375, -9.409912109375, -9.017578125, -8.625244140625, -8.23291015625, -7.840576171875, -7.4482421875, -7.055908203125, -6.66357421875, -6.271240234375, -5.87890625, -5.486572265625, -5.09423828125, -4.701904296875, -4.3095703125, -3.917236328125, -3.52490234375, -3.132568359375, -2.740234375, -2.347900390625, -1.95556640625, -1.563232421875, -1.1708984375, -0.778564453125, -0.38623046875, 0.006103515625, 0.3984375, 0.790771484375, 1.18310546875, 1.575439453125, 1.9677734375, 2.360107421875, 2.75244140625, 3.144775390625, 3.537109375, 3.929443359375, 4.32177734375, 4.714111328125, 5.1064453125, 5.498779296875, 5.89111328125, 6.283447265625, 6.67578125, 7.068115234375, 7.46044921875, 7.852783203125, 8.2451171875, 8.637451171875, 9.02978515625, 9.422119140625, 9.814453125, 10.206787109375, 10.59912109375, 10.991455078125, 11.3837890625, 11.776123046875, 12.16845703125, 12.560791015625, 12.953125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 15.0, 9.0, 21.0, 26.0, 22.0, 39.0, 36.0, 77.0, 100.0, 142.0, 193.0, 282.0, 422.0, 669.0, 970.0, 1492.0, 2399.0, 3941.0, 6787.0, 12799.0, 27673.0, 75725.0, 295074.0, 432505.0, 112975.0, 37151.0, 16169.0, 8173.0, 4600.0, 2820.0, 1807.0, 1102.0, 736.0, 504.0, 311.0, 250.0, 174.0, 97.0, 77.0, 49.0, 35.0, 31.0, 27.0, 14.0, 9.0, 7.0, 4.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-30.34375, -29.4287109375, -28.513671875, -27.5986328125, -26.68359375, -25.7685546875, -24.853515625, -23.9384765625, -23.0234375, -22.1083984375, -21.193359375, -20.2783203125, -19.36328125, -18.4482421875, -17.533203125, -16.6181640625, -15.703125, -14.7880859375, -13.873046875, -12.9580078125, -12.04296875, -11.1279296875, -10.212890625, -9.2978515625, -8.3828125, -7.4677734375, -6.552734375, -5.6376953125, -4.72265625, -3.8076171875, -2.892578125, -1.9775390625, -1.0625, -0.1474609375, 0.767578125, 1.6826171875, 2.59765625, 3.5126953125, 4.427734375, 5.3427734375, 6.2578125, 7.1728515625, 8.087890625, 9.0029296875, 9.91796875, 10.8330078125, 11.748046875, 12.6630859375, 13.578125, 14.4931640625, 15.408203125, 16.3232421875, 17.23828125, 18.1533203125, 19.068359375, 19.9833984375, 20.8984375, 21.8134765625, 22.728515625, 23.6435546875, 24.55859375, 25.4736328125, 26.388671875, 27.3037109375, 28.21875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 6.0, 8.0, 16.0, 6.0, 12.0, 24.0, 55.0, 74.0, 120.0, 165.0, 180.0, 96.0, 71.0, 36.0, 31.0, 13.0, 14.0, 11.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0026073455810546875, -0.0025326311588287354, -0.002457916736602783, -0.002383202314376831, -0.002308487892150879, -0.0022337734699249268, -0.0021590590476989746, -0.0020843446254730225, -0.0020096302032470703, -0.0019349157810211182, -0.001860201358795166, -0.0017854869365692139, -0.0017107725143432617, -0.0016360580921173096, -0.0015613436698913574, -0.0014866292476654053, -0.0014119148254394531, -0.001337200403213501, -0.0012624859809875488, -0.0011877715587615967, -0.0011130571365356445, -0.0010383427143096924, -0.0009636282920837402, -0.0008889138698577881, -0.0008141994476318359, -0.0007394850254058838, -0.0006647706031799316, -0.0005900561809539795, -0.0005153417587280273, -0.0004406273365020752, -0.00036591291427612305, -0.0002911984920501709, -0.00021648406982421875, -0.0001417696475982666, -6.705522537231445e-05, 7.659196853637695e-06, 8.237361907958984e-05, 0.000157088041305542, 0.00023180246353149414, 0.0003065168857574463, 0.00038123130798339844, 0.0004559457302093506, 0.0005306601524353027, 0.0006053745746612549, 0.000680088996887207, 0.0007548034191131592, 0.0008295178413391113, 0.0009042322635650635, 0.0009789466857910156, 0.0010536611080169678, 0.00112837553024292, 0.001203089952468872, 0.0012778043746948242, 0.0013525187969207764, 0.0014272332191467285, 0.0015019476413726807, 0.0015766620635986328, 0.001651376485824585, 0.0017260909080505371, 0.0018008053302764893, 0.0018755197525024414, 0.0019502341747283936, 0.0020249485969543457, 0.002099663019180298, 0.00217437744140625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 22.0, 18.0, 24.0, 48.0, 54.0, 62.0, 87.0, 151.0, 209.0, 312.0, 517.0, 730.0, 1097.0, 1633.0, 2732.0, 4273.0, 7241.0, 12758.0, 25490.0, 57481.0, 143500.0, 317207.0, 269719.0, 109830.0, 44866.0, 20990.0, 10791.0, 6195.0, 3798.0, 2325.0, 1454.0, 951.0, 622.0, 422.0, 304.0, 197.0, 132.0, 92.0, 68.0, 53.0, 29.0, 16.0, 16.0, 11.0, 11.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-23.4375, -22.76513671875, -22.0927734375, -21.42041015625, -20.748046875, -20.07568359375, -19.4033203125, -18.73095703125, -18.05859375, -17.38623046875, -16.7138671875, -16.04150390625, -15.369140625, -14.69677734375, -14.0244140625, -13.35205078125, -12.6796875, -12.00732421875, -11.3349609375, -10.66259765625, -9.990234375, -9.31787109375, -8.6455078125, -7.97314453125, -7.30078125, -6.62841796875, -5.9560546875, -5.28369140625, -4.611328125, -3.93896484375, -3.2666015625, -2.59423828125, -1.921875, -1.24951171875, -0.5771484375, 0.09521484375, 0.767578125, 1.43994140625, 2.1123046875, 2.78466796875, 3.45703125, 4.12939453125, 4.8017578125, 5.47412109375, 6.146484375, 6.81884765625, 7.4912109375, 8.16357421875, 8.8359375, 9.50830078125, 10.1806640625, 10.85302734375, 11.525390625, 12.19775390625, 12.8701171875, 13.54248046875, 14.21484375, 14.88720703125, 15.5595703125, 16.23193359375, 16.904296875, 17.57666015625, 18.2490234375, 18.92138671875, 19.59375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 8.0, 4.0, 4.0, 5.0, 7.0, 9.0, 19.0, 12.0, 21.0, 23.0, 35.0, 31.0, 57.0, 65.0, 87.0, 84.0, 104.0, 79.0, 79.0, 50.0, 31.0, 37.0, 24.0, 34.0, 17.0, 15.0, 4.0, 4.0, 7.0, 5.0, 5.0, 9.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.578125, -5.380126953125, -5.18212890625, -4.984130859375, -4.7861328125, -4.588134765625, -4.39013671875, -4.192138671875, -3.994140625, -3.796142578125, -3.59814453125, -3.400146484375, -3.2021484375, -3.004150390625, -2.80615234375, -2.608154296875, -2.41015625, -2.212158203125, -2.01416015625, -1.816162109375, -1.6181640625, -1.420166015625, -1.22216796875, -1.024169921875, -0.826171875, -0.628173828125, -0.43017578125, -0.232177734375, -0.0341796875, 0.163818359375, 0.36181640625, 0.559814453125, 0.7578125, 0.955810546875, 1.15380859375, 1.351806640625, 1.5498046875, 1.747802734375, 1.94580078125, 2.143798828125, 2.341796875, 2.539794921875, 2.73779296875, 2.935791015625, 3.1337890625, 3.331787109375, 3.52978515625, 3.727783203125, 3.92578125, 4.123779296875, 4.32177734375, 4.519775390625, 4.7177734375, 4.915771484375, 5.11376953125, 5.311767578125, 5.509765625, 5.707763671875, 5.90576171875, 6.103759765625, 6.3017578125, 6.499755859375, 6.69775390625, 6.895751953125, 7.09375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 9.0, 14.0, 17.0, 26.0, 26.0, 22.0, 47.0, 67.0, 86.0, 92.0, 96.0, 110.0, 99.0, 70.0, 52.0, 49.0, 27.0, 27.0, 23.0, 15.0, 9.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.76021194458008, -33.79523468017578, -32.830257415771484, -31.865278244018555, -30.900300979614258, -29.93532371520996, -28.97034454345703, -28.005367279052734, -27.040390014648438, -26.07541275024414, -25.110435485839844, -24.145456314086914, -23.180479049682617, -22.21550178527832, -21.25052261352539, -20.285545349121094, -19.320568084716797, -18.3555908203125, -17.390613555908203, -16.425634384155273, -15.460657119750977, -14.49567985534668, -13.530701637268066, -12.565723419189453, -11.600746154785156, -10.63576889038086, -9.670790672302246, -8.705812454223633, -7.740835189819336, -6.775857448577881, -5.810879707336426, -4.845901966094971, -3.880922317504883, -2.9159445762634277, -1.9509668350219727, -0.9859890937805176, -0.0210113525390625, 0.9439663887023926, 1.9089441299438477, 2.8739218711853027, 3.838899612426758, 4.803877353668213, 5.768855094909668, 6.733832836151123, 7.698810577392578, 8.663787841796875, 9.628766059875488, 10.593744277954102, 11.558721542358398, 12.523698806762695, 13.488677024841309, 14.453655242919922, 15.418632507324219, 16.383609771728516, 17.348587036132812, 18.313566207885742, 19.27854347229004, 20.243520736694336, 21.208499908447266, 22.173477172851562, 23.13845443725586, 24.103431701660156, 25.068408966064453, 26.033388137817383, 26.99836540222168]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 3.0, 7.0, 11.0, 11.0, 11.0, 16.0, 24.0, 21.0, 20.0, 20.0, 26.0, 24.0, 32.0, 36.0, 35.0, 38.0, 42.0, 45.0, 27.0, 51.0, 45.0, 38.0, 37.0, 42.0, 36.0, 34.0, 28.0, 37.0, 22.0, 19.0, 19.0, 23.0, 21.0, 17.0, 15.0, 13.0, 14.0, 7.0, 2.0, 5.0, 4.0, 12.0, 0.0, 3.0, 4.0, 1.0, 2.0], "bins": [-18.848363876342773, -18.33615493774414, -17.823945999145508, -17.311737060546875, -16.799528121948242, -16.28731918334961, -15.775110244750977, -15.262901306152344, -14.750692367553711, -14.238483428955078, -13.726274490356445, -13.214065551757812, -12.70185661315918, -12.189647674560547, -11.677438735961914, -11.165229797363281, -10.653019905090332, -10.1408109664917, -9.628602027893066, -9.116393089294434, -8.6041841506958, -8.091975212097168, -7.579765796661377, -7.067556858062744, -6.555347919464111, -6.0431389808654785, -5.530930042266846, -5.018720626831055, -4.506511688232422, -3.994302988052368, -3.4820938110351562, -2.9698848724365234, -2.4576759338378906, -1.9454669952392578, -1.4332579374313354, -0.9210488796234131, -0.4088399410247803, 0.10336899757385254, 0.6155781745910645, 1.1277871131896973, 1.63999605178833, 2.152204990386963, 2.6644139289855957, 3.1766231060028076, 3.6888320446014404, 4.201041221618652, 4.713250160217285, 5.225459098815918, 5.737668037414551, 6.249876976013184, 6.762085914611816, 7.274294853210449, 7.786503791809082, 8.298712730407715, 8.810922622680664, 9.323131561279297, 9.83534049987793, 10.347549438476562, 10.859758377075195, 11.371967315673828, 11.884176254272461, 12.396385192871094, 12.908594131469727, 13.42080307006836, 13.933012008666992]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 12.0, 12.0, 12.0, 17.0, 30.0, 42.0, 44.0, 70.0, 98.0, 137.0, 184.0, 289.0, 443.0, 639.0, 1032.0, 1677.0, 2718.0, 4701.0, 8176.0, 14723.0, 27208.0, 50536.0, 92392.0, 155488.0, 208755.0, 192348.0, 127225.0, 71836.0, 39098.0, 20855.0, 11583.0, 6468.0, 3685.0, 2198.0, 1296.0, 821.0, 549.0, 357.0, 216.0, 164.0, 100.0, 85.0, 60.0, 58.0, 34.0, 27.0, 16.0, 16.0, 7.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 5.0, 2.0], "bins": [-24.671875, -23.895751953125, -23.11962890625, -22.343505859375, -21.5673828125, -20.791259765625, -20.01513671875, -19.239013671875, -18.462890625, -17.686767578125, -16.91064453125, -16.134521484375, -15.3583984375, -14.582275390625, -13.80615234375, -13.030029296875, -12.25390625, -11.477783203125, -10.70166015625, -9.925537109375, -9.1494140625, -8.373291015625, -7.59716796875, -6.821044921875, -6.044921875, -5.268798828125, -4.49267578125, -3.716552734375, -2.9404296875, -2.164306640625, -1.38818359375, -0.612060546875, 0.1640625, 0.940185546875, 1.71630859375, 2.492431640625, 3.2685546875, 4.044677734375, 4.82080078125, 5.596923828125, 6.373046875, 7.149169921875, 7.92529296875, 8.701416015625, 9.4775390625, 10.253662109375, 11.02978515625, 11.805908203125, 12.58203125, 13.358154296875, 14.13427734375, 14.910400390625, 15.6865234375, 16.462646484375, 17.23876953125, 18.014892578125, 18.791015625, 19.567138671875, 20.34326171875, 21.119384765625, 21.8955078125, 22.671630859375, 23.44775390625, 24.223876953125, 25.0]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 7.0, 12.0, 13.0, 15.0, 23.0, 27.0, 26.0, 26.0, 21.0, 29.0, 41.0, 35.0, 29.0, 48.0, 42.0, 44.0, 43.0, 56.0, 35.0, 42.0, 40.0, 31.0, 32.0, 30.0, 40.0, 26.0, 20.0, 20.0, 25.0, 17.0, 15.0, 16.0, 14.0, 7.0, 5.0, 9.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0], "bins": [-20.015625, -19.498046875, -18.98046875, -18.462890625, -17.9453125, -17.427734375, -16.91015625, -16.392578125, -15.875, -15.357421875, -14.83984375, -14.322265625, -13.8046875, -13.287109375, -12.76953125, -12.251953125, -11.734375, -11.216796875, -10.69921875, -10.181640625, -9.6640625, -9.146484375, -8.62890625, -8.111328125, -7.59375, -7.076171875, -6.55859375, -6.041015625, -5.5234375, -5.005859375, -4.48828125, -3.970703125, -3.453125, -2.935546875, -2.41796875, -1.900390625, -1.3828125, -0.865234375, -0.34765625, 0.169921875, 0.6875, 1.205078125, 1.72265625, 2.240234375, 2.7578125, 3.275390625, 3.79296875, 4.310546875, 4.828125, 5.345703125, 5.86328125, 6.380859375, 6.8984375, 7.416015625, 7.93359375, 8.451171875, 8.96875, 9.486328125, 10.00390625, 10.521484375, 11.0390625, 11.556640625, 12.07421875, 12.591796875, 13.109375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 13.0, 18.0, 16.0, 29.0, 53.0, 71.0, 95.0, 157.0, 261.0, 475.0, 759.0, 1350.0, 2343.0, 4291.0, 8288.0, 15986.0, 32683.0, 68361.0, 134378.0, 217507.0, 234706.0, 160673.0, 83622.0, 40690.0, 19781.0, 9983.0, 5133.0, 2865.0, 1612.0, 924.0, 519.0, 348.0, 200.0, 131.0, 59.0, 73.0, 31.0, 23.0, 10.0, 13.0, 8.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.78125, -21.942138671875, -21.10302734375, -20.263916015625, -19.4248046875, -18.585693359375, -17.74658203125, -16.907470703125, -16.068359375, -15.229248046875, -14.39013671875, -13.551025390625, -12.7119140625, -11.872802734375, -11.03369140625, -10.194580078125, -9.35546875, -8.516357421875, -7.67724609375, -6.838134765625, -5.9990234375, -5.159912109375, -4.32080078125, -3.481689453125, -2.642578125, -1.803466796875, -0.96435546875, -0.125244140625, 0.7138671875, 1.552978515625, 2.39208984375, 3.231201171875, 4.0703125, 4.909423828125, 5.74853515625, 6.587646484375, 7.4267578125, 8.265869140625, 9.10498046875, 9.944091796875, 10.783203125, 11.622314453125, 12.46142578125, 13.300537109375, 14.1396484375, 14.978759765625, 15.81787109375, 16.656982421875, 17.49609375, 18.335205078125, 19.17431640625, 20.013427734375, 20.8525390625, 21.691650390625, 22.53076171875, 23.369873046875, 24.208984375, 25.048095703125, 25.88720703125, 26.726318359375, 27.5654296875, 28.404541015625, 29.24365234375, 30.082763671875, 30.921875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 1.0, 1.0, 6.0, 5.0, 4.0, 13.0, 7.0, 7.0, 14.0, 15.0, 36.0, 28.0, 15.0, 26.0, 22.0, 16.0, 34.0, 24.0, 24.0, 38.0, 43.0, 38.0, 34.0, 46.0, 38.0, 47.0, 49.0, 32.0, 44.0, 34.0, 27.0, 33.0, 33.0, 26.0, 17.0, 17.0, 17.0, 15.0, 11.0, 17.0, 12.0, 9.0, 4.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-11.9375, -11.574951171875, -11.21240234375, -10.849853515625, -10.4873046875, -10.124755859375, -9.76220703125, -9.399658203125, -9.037109375, -8.674560546875, -8.31201171875, -7.949462890625, -7.5869140625, -7.224365234375, -6.86181640625, -6.499267578125, -6.13671875, -5.774169921875, -5.41162109375, -5.049072265625, -4.6865234375, -4.323974609375, -3.96142578125, -3.598876953125, -3.236328125, -2.873779296875, -2.51123046875, -2.148681640625, -1.7861328125, -1.423583984375, -1.06103515625, -0.698486328125, -0.3359375, 0.026611328125, 0.38916015625, 0.751708984375, 1.1142578125, 1.476806640625, 1.83935546875, 2.201904296875, 2.564453125, 2.927001953125, 3.28955078125, 3.652099609375, 4.0146484375, 4.377197265625, 4.73974609375, 5.102294921875, 5.46484375, 5.827392578125, 6.18994140625, 6.552490234375, 6.9150390625, 7.277587890625, 7.64013671875, 8.002685546875, 8.365234375, 8.727783203125, 9.09033203125, 9.452880859375, 9.8154296875, 10.177978515625, 10.54052734375, 10.903076171875, 11.265625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 18.0, 18.0, 40.0, 59.0, 90.0, 126.0, 191.0, 295.0, 362.0, 603.0, 1008.0, 1512.0, 2628.0, 4468.0, 7970.0, 15788.0, 33204.0, 79549.0, 217725.0, 368834.0, 184525.0, 68239.0, 29288.0, 13986.0, 7495.0, 4094.0, 2328.0, 1516.0, 904.0, 612.0, 353.0, 228.0, 166.0, 98.0, 56.0, 52.0, 39.0, 23.0, 19.0, 13.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-38.625, -37.46923828125, -36.3134765625, -35.15771484375, -34.001953125, -32.84619140625, -31.6904296875, -30.53466796875, -29.37890625, -28.22314453125, -27.0673828125, -25.91162109375, -24.755859375, -23.60009765625, -22.4443359375, -21.28857421875, -20.1328125, -18.97705078125, -17.8212890625, -16.66552734375, -15.509765625, -14.35400390625, -13.1982421875, -12.04248046875, -10.88671875, -9.73095703125, -8.5751953125, -7.41943359375, -6.263671875, -5.10791015625, -3.9521484375, -2.79638671875, -1.640625, -0.48486328125, 0.6708984375, 1.82666015625, 2.982421875, 4.13818359375, 5.2939453125, 6.44970703125, 7.60546875, 8.76123046875, 9.9169921875, 11.07275390625, 12.228515625, 13.38427734375, 14.5400390625, 15.69580078125, 16.8515625, 18.00732421875, 19.1630859375, 20.31884765625, 21.474609375, 22.63037109375, 23.7861328125, 24.94189453125, 26.09765625, 27.25341796875, 28.4091796875, 29.56494140625, 30.720703125, 31.87646484375, 33.0322265625, 34.18798828125, 35.34375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 8.0, 6.0, 3.0, 3.0, 6.0, 7.0, 10.0, 13.0, 24.0, 33.0, 38.0, 58.0, 52.0, 63.0, 73.0, 81.0, 78.0, 77.0, 70.0, 54.0, 49.0, 49.0, 26.0, 28.0, 16.0, 14.0, 10.0, 7.0, 11.0, 8.0, 4.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.002002716064453125, -0.0019365549087524414, -0.0018703937530517578, -0.0018042325973510742, -0.0017380714416503906, -0.001671910285949707, -0.0016057491302490234, -0.0015395879745483398, -0.0014734268188476562, -0.0014072656631469727, -0.001341104507446289, -0.0012749433517456055, -0.0012087821960449219, -0.0011426210403442383, -0.0010764598846435547, -0.001010298728942871, -0.0009441375732421875, -0.0008779764175415039, -0.0008118152618408203, -0.0007456541061401367, -0.0006794929504394531, -0.0006133317947387695, -0.0005471706390380859, -0.00048100948333740234, -0.00041484832763671875, -0.00034868717193603516, -0.00028252601623535156, -0.00021636486053466797, -0.00015020370483398438, -8.404254913330078e-05, -1.7881393432617188e-05, 4.8279762268066406e-05, 0.00011444091796875, 0.0001806020736694336, 0.0002467632293701172, 0.0003129243850708008, 0.0003790855407714844, 0.00044524669647216797, 0.0005114078521728516, 0.0005775690078735352, 0.0006437301635742188, 0.0007098913192749023, 0.0007760524749755859, 0.0008422136306762695, 0.0009083747863769531, 0.0009745359420776367, 0.0010406970977783203, 0.001106858253479004, 0.0011730194091796875, 0.001239180564880371, 0.0013053417205810547, 0.0013715028762817383, 0.0014376640319824219, 0.0015038251876831055, 0.001569986343383789, 0.0016361474990844727, 0.0017023086547851562, 0.0017684698104858398, 0.0018346309661865234, 0.001900792121887207, 0.0019669532775878906, 0.0020331144332885742, 0.002099275588989258, 0.0021654367446899414, 0.002231597900390625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 0.0, 5.0, 9.0, 9.0, 5.0, 15.0, 25.0, 25.0, 36.0, 51.0, 55.0, 105.0, 116.0, 187.0, 277.0, 443.0, 645.0, 949.0, 1577.0, 2885.0, 5283.0, 10742.0, 25981.0, 73518.0, 230999.0, 401591.0, 190337.0, 59934.0, 22018.0, 9492.0, 4553.0, 2465.0, 1420.0, 898.0, 564.0, 388.0, 264.0, 187.0, 146.0, 85.0, 71.0, 55.0, 41.0, 35.0, 29.0, 19.0, 8.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.8125, -34.67236328125, -33.5322265625, -32.39208984375, -31.251953125, -30.11181640625, -28.9716796875, -27.83154296875, -26.69140625, -25.55126953125, -24.4111328125, -23.27099609375, -22.130859375, -20.99072265625, -19.8505859375, -18.71044921875, -17.5703125, -16.43017578125, -15.2900390625, -14.14990234375, -13.009765625, -11.86962890625, -10.7294921875, -9.58935546875, -8.44921875, -7.30908203125, -6.1689453125, -5.02880859375, -3.888671875, -2.74853515625, -1.6083984375, -0.46826171875, 0.671875, 1.81201171875, 2.9521484375, 4.09228515625, 5.232421875, 6.37255859375, 7.5126953125, 8.65283203125, 9.79296875, 10.93310546875, 12.0732421875, 13.21337890625, 14.353515625, 15.49365234375, 16.6337890625, 17.77392578125, 18.9140625, 20.05419921875, 21.1943359375, 22.33447265625, 23.474609375, 24.61474609375, 25.7548828125, 26.89501953125, 28.03515625, 29.17529296875, 30.3154296875, 31.45556640625, 32.595703125, 33.73583984375, 34.8759765625, 36.01611328125, 37.15625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 1.0, 1.0, 6.0, 3.0, 1.0, 5.0, 6.0, 11.0, 6.0, 12.0, 16.0, 19.0, 26.0, 35.0, 36.0, 37.0, 54.0, 78.0, 74.0, 90.0, 81.0, 72.0, 53.0, 66.0, 45.0, 38.0, 26.0, 31.0, 15.0, 10.0, 9.0, 14.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.2255859375, -8.880859375, -8.5361328125, -8.19140625, -7.8466796875, -7.501953125, -7.1572265625, -6.8125, -6.4677734375, -6.123046875, -5.7783203125, -5.43359375, -5.0888671875, -4.744140625, -4.3994140625, -4.0546875, -3.7099609375, -3.365234375, -3.0205078125, -2.67578125, -2.3310546875, -1.986328125, -1.6416015625, -1.296875, -0.9521484375, -0.607421875, -0.2626953125, 0.08203125, 0.4267578125, 0.771484375, 1.1162109375, 1.4609375, 1.8056640625, 2.150390625, 2.4951171875, 2.83984375, 3.1845703125, 3.529296875, 3.8740234375, 4.21875, 4.5634765625, 4.908203125, 5.2529296875, 5.59765625, 5.9423828125, 6.287109375, 6.6318359375, 6.9765625, 7.3212890625, 7.666015625, 8.0107421875, 8.35546875, 8.7001953125, 9.044921875, 9.3896484375, 9.734375, 10.0791015625, 10.423828125, 10.7685546875, 11.11328125, 11.4580078125, 11.802734375, 12.1474609375, 12.4921875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 6.0, 5.0, 16.0, 16.0, 16.0, 27.0, 36.0, 49.0, 40.0, 64.0, 79.0, 87.0, 88.0, 93.0, 77.0, 69.0, 39.0, 57.0, 31.0, 33.0, 15.0, 16.0, 11.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.420326232910156, -33.53227233886719, -32.644222259521484, -31.75617027282715, -30.868118286132812, -29.980066299438477, -29.09201431274414, -28.203962326049805, -27.31591033935547, -26.427858352661133, -25.539806365966797, -24.65175437927246, -23.763702392578125, -22.87565040588379, -21.987598419189453, -21.099546432495117, -20.21149444580078, -19.323442459106445, -18.43539047241211, -17.547338485717773, -16.659286499023438, -15.771234512329102, -14.883182525634766, -13.99513053894043, -13.107078552246094, -12.219026565551758, -11.330974578857422, -10.442922592163086, -9.55487060546875, -8.666818618774414, -7.778766632080078, -6.890714645385742, -6.002662658691406, -5.11461067199707, -4.226558685302734, -3.3385066986083984, -2.4504547119140625, -1.5624027252197266, -0.6743507385253906, 0.2137012481689453, 1.1017532348632812, 1.9898052215576172, 2.877857208251953, 3.765909194946289, 4.653961181640625, 5.542013168334961, 6.430065155029297, 7.318117141723633, 8.206169128417969, 9.094221115112305, 9.98227310180664, 10.870325088500977, 11.758377075195312, 12.646429061889648, 13.534481048583984, 14.42253303527832, 15.310585021972656, 16.198637008666992, 17.086688995361328, 17.974740982055664, 18.86279296875, 19.750844955444336, 20.638896942138672, 21.526948928833008, 22.415000915527344]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 2.0, 5.0, 6.0, 8.0, 10.0, 13.0, 11.0, 17.0, 20.0, 17.0, 23.0, 26.0, 32.0, 28.0, 42.0, 31.0, 48.0, 40.0, 39.0, 57.0, 34.0, 36.0, 47.0, 45.0, 38.0, 38.0, 34.0, 31.0, 45.0, 22.0, 22.0, 31.0, 22.0, 13.0, 21.0, 9.0, 6.0, 13.0, 6.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.10556411743164, -19.556655883789062, -19.007749557495117, -18.45884132385254, -17.909934997558594, -17.361026763916016, -16.812118530273438, -16.263212203979492, -15.714303970336914, -15.165396690368652, -14.61648941040039, -14.067581176757812, -13.51867389678955, -12.969766616821289, -12.420858383178711, -11.87195110321045, -11.323043823242188, -10.774136543273926, -10.225229263305664, -9.676321029663086, -9.127413749694824, -8.578506469726562, -8.029598236083984, -7.480690956115723, -6.931783676147461, -6.382876396179199, -5.833968639373779, -5.285060882568359, -4.736153602600098, -4.187246322631836, -3.638338565826416, -3.089431047439575, -2.540524482727051, -1.99161696434021, -1.4427094459533691, -0.8938019275665283, -0.3448944091796875, 0.20401310920715332, 0.7529206275939941, 1.301828145980835, 1.8507356643676758, 2.3996431827545166, 2.9485507011413574, 3.4974582195281982, 4.046365737915039, 4.595273017883301, 5.144180774688721, 5.693088531494141, 6.241995811462402, 6.790903091430664, 7.339810848236084, 7.888718605041504, 8.437625885009766, 8.986533164978027, 9.535440444946289, 10.084348678588867, 10.633255958557129, 11.18216323852539, 11.731071472167969, 12.27997875213623, 12.828886032104492, 13.377793312072754, 13.926700592041016, 14.475608825683594, 15.024516105651855]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 17.0, 26.0, 17.0, 23.0, 41.0, 46.0, 84.0, 137.0, 203.0, 302.0, 408.0, 657.0, 964.0, 1524.0, 2395.0, 3938.0, 7138.0, 13333.0, 27064.0, 61491.0, 158531.0, 463907.0, 1142940.0, 1320206.0, 626961.0, 212786.0, 78153.0, 33675.0, 15998.0, 8405.0, 4866.0, 2764.0, 1701.0, 1191.0, 757.0, 514.0, 324.0, 233.0, 186.0, 118.0, 84.0, 46.0, 37.0, 28.0, 18.0, 18.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.484375, -23.72265625, -22.9609375, -22.19921875, -21.4375, -20.67578125, -19.9140625, -19.15234375, -18.390625, -17.62890625, -16.8671875, -16.10546875, -15.34375, -14.58203125, -13.8203125, -13.05859375, -12.296875, -11.53515625, -10.7734375, -10.01171875, -9.25, -8.48828125, -7.7265625, -6.96484375, -6.203125, -5.44140625, -4.6796875, -3.91796875, -3.15625, -2.39453125, -1.6328125, -0.87109375, -0.109375, 0.65234375, 1.4140625, 2.17578125, 2.9375, 3.69921875, 4.4609375, 5.22265625, 5.984375, 6.74609375, 7.5078125, 8.26953125, 9.03125, 9.79296875, 10.5546875, 11.31640625, 12.078125, 12.83984375, 13.6015625, 14.36328125, 15.125, 15.88671875, 16.6484375, 17.41015625, 18.171875, 18.93359375, 19.6953125, 20.45703125, 21.21875, 21.98046875, 22.7421875, 23.50390625, 24.265625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 13.0, 10.0, 15.0, 11.0, 20.0, 13.0, 25.0, 27.0, 25.0, 25.0, 34.0, 30.0, 52.0, 45.0, 39.0, 47.0, 45.0, 32.0, 48.0, 38.0, 39.0, 37.0, 35.0, 40.0, 32.0, 35.0, 25.0, 15.0, 31.0, 14.0, 10.0, 21.0, 15.0, 10.0, 10.0, 4.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-13.609375, -13.254150390625, -12.89892578125, -12.543701171875, -12.1884765625, -11.833251953125, -11.47802734375, -11.122802734375, -10.767578125, -10.412353515625, -10.05712890625, -9.701904296875, -9.3466796875, -8.991455078125, -8.63623046875, -8.281005859375, -7.92578125, -7.570556640625, -7.21533203125, -6.860107421875, -6.5048828125, -6.149658203125, -5.79443359375, -5.439208984375, -5.083984375, -4.728759765625, -4.37353515625, -4.018310546875, -3.6630859375, -3.307861328125, -2.95263671875, -2.597412109375, -2.2421875, -1.886962890625, -1.53173828125, -1.176513671875, -0.8212890625, -0.466064453125, -0.11083984375, 0.244384765625, 0.599609375, 0.954833984375, 1.31005859375, 1.665283203125, 2.0205078125, 2.375732421875, 2.73095703125, 3.086181640625, 3.44140625, 3.796630859375, 4.15185546875, 4.507080078125, 4.8623046875, 5.217529296875, 5.57275390625, 5.927978515625, 6.283203125, 6.638427734375, 6.99365234375, 7.348876953125, 7.7041015625, 8.059326171875, 8.41455078125, 8.769775390625, 9.125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 14.0, 24.0, 24.0, 48.0, 69.0, 116.0, 145.0, 250.0, 390.0, 586.0, 915.0, 1375.0, 2298.0, 3767.0, 6473.0, 11448.0, 21063.0, 42234.0, 93501.0, 232140.0, 593061.0, 1161019.0, 1108769.0, 536457.0, 208841.0, 84433.0, 38944.0, 19445.0, 10574.0, 6112.0, 3647.0, 2198.0, 1421.0, 886.0, 545.0, 374.0, 205.0, 151.0, 86.0, 67.0, 54.0, 34.0, 29.0, 12.0, 7.0, 9.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.28125, -20.593505859375, -19.90576171875, -19.218017578125, -18.5302734375, -17.842529296875, -17.15478515625, -16.467041015625, -15.779296875, -15.091552734375, -14.40380859375, -13.716064453125, -13.0283203125, -12.340576171875, -11.65283203125, -10.965087890625, -10.27734375, -9.589599609375, -8.90185546875, -8.214111328125, -7.5263671875, -6.838623046875, -6.15087890625, -5.463134765625, -4.775390625, -4.087646484375, -3.39990234375, -2.712158203125, -2.0244140625, -1.336669921875, -0.64892578125, 0.038818359375, 0.7265625, 1.414306640625, 2.10205078125, 2.789794921875, 3.4775390625, 4.165283203125, 4.85302734375, 5.540771484375, 6.228515625, 6.916259765625, 7.60400390625, 8.291748046875, 8.9794921875, 9.667236328125, 10.35498046875, 11.042724609375, 11.73046875, 12.418212890625, 13.10595703125, 13.793701171875, 14.4814453125, 15.169189453125, 15.85693359375, 16.544677734375, 17.232421875, 17.920166015625, 18.60791015625, 19.295654296875, 19.9833984375, 20.671142578125, 21.35888671875, 22.046630859375, 22.734375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 7.0, 9.0, 10.0, 13.0, 16.0, 29.0, 25.0, 40.0, 49.0, 72.0, 89.0, 91.0, 125.0, 167.0, 229.0, 245.0, 266.0, 285.0, 343.0, 304.0, 297.0, 265.0, 244.0, 192.0, 160.0, 120.0, 87.0, 75.0, 53.0, 31.0, 44.0, 20.0, 13.0, 20.0, 7.0, 7.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.05078125, -6.83477783203125, -6.6187744140625, -6.40277099609375, -6.186767578125, -5.97076416015625, -5.7547607421875, -5.53875732421875, -5.32275390625, -5.10675048828125, -4.8907470703125, -4.67474365234375, -4.458740234375, -4.24273681640625, -4.0267333984375, -3.81072998046875, -3.5947265625, -3.37872314453125, -3.1627197265625, -2.94671630859375, -2.730712890625, -2.51470947265625, -2.2987060546875, -2.08270263671875, -1.86669921875, -1.65069580078125, -1.4346923828125, -1.21868896484375, -1.002685546875, -0.78668212890625, -0.5706787109375, -0.35467529296875, -0.138671875, 0.07733154296875, 0.2933349609375, 0.50933837890625, 0.725341796875, 0.94134521484375, 1.1573486328125, 1.37335205078125, 1.58935546875, 1.80535888671875, 2.0213623046875, 2.23736572265625, 2.453369140625, 2.66937255859375, 2.8853759765625, 3.10137939453125, 3.3173828125, 3.53338623046875, 3.7493896484375, 3.96539306640625, 4.181396484375, 4.39739990234375, 4.6134033203125, 4.82940673828125, 5.04541015625, 5.26141357421875, 5.4774169921875, 5.69342041015625, 5.909423828125, 6.12542724609375, 6.3414306640625, 6.55743408203125, 6.7734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 7.0, 4.0, 9.0, 16.0, 22.0, 33.0, 40.0, 34.0, 39.0, 80.0, 74.0, 108.0, 100.0, 87.0, 68.0, 58.0, 55.0, 39.0, 24.0, 24.0, 16.0, 11.0, 10.0, 5.0, 4.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.15639877319336, -24.414915084838867, -23.673431396484375, -22.93194580078125, -22.190462112426758, -21.448978424072266, -20.70749282836914, -19.96600914001465, -19.224525451660156, -18.483041763305664, -17.741558074951172, -17.000072479248047, -16.258588790893555, -15.517105102539062, -14.775620460510254, -14.034135818481445, -13.292652130126953, -12.551168441772461, -11.809683799743652, -11.068199157714844, -10.326715469360352, -9.58523178100586, -8.84374713897705, -8.102262496948242, -7.36077880859375, -6.6192946434021, -5.877810478210449, -5.136326313018799, -4.394842147827148, -3.653357982635498, -2.9118738174438477, -2.1703896522521973, -1.4289073944091797, -0.6874232292175293, 0.054060935974121094, 0.7955451011657715, 1.5370292663574219, 2.2785134315490723, 3.0199975967407227, 3.761481761932373, 4.502965927124023, 5.244450092315674, 5.985934257507324, 6.727418422698975, 7.468902587890625, 8.210386276245117, 8.951870918273926, 9.693355560302734, 10.434839248657227, 11.176322937011719, 11.917807579040527, 12.659292221069336, 13.400775909423828, 14.14225959777832, 14.883744239807129, 15.625228881835938, 16.36671257019043, 17.108196258544922, 17.849681854248047, 18.59116554260254, 19.33264923095703, 20.074132919311523, 20.815616607666016, 21.55710220336914, 22.298585891723633]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 5.0, 9.0, 13.0, 19.0, 11.0, 20.0, 28.0, 26.0, 23.0, 22.0, 28.0, 27.0, 34.0, 39.0, 41.0, 31.0, 48.0, 51.0, 38.0, 38.0, 48.0, 41.0, 48.0, 28.0, 32.0, 44.0, 29.0, 25.0, 22.0, 19.0, 20.0, 14.0, 15.0, 12.0, 8.0, 5.0, 5.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-16.193523406982422, -15.731340408325195, -15.269157409667969, -14.806974411010742, -14.3447904586792, -13.882607460021973, -13.420424461364746, -12.95824146270752, -12.496057510375977, -12.03387451171875, -11.571691513061523, -11.109508514404297, -10.647324562072754, -10.185141563415527, -9.7229585647583, -9.260775566101074, -8.798592567443848, -8.336409568786621, -7.874226093292236, -7.41204309463501, -6.949859619140625, -6.487676620483398, -6.025493621826172, -5.563310623168945, -5.1011271476745605, -4.638944149017334, -4.176760673522949, -3.7145776748657227, -3.252394437789917, -2.7902112007141113, -2.3280282020568848, -1.865844964981079, -1.4036626815795898, -0.941479504108429, -0.47929632663726807, -0.017113208770751953, 0.4450700283050537, 0.9072532653808594, 1.369436264038086, 1.8316195011138916, 2.2938027381896973, 2.755985975265503, 3.2181692123413086, 3.680352210998535, 4.142535209655762, 4.6047186851501465, 5.066901683807373, 5.529085159301758, 5.991268157958984, 6.453451156616211, 6.915634632110596, 7.377817630767822, 7.840001106262207, 8.302184104919434, 8.76436710357666, 9.226550102233887, 9.68873405456543, 10.150917053222656, 10.613100051879883, 11.07528305053711, 11.537467002868652, 11.999650001525879, 12.461833000183105, 12.924015998840332, 13.386198997497559]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 7.0, 7.0, 13.0, 8.0, 27.0, 19.0, 45.0, 45.0, 94.0, 113.0, 171.0, 241.0, 379.0, 484.0, 740.0, 1049.0, 1469.0, 2168.0, 3337.0, 5162.0, 8477.0, 14347.0, 26150.0, 49458.0, 98889.0, 189055.0, 254284.0, 184469.0, 96183.0, 48427.0, 25462.0, 14199.0, 8366.0, 5100.0, 3251.0, 2212.0, 1419.0, 963.0, 669.0, 517.0, 311.0, 238.0, 158.0, 105.0, 83.0, 69.0, 41.0, 28.0, 17.0, 17.0, 4.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-18.546875, -17.975830078125, -17.40478515625, -16.833740234375, -16.2626953125, -15.691650390625, -15.12060546875, -14.549560546875, -13.978515625, -13.407470703125, -12.83642578125, -12.265380859375, -11.6943359375, -11.123291015625, -10.55224609375, -9.981201171875, -9.41015625, -8.839111328125, -8.26806640625, -7.697021484375, -7.1259765625, -6.554931640625, -5.98388671875, -5.412841796875, -4.841796875, -4.270751953125, -3.69970703125, -3.128662109375, -2.5576171875, -1.986572265625, -1.41552734375, -0.844482421875, -0.2734375, 0.297607421875, 0.86865234375, 1.439697265625, 2.0107421875, 2.581787109375, 3.15283203125, 3.723876953125, 4.294921875, 4.865966796875, 5.43701171875, 6.008056640625, 6.5791015625, 7.150146484375, 7.72119140625, 8.292236328125, 8.86328125, 9.434326171875, 10.00537109375, 10.576416015625, 11.1474609375, 11.718505859375, 12.28955078125, 12.860595703125, 13.431640625, 14.002685546875, 14.57373046875, 15.144775390625, 15.7158203125, 16.286865234375, 16.85791015625, 17.428955078125, 18.0]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 6.0, 5.0, 13.0, 8.0, 14.0, 20.0, 20.0, 26.0, 21.0, 17.0, 22.0, 37.0, 37.0, 23.0, 43.0, 52.0, 46.0, 52.0, 37.0, 48.0, 49.0, 50.0, 39.0, 27.0, 38.0, 40.0, 29.0, 34.0, 20.0, 24.0, 21.0, 15.0, 18.0, 10.0, 6.0, 5.0, 6.0, 8.0, 3.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.40625, -16.90478515625, -16.4033203125, -15.90185546875, -15.400390625, -14.89892578125, -14.3974609375, -13.89599609375, -13.39453125, -12.89306640625, -12.3916015625, -11.89013671875, -11.388671875, -10.88720703125, -10.3857421875, -9.88427734375, -9.3828125, -8.88134765625, -8.3798828125, -7.87841796875, -7.376953125, -6.87548828125, -6.3740234375, -5.87255859375, -5.37109375, -4.86962890625, -4.3681640625, -3.86669921875, -3.365234375, -2.86376953125, -2.3623046875, -1.86083984375, -1.359375, -0.85791015625, -0.3564453125, 0.14501953125, 0.646484375, 1.14794921875, 1.6494140625, 2.15087890625, 2.65234375, 3.15380859375, 3.6552734375, 4.15673828125, 4.658203125, 5.15966796875, 5.6611328125, 6.16259765625, 6.6640625, 7.16552734375, 7.6669921875, 8.16845703125, 8.669921875, 9.17138671875, 9.6728515625, 10.17431640625, 10.67578125, 11.17724609375, 11.6787109375, 12.18017578125, 12.681640625, 13.18310546875, 13.6845703125, 14.18603515625, 14.6875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 8.0, 8.0, 7.0, 7.0, 20.0, 23.0, 27.0, 48.0, 56.0, 79.0, 119.0, 181.0, 255.0, 383.0, 505.0, 754.0, 1203.0, 1893.0, 3101.0, 5299.0, 9433.0, 18260.0, 39359.0, 97074.0, 264596.0, 351411.0, 146086.0, 55039.0, 24397.0, 12149.0, 6367.0, 3818.0, 2276.0, 1414.0, 962.0, 601.0, 397.0, 281.0, 192.0, 140.0, 81.0, 73.0, 51.0, 34.0, 21.0, 20.0, 14.0, 14.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-23.703125, -22.967041015625, -22.23095703125, -21.494873046875, -20.7587890625, -20.022705078125, -19.28662109375, -18.550537109375, -17.814453125, -17.078369140625, -16.34228515625, -15.606201171875, -14.8701171875, -14.134033203125, -13.39794921875, -12.661865234375, -11.92578125, -11.189697265625, -10.45361328125, -9.717529296875, -8.9814453125, -8.245361328125, -7.50927734375, -6.773193359375, -6.037109375, -5.301025390625, -4.56494140625, -3.828857421875, -3.0927734375, -2.356689453125, -1.62060546875, -0.884521484375, -0.1484375, 0.587646484375, 1.32373046875, 2.059814453125, 2.7958984375, 3.531982421875, 4.26806640625, 5.004150390625, 5.740234375, 6.476318359375, 7.21240234375, 7.948486328125, 8.6845703125, 9.420654296875, 10.15673828125, 10.892822265625, 11.62890625, 12.364990234375, 13.10107421875, 13.837158203125, 14.5732421875, 15.309326171875, 16.04541015625, 16.781494140625, 17.517578125, 18.253662109375, 18.98974609375, 19.725830078125, 20.4619140625, 21.197998046875, 21.93408203125, 22.670166015625, 23.40625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 12.0, 7.0, 10.0, 13.0, 7.0, 25.0, 24.0, 23.0, 27.0, 28.0, 39.0, 29.0, 29.0, 47.0, 46.0, 56.0, 45.0, 50.0, 38.0, 49.0, 47.0, 46.0, 49.0, 34.0, 36.0, 38.0, 25.0, 20.0, 24.0, 12.0, 14.0, 14.0, 6.0, 7.0, 4.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.4453125, -10.12353515625, -9.8017578125, -9.47998046875, -9.158203125, -8.83642578125, -8.5146484375, -8.19287109375, -7.87109375, -7.54931640625, -7.2275390625, -6.90576171875, -6.583984375, -6.26220703125, -5.9404296875, -5.61865234375, -5.296875, -4.97509765625, -4.6533203125, -4.33154296875, -4.009765625, -3.68798828125, -3.3662109375, -3.04443359375, -2.72265625, -2.40087890625, -2.0791015625, -1.75732421875, -1.435546875, -1.11376953125, -0.7919921875, -0.47021484375, -0.1484375, 0.17333984375, 0.4951171875, 0.81689453125, 1.138671875, 1.46044921875, 1.7822265625, 2.10400390625, 2.42578125, 2.74755859375, 3.0693359375, 3.39111328125, 3.712890625, 4.03466796875, 4.3564453125, 4.67822265625, 5.0, 5.32177734375, 5.6435546875, 5.96533203125, 6.287109375, 6.60888671875, 6.9306640625, 7.25244140625, 7.57421875, 7.89599609375, 8.2177734375, 8.53955078125, 8.861328125, 9.18310546875, 9.5048828125, 9.82666015625, 10.1484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 2.0, 10.0, 17.0, 18.0, 30.0, 39.0, 37.0, 72.0, 80.0, 124.0, 166.0, 262.0, 311.0, 440.0, 668.0, 956.0, 1396.0, 2482.0, 4184.0, 7978.0, 17077.0, 41000.0, 121540.0, 397920.0, 302357.0, 87510.0, 31904.0, 13536.0, 6663.0, 3533.0, 2030.0, 1334.0, 803.0, 609.0, 395.0, 319.0, 216.0, 134.0, 111.0, 80.0, 50.0, 45.0, 33.0, 20.0, 16.0, 13.0, 7.0, 11.0, 8.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-16.25, -15.7554931640625, -15.260986328125, -14.7664794921875, -14.27197265625, -13.7774658203125, -13.282958984375, -12.7884521484375, -12.2939453125, -11.7994384765625, -11.304931640625, -10.8104248046875, -10.31591796875, -9.8214111328125, -9.326904296875, -8.8323974609375, -8.337890625, -7.8433837890625, -7.348876953125, -6.8543701171875, -6.35986328125, -5.8653564453125, -5.370849609375, -4.8763427734375, -4.3818359375, -3.8873291015625, -3.392822265625, -2.8983154296875, -2.40380859375, -1.9093017578125, -1.414794921875, -0.9202880859375, -0.42578125, 0.0687255859375, 0.563232421875, 1.0577392578125, 1.55224609375, 2.0467529296875, 2.541259765625, 3.0357666015625, 3.5302734375, 4.0247802734375, 4.519287109375, 5.0137939453125, 5.50830078125, 6.0028076171875, 6.497314453125, 6.9918212890625, 7.486328125, 7.9808349609375, 8.475341796875, 8.9698486328125, 9.46435546875, 9.9588623046875, 10.453369140625, 10.9478759765625, 11.4423828125, 11.9368896484375, 12.431396484375, 12.9259033203125, 13.42041015625, 13.9149169921875, 14.409423828125, 14.9039306640625, 15.3984375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 11.0, 12.0, 15.0, 21.0, 69.0, 107.0, 169.0, 241.0, 169.0, 74.0, 35.0, 20.0, 13.0, 11.0, 4.0, 5.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018768310546875, -0.0018237382173538208, -0.0017706453800201416, -0.0017175525426864624, -0.0016644597053527832, -0.001611366868019104, -0.0015582740306854248, -0.0015051811933517456, -0.0014520883560180664, -0.0013989955186843872, -0.001345902681350708, -0.0012928098440170288, -0.0012397170066833496, -0.0011866241693496704, -0.0011335313320159912, -0.001080438494682312, -0.0010273456573486328, -0.0009742528200149536, -0.0009211599826812744, -0.0008680671453475952, -0.000814974308013916, -0.0007618814706802368, -0.0007087886333465576, -0.0006556957960128784, -0.0006026029586791992, -0.00054951012134552, -0.0004964172840118408, -0.0004433244466781616, -0.0003902316093444824, -0.0003371387720108032, -0.000284045934677124, -0.00023095309734344482, -0.00017786026000976562, -0.00012476742267608643, -7.167458534240723e-05, -1.8581748008728027e-05, 3.451108932495117e-05, 8.760392665863037e-05, 0.00014069676399230957, 0.00019378960132598877, 0.00024688243865966797, 0.00029997527599334717, 0.00035306811332702637, 0.00040616095066070557, 0.00045925378799438477, 0.000512346625328064, 0.0005654394626617432, 0.0006185322999954224, 0.0006716251373291016, 0.0007247179746627808, 0.00077781081199646, 0.0008309036493301392, 0.0008839964866638184, 0.0009370893239974976, 0.0009901821613311768, 0.001043274998664856, 0.0010963678359985352, 0.0011494606733322144, 0.0012025535106658936, 0.0012556463479995728, 0.001308739185333252, 0.0013618320226669312, 0.0014149248600006104, 0.0014680176973342896, 0.0015211105346679688]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 5.0, 8.0, 8.0, 15.0, 25.0, 30.0, 56.0, 64.0, 95.0, 186.0, 223.0, 370.0, 590.0, 1017.0, 1801.0, 3408.0, 6943.0, 16841.0, 45391.0, 141753.0, 382272.0, 295516.0, 95897.0, 31941.0, 12263.0, 5395.0, 2658.0, 1505.0, 830.0, 522.0, 311.0, 222.0, 105.0, 89.0, 55.0, 44.0, 33.0, 17.0, 14.0, 12.0, 6.0, 3.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.96875, -16.451904296875, -15.93505859375, -15.418212890625, -14.9013671875, -14.384521484375, -13.86767578125, -13.350830078125, -12.833984375, -12.317138671875, -11.80029296875, -11.283447265625, -10.7666015625, -10.249755859375, -9.73291015625, -9.216064453125, -8.69921875, -8.182373046875, -7.66552734375, -7.148681640625, -6.6318359375, -6.114990234375, -5.59814453125, -5.081298828125, -4.564453125, -4.047607421875, -3.53076171875, -3.013916015625, -2.4970703125, -1.980224609375, -1.46337890625, -0.946533203125, -0.4296875, 0.087158203125, 0.60400390625, 1.120849609375, 1.6376953125, 2.154541015625, 2.67138671875, 3.188232421875, 3.705078125, 4.221923828125, 4.73876953125, 5.255615234375, 5.7724609375, 6.289306640625, 6.80615234375, 7.322998046875, 7.83984375, 8.356689453125, 8.87353515625, 9.390380859375, 9.9072265625, 10.424072265625, 10.94091796875, 11.457763671875, 11.974609375, 12.491455078125, 13.00830078125, 13.525146484375, 14.0419921875, 14.558837890625, 15.07568359375, 15.592529296875, 16.109375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 8.0, 9.0, 16.0, 6.0, 17.0, 23.0, 28.0, 47.0, 55.0, 52.0, 61.0, 72.0, 77.0, 72.0, 77.0, 80.0, 52.0, 52.0, 45.0, 32.0, 23.0, 15.0, 11.0, 17.0, 16.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.85546875, -3.7276611328125, -3.599853515625, -3.4720458984375, -3.34423828125, -3.2164306640625, -3.088623046875, -2.9608154296875, -2.8330078125, -2.7052001953125, -2.577392578125, -2.4495849609375, -2.32177734375, -2.1939697265625, -2.066162109375, -1.9383544921875, -1.810546875, -1.6827392578125, -1.554931640625, -1.4271240234375, -1.29931640625, -1.1715087890625, -1.043701171875, -0.9158935546875, -0.7880859375, -0.6602783203125, -0.532470703125, -0.4046630859375, -0.27685546875, -0.1490478515625, -0.021240234375, 0.1065673828125, 0.234375, 0.3621826171875, 0.489990234375, 0.6177978515625, 0.74560546875, 0.8734130859375, 1.001220703125, 1.1290283203125, 1.2568359375, 1.3846435546875, 1.512451171875, 1.6402587890625, 1.76806640625, 1.8958740234375, 2.023681640625, 2.1514892578125, 2.279296875, 2.4071044921875, 2.534912109375, 2.6627197265625, 2.79052734375, 2.9183349609375, 3.046142578125, 3.1739501953125, 3.3017578125, 3.4295654296875, 3.557373046875, 3.6851806640625, 3.81298828125, 3.9407958984375, 4.068603515625, 4.1964111328125, 4.32421875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 5.0, 12.0, 18.0, 27.0, 20.0, 30.0, 40.0, 53.0, 69.0, 88.0, 98.0, 88.0, 79.0, 76.0, 58.0, 61.0, 32.0, 29.0, 29.0, 19.0, 15.0, 7.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.597742080688477, -22.88474464416504, -22.1717472076416, -21.458749771118164, -20.745752334594727, -20.03275489807129, -19.31975746154785, -18.606760025024414, -17.893762588500977, -17.18076515197754, -16.4677677154541, -15.754770278930664, -15.041772842407227, -14.328775405883789, -13.615777969360352, -12.902780532836914, -12.189783096313477, -11.476785659790039, -10.763788223266602, -10.050790786743164, -9.337793350219727, -8.624795913696289, -7.911798477172852, -7.198801040649414, -6.485803604125977, -5.772806167602539, -5.059808731079102, -4.346811294555664, -3.6338138580322266, -2.920816421508789, -2.2078189849853516, -1.494821548461914, -0.7818260192871094, -0.06882858276367188, 0.6441688537597656, 1.3571662902832031, 2.0701637268066406, 2.783161163330078, 3.4961585998535156, 4.209156036376953, 4.922153472900391, 5.635150909423828, 6.348148345947266, 7.061145782470703, 7.774143218994141, 8.487140655517578, 9.200138092041016, 9.913135528564453, 10.62613296508789, 11.339130401611328, 12.052127838134766, 12.765125274658203, 13.47812271118164, 14.191120147705078, 14.904117584228516, 15.617115020751953, 16.33011245727539, 17.043109893798828, 17.756107330322266, 18.469104766845703, 19.18210220336914, 19.895099639892578, 20.608097076416016, 21.321094512939453, 22.03409194946289]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 13.0, 14.0, 21.0, 20.0, 24.0, 24.0, 35.0, 19.0, 35.0, 22.0, 42.0, 39.0, 31.0, 28.0, 56.0, 38.0, 39.0, 47.0, 45.0, 33.0, 38.0, 39.0, 40.0, 35.0, 30.0, 22.0, 21.0, 24.0, 16.0, 18.0, 15.0, 13.0, 4.0, 5.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-15.475081443786621, -15.032533645629883, -14.589986801147461, -14.147439002990723, -13.704891204833984, -13.262344360351562, -12.819796562194824, -12.377248764038086, -11.934701919555664, -11.492154121398926, -11.049607276916504, -10.607059478759766, -10.164511680603027, -9.721963882446289, -9.279417037963867, -8.836869239807129, -8.39432144165039, -7.9517741203308105, -7.509226322174072, -7.066679000854492, -6.624131202697754, -6.181583881378174, -5.739036560058594, -5.2964887619018555, -4.853941440582275, -4.411394119262695, -3.968846321105957, -3.526298999786377, -3.0837514400482178, -2.6412038803100586, -2.1986565589904785, -1.7561089992523193, -1.3135623931884766, -0.8710148930549622, -0.42846739292144775, 0.014080047607421875, 0.45662760734558105, 0.8991751670837402, 1.3417224884033203, 1.7842700481414795, 2.2268176078796387, 2.669365167617798, 3.111912727355957, 3.554460048675537, 3.9970076084136963, 4.4395551681518555, 4.8821024894714355, 5.324649810791016, 5.767197608947754, 6.209744930267334, 6.652292728424072, 7.094840049743652, 7.537387847900391, 7.979935169219971, 8.42248249053955, 8.865030288696289, 9.307577133178711, 9.75012493133545, 10.192671775817871, 10.63521957397461, 11.077767372131348, 11.520315170288086, 11.962862014770508, 12.405409812927246, 12.847957611083984]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 4.0, 4.0, 13.0, 26.0, 20.0, 45.0, 42.0, 63.0, 61.0, 99.0, 132.0, 160.0, 243.0, 315.0, 509.0, 799.0, 1184.0, 1872.0, 3061.0, 5848.0, 10557.0, 21465.0, 45771.0, 100314.0, 195725.0, 263848.0, 199100.0, 102900.0, 46640.0, 22294.0, 10779.0, 5755.0, 3275.0, 1921.0, 1152.0, 734.0, 541.0, 359.0, 224.0, 195.0, 127.0, 95.0, 71.0, 50.0, 35.0, 28.0, 29.0, 22.0, 17.0, 10.0, 10.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-27.59375, -26.7451171875, -25.896484375, -25.0478515625, -24.19921875, -23.3505859375, -22.501953125, -21.6533203125, -20.8046875, -19.9560546875, -19.107421875, -18.2587890625, -17.41015625, -16.5615234375, -15.712890625, -14.8642578125, -14.015625, -13.1669921875, -12.318359375, -11.4697265625, -10.62109375, -9.7724609375, -8.923828125, -8.0751953125, -7.2265625, -6.3779296875, -5.529296875, -4.6806640625, -3.83203125, -2.9833984375, -2.134765625, -1.2861328125, -0.4375, 0.4111328125, 1.259765625, 2.1083984375, 2.95703125, 3.8056640625, 4.654296875, 5.5029296875, 6.3515625, 7.2001953125, 8.048828125, 8.8974609375, 9.74609375, 10.5947265625, 11.443359375, 12.2919921875, 13.140625, 13.9892578125, 14.837890625, 15.6865234375, 16.53515625, 17.3837890625, 18.232421875, 19.0810546875, 19.9296875, 20.7783203125, 21.626953125, 22.4755859375, 23.32421875, 24.1728515625, 25.021484375, 25.8701171875, 26.71875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 4.0, 12.0, 12.0, 19.0, 18.0, 15.0, 24.0, 25.0, 23.0, 35.0, 40.0, 36.0, 43.0, 36.0, 40.0, 35.0, 49.0, 44.0, 45.0, 32.0, 40.0, 45.0, 37.0, 40.0, 31.0, 28.0, 37.0, 19.0, 30.0, 18.0, 12.0, 12.0, 15.0, 5.0, 6.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.5234375, -15.0849609375, -14.646484375, -14.2080078125, -13.76953125, -13.3310546875, -12.892578125, -12.4541015625, -12.015625, -11.5771484375, -11.138671875, -10.7001953125, -10.26171875, -9.8232421875, -9.384765625, -8.9462890625, -8.5078125, -8.0693359375, -7.630859375, -7.1923828125, -6.75390625, -6.3154296875, -5.876953125, -5.4384765625, -5.0, -4.5615234375, -4.123046875, -3.6845703125, -3.24609375, -2.8076171875, -2.369140625, -1.9306640625, -1.4921875, -1.0537109375, -0.615234375, -0.1767578125, 0.26171875, 0.7001953125, 1.138671875, 1.5771484375, 2.015625, 2.4541015625, 2.892578125, 3.3310546875, 3.76953125, 4.2080078125, 4.646484375, 5.0849609375, 5.5234375, 5.9619140625, 6.400390625, 6.8388671875, 7.27734375, 7.7158203125, 8.154296875, 8.5927734375, 9.03125, 9.4697265625, 9.908203125, 10.3466796875, 10.78515625, 11.2236328125, 11.662109375, 12.1005859375, 12.5390625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 6.0, 6.0, 8.0, 17.0, 29.0, 27.0, 34.0, 65.0, 84.0, 143.0, 163.0, 291.0, 405.0, 557.0, 817.0, 1287.0, 2031.0, 3062.0, 4985.0, 8115.0, 13416.0, 22602.0, 38082.0, 65311.0, 110580.0, 165327.0, 192305.0, 159744.0, 104910.0, 62341.0, 36222.0, 21373.0, 12805.0, 7800.0, 4796.0, 2975.0, 1943.0, 1321.0, 831.0, 539.0, 391.0, 232.0, 185.0, 134.0, 81.0, 51.0, 40.0, 26.0, 20.0, 15.0, 9.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0], "bins": [-17.9375, -17.384765625, -16.83203125, -16.279296875, -15.7265625, -15.173828125, -14.62109375, -14.068359375, -13.515625, -12.962890625, -12.41015625, -11.857421875, -11.3046875, -10.751953125, -10.19921875, -9.646484375, -9.09375, -8.541015625, -7.98828125, -7.435546875, -6.8828125, -6.330078125, -5.77734375, -5.224609375, -4.671875, -4.119140625, -3.56640625, -3.013671875, -2.4609375, -1.908203125, -1.35546875, -0.802734375, -0.25, 0.302734375, 0.85546875, 1.408203125, 1.9609375, 2.513671875, 3.06640625, 3.619140625, 4.171875, 4.724609375, 5.27734375, 5.830078125, 6.3828125, 6.935546875, 7.48828125, 8.041015625, 8.59375, 9.146484375, 9.69921875, 10.251953125, 10.8046875, 11.357421875, 11.91015625, 12.462890625, 13.015625, 13.568359375, 14.12109375, 14.673828125, 15.2265625, 15.779296875, 16.33203125, 16.884765625, 17.4375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 7.0, 13.0, 9.0, 15.0, 15.0, 9.0, 22.0, 18.0, 21.0, 29.0, 32.0, 27.0, 30.0, 21.0, 31.0, 32.0, 37.0, 34.0, 49.0, 37.0, 47.0, 41.0, 31.0, 38.0, 37.0, 36.0, 28.0, 27.0, 31.0, 26.0, 19.0, 27.0, 25.0, 14.0, 18.0, 19.0, 10.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.015625, -8.7208251953125, -8.426025390625, -8.1312255859375, -7.83642578125, -7.5416259765625, -7.246826171875, -6.9520263671875, -6.6572265625, -6.3624267578125, -6.067626953125, -5.7728271484375, -5.47802734375, -5.1832275390625, -4.888427734375, -4.5936279296875, -4.298828125, -4.0040283203125, -3.709228515625, -3.4144287109375, -3.11962890625, -2.8248291015625, -2.530029296875, -2.2352294921875, -1.9404296875, -1.6456298828125, -1.350830078125, -1.0560302734375, -0.76123046875, -0.4664306640625, -0.171630859375, 0.1231689453125, 0.41796875, 0.7127685546875, 1.007568359375, 1.3023681640625, 1.59716796875, 1.8919677734375, 2.186767578125, 2.4815673828125, 2.7763671875, 3.0711669921875, 3.365966796875, 3.6607666015625, 3.95556640625, 4.2503662109375, 4.545166015625, 4.8399658203125, 5.134765625, 5.4295654296875, 5.724365234375, 6.0191650390625, 6.31396484375, 6.6087646484375, 6.903564453125, 7.1983642578125, 7.4931640625, 7.7879638671875, 8.082763671875, 8.3775634765625, 8.67236328125, 8.9671630859375, 9.261962890625, 9.5567626953125, 9.8515625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [5.0, 5.0, 3.0, 4.0, 4.0, 9.0, 17.0, 18.0, 32.0, 44.0, 52.0, 68.0, 99.0, 143.0, 194.0, 265.0, 366.0, 519.0, 806.0, 1179.0, 1709.0, 2660.0, 4481.0, 7652.0, 14512.0, 29513.0, 66009.0, 171962.0, 355987.0, 227123.0, 85712.0, 36576.0, 17437.0, 9200.0, 5056.0, 3110.0, 1895.0, 1289.0, 802.0, 577.0, 426.0, 277.0, 212.0, 145.0, 123.0, 90.0, 58.0, 48.0, 31.0, 19.0, 14.0, 12.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-23.515625, -22.694580078125, -21.87353515625, -21.052490234375, -20.2314453125, -19.410400390625, -18.58935546875, -17.768310546875, -16.947265625, -16.126220703125, -15.30517578125, -14.484130859375, -13.6630859375, -12.842041015625, -12.02099609375, -11.199951171875, -10.37890625, -9.557861328125, -8.73681640625, -7.915771484375, -7.0947265625, -6.273681640625, -5.45263671875, -4.631591796875, -3.810546875, -2.989501953125, -2.16845703125, -1.347412109375, -0.5263671875, 0.294677734375, 1.11572265625, 1.936767578125, 2.7578125, 3.578857421875, 4.39990234375, 5.220947265625, 6.0419921875, 6.863037109375, 7.68408203125, 8.505126953125, 9.326171875, 10.147216796875, 10.96826171875, 11.789306640625, 12.6103515625, 13.431396484375, 14.25244140625, 15.073486328125, 15.89453125, 16.715576171875, 17.53662109375, 18.357666015625, 19.1787109375, 19.999755859375, 20.82080078125, 21.641845703125, 22.462890625, 23.283935546875, 24.10498046875, 24.926025390625, 25.7470703125, 26.568115234375, 27.38916015625, 28.210205078125, 29.03125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 12.0, 8.0, 20.0, 22.0, 21.0, 39.0, 59.0, 67.0, 73.0, 133.0, 101.0, 100.0, 90.0, 66.0, 36.0, 29.0, 25.0, 25.0, 15.0, 13.0, 8.0, 5.0, 0.0, 5.0, 2.0, 9.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023937225341796875, -0.0023223459720611572, -0.002250969409942627, -0.0021795928478240967, -0.0021082162857055664, -0.002036839723587036, -0.001965463161468506, -0.0018940865993499756, -0.0018227100372314453, -0.001751333475112915, -0.0016799569129943848, -0.0016085803508758545, -0.0015372037887573242, -0.001465827226638794, -0.0013944506645202637, -0.0013230741024017334, -0.0012516975402832031, -0.0011803209781646729, -0.0011089444160461426, -0.0010375678539276123, -0.000966191291809082, -0.0008948147296905518, -0.0008234381675720215, -0.0007520616054534912, -0.0006806850433349609, -0.0006093084812164307, -0.0005379319190979004, -0.0004665553569793701, -0.00039517879486083984, -0.00032380223274230957, -0.0002524256706237793, -0.00018104910850524902, -0.00010967254638671875, -3.8295984268188477e-05, 3.30805778503418e-05, 0.00010445713996887207, 0.00017583370208740234, 0.0002472102642059326, 0.0003185868263244629, 0.00038996338844299316, 0.00046133995056152344, 0.0005327165126800537, 0.000604093074798584, 0.0006754696369171143, 0.0007468461990356445, 0.0008182227611541748, 0.0008895993232727051, 0.0009609758853912354, 0.0010323524475097656, 0.001103729009628296, 0.0011751055717468262, 0.0012464821338653564, 0.0013178586959838867, 0.001389235258102417, 0.0014606118202209473, 0.0015319883823394775, 0.0016033649444580078, 0.001674741506576538, 0.0017461180686950684, 0.0018174946308135986, 0.001888871192932129, 0.001960247755050659, 0.0020316243171691895, 0.0021030008792877197, 0.00217437744140625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 3.0, 8.0, 10.0, 19.0, 19.0, 39.0, 62.0, 105.0, 147.0, 228.0, 347.0, 492.0, 829.0, 1361.0, 2085.0, 3634.0, 6224.0, 11860.0, 23215.0, 50154.0, 123925.0, 279000.0, 295279.0, 138737.0, 56226.0, 25025.0, 12776.0, 6832.0, 3786.0, 2298.0, 1347.0, 858.0, 589.0, 346.0, 254.0, 141.0, 101.0, 62.0, 43.0, 26.0, 20.0, 23.0, 12.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.46875, -19.830322265625, -19.19189453125, -18.553466796875, -17.9150390625, -17.276611328125, -16.63818359375, -15.999755859375, -15.361328125, -14.722900390625, -14.08447265625, -13.446044921875, -12.8076171875, -12.169189453125, -11.53076171875, -10.892333984375, -10.25390625, -9.615478515625, -8.97705078125, -8.338623046875, -7.7001953125, -7.061767578125, -6.42333984375, -5.784912109375, -5.146484375, -4.508056640625, -3.86962890625, -3.231201171875, -2.5927734375, -1.954345703125, -1.31591796875, -0.677490234375, -0.0390625, 0.599365234375, 1.23779296875, 1.876220703125, 2.5146484375, 3.153076171875, 3.79150390625, 4.429931640625, 5.068359375, 5.706787109375, 6.34521484375, 6.983642578125, 7.6220703125, 8.260498046875, 8.89892578125, 9.537353515625, 10.17578125, 10.814208984375, 11.45263671875, 12.091064453125, 12.7294921875, 13.367919921875, 14.00634765625, 14.644775390625, 15.283203125, 15.921630859375, 16.56005859375, 17.198486328125, 17.8369140625, 18.475341796875, 19.11376953125, 19.752197265625, 20.390625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 7.0, 15.0, 27.0, 19.0, 17.0, 26.0, 39.0, 43.0, 54.0, 52.0, 65.0, 82.0, 80.0, 68.0, 71.0, 55.0, 51.0, 29.0, 32.0, 25.0, 16.0, 16.0, 20.0, 18.0, 10.0, 8.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.61236572265625, -5.4278564453125, -5.24334716796875, -5.058837890625, -4.87432861328125, -4.6898193359375, -4.50531005859375, -4.32080078125, -4.13629150390625, -3.9517822265625, -3.76727294921875, -3.582763671875, -3.39825439453125, -3.2137451171875, -3.02923583984375, -2.8447265625, -2.66021728515625, -2.4757080078125, -2.29119873046875, -2.106689453125, -1.92218017578125, -1.7376708984375, -1.55316162109375, -1.36865234375, -1.18414306640625, -0.9996337890625, -0.81512451171875, -0.630615234375, -0.44610595703125, -0.2615966796875, -0.07708740234375, 0.107421875, 0.29193115234375, 0.4764404296875, 0.66094970703125, 0.845458984375, 1.02996826171875, 1.2144775390625, 1.39898681640625, 1.58349609375, 1.76800537109375, 1.9525146484375, 2.13702392578125, 2.321533203125, 2.50604248046875, 2.6905517578125, 2.87506103515625, 3.0595703125, 3.24407958984375, 3.4285888671875, 3.61309814453125, 3.797607421875, 3.98211669921875, 4.1666259765625, 4.35113525390625, 4.53564453125, 4.72015380859375, 4.9046630859375, 5.08917236328125, 5.273681640625, 5.45819091796875, 5.6427001953125, 5.82720947265625, 6.01171875]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 18.0, 20.0, 17.0, 28.0, 40.0, 39.0, 49.0, 58.0, 75.0, 70.0, 94.0, 100.0, 82.0, 55.0, 54.0, 40.0, 29.0, 27.0, 26.0, 7.0, 7.0, 12.0, 10.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.743560791015625, -27.035123825073242, -26.326688766479492, -25.61825180053711, -24.90981674194336, -24.201379776000977, -23.492942810058594, -22.784507751464844, -22.07607078552246, -21.367633819580078, -20.659198760986328, -19.950761795043945, -19.242324829101562, -18.533889770507812, -17.82545280456543, -17.117015838623047, -16.408580780029297, -15.70014476776123, -14.991708755493164, -14.283271789550781, -13.574835777282715, -12.866399765014648, -12.157962799072266, -11.4495267868042, -10.741090774536133, -10.032654762268066, -9.32421875, -8.615781784057617, -7.907345771789551, -7.198909759521484, -6.49047327041626, -5.782036781311035, -5.073600769042969, -4.365164756774902, -3.6567282676696777, -2.9482920169830322, -2.2398557662963867, -1.5314195156097412, -0.8229832649230957, -0.1145467758178711, 0.5938892364501953, 1.3023254871368408, 2.0107617378234863, 2.719197988510132, 3.4276342391967773, 4.136070251464844, 4.844506740570068, 5.552943229675293, 6.261379241943359, 6.969815254211426, 7.67825174331665, 8.386688232421875, 9.095124244689941, 9.803560256958008, 10.51199722290039, 11.220433235168457, 11.928869247436523, 12.63730525970459, 13.345741271972656, 14.054178237915039, 14.762614250183105, 15.471050262451172, 16.179487228393555, 16.887924194335938, 17.596359252929688]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 12.0, 14.0, 6.0, 10.0, 16.0, 15.0, 16.0, 18.0, 28.0, 27.0, 32.0, 28.0, 28.0, 38.0, 43.0, 41.0, 37.0, 36.0, 40.0, 44.0, 48.0, 49.0, 40.0, 41.0, 42.0, 29.0, 40.0, 23.0, 17.0, 13.0, 28.0, 24.0, 12.0, 16.0, 6.0, 9.0, 7.0, 3.0, 9.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.803695678710938, -15.339011192321777, -14.874327659606934, -14.409643173217773, -13.94495964050293, -13.48027515411377, -13.01559066772461, -12.550907135009766, -12.086223602294922, -11.621539115905762, -11.156855583190918, -10.692171096801758, -10.227487564086914, -9.762803077697754, -9.298118591308594, -8.83343505859375, -8.36875057220459, -7.904066562652588, -7.439382553100586, -6.974698066711426, -6.510014533996582, -6.045330047607422, -5.58064603805542, -5.115962028503418, -4.651278018951416, -4.186594009399414, -3.721909999847412, -3.257225751876831, -2.792541742324829, -2.327857732772827, -1.863173484802246, -1.3984894752502441, -0.9338045120239258, -0.46912044286727905, -0.004436373710632324, 0.4602477550506592, 0.9249317646026611, 1.389615774154663, 1.8543000221252441, 2.318984031677246, 2.783668041229248, 3.24835205078125, 3.713036060333252, 4.177720069885254, 4.642404556274414, 5.107088088989258, 5.571772575378418, 6.03645658493042, 6.501140594482422, 6.965824604034424, 7.430508613586426, 7.895193099975586, 8.35987663269043, 8.82456111907959, 9.28924560546875, 9.753929138183594, 10.218612670898438, 10.683297157287598, 11.147980690002441, 11.612665176391602, 12.077348709106445, 12.542033195495605, 13.006717681884766, 13.47140121459961, 13.93608570098877]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 5.0, 3.0, 12.0, 12.0, 14.0, 27.0, 28.0, 39.0, 60.0, 89.0, 153.0, 189.0, 297.0, 394.0, 694.0, 928.0, 1618.0, 2307.0, 3748.0, 6259.0, 10538.0, 19411.0, 37819.0, 82547.0, 198401.0, 499195.0, 1033980.0, 1169580.0, 650329.0, 260502.0, 105378.0, 48287.0, 24180.0, 13727.0, 8248.0, 5028.0, 3414.0, 2174.0, 1513.0, 954.0, 665.0, 475.0, 322.0, 239.0, 172.0, 79.0, 87.0, 49.0, 31.0, 19.0, 26.0, 17.0, 12.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-16.359375, -15.81689453125, -15.2744140625, -14.73193359375, -14.189453125, -13.64697265625, -13.1044921875, -12.56201171875, -12.01953125, -11.47705078125, -10.9345703125, -10.39208984375, -9.849609375, -9.30712890625, -8.7646484375, -8.22216796875, -7.6796875, -7.13720703125, -6.5947265625, -6.05224609375, -5.509765625, -4.96728515625, -4.4248046875, -3.88232421875, -3.33984375, -2.79736328125, -2.2548828125, -1.71240234375, -1.169921875, -0.62744140625, -0.0849609375, 0.45751953125, 1.0, 1.54248046875, 2.0849609375, 2.62744140625, 3.169921875, 3.71240234375, 4.2548828125, 4.79736328125, 5.33984375, 5.88232421875, 6.4248046875, 6.96728515625, 7.509765625, 8.05224609375, 8.5947265625, 9.13720703125, 9.6796875, 10.22216796875, 10.7646484375, 11.30712890625, 11.849609375, 12.39208984375, 12.9345703125, 13.47705078125, 14.01953125, 14.56201171875, 15.1044921875, 15.64697265625, 16.189453125, 16.73193359375, 17.2744140625, 17.81689453125, 18.359375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 8.0, 14.0, 6.0, 12.0, 16.0, 13.0, 24.0, 26.0, 29.0, 37.0, 42.0, 25.0, 33.0, 45.0, 46.0, 44.0, 51.0, 49.0, 41.0, 49.0, 36.0, 50.0, 34.0, 50.0, 32.0, 33.0, 16.0, 18.0, 15.0, 29.0, 10.0, 13.0, 11.0, 11.0, 7.0, 6.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.9140625, -10.58740234375, -10.2607421875, -9.93408203125, -9.607421875, -9.28076171875, -8.9541015625, -8.62744140625, -8.30078125, -7.97412109375, -7.6474609375, -7.32080078125, -6.994140625, -6.66748046875, -6.3408203125, -6.01416015625, -5.6875, -5.36083984375, -5.0341796875, -4.70751953125, -4.380859375, -4.05419921875, -3.7275390625, -3.40087890625, -3.07421875, -2.74755859375, -2.4208984375, -2.09423828125, -1.767578125, -1.44091796875, -1.1142578125, -0.78759765625, -0.4609375, -0.13427734375, 0.1923828125, 0.51904296875, 0.845703125, 1.17236328125, 1.4990234375, 1.82568359375, 2.15234375, 2.47900390625, 2.8056640625, 3.13232421875, 3.458984375, 3.78564453125, 4.1123046875, 4.43896484375, 4.765625, 5.09228515625, 5.4189453125, 5.74560546875, 6.072265625, 6.39892578125, 6.7255859375, 7.05224609375, 7.37890625, 7.70556640625, 8.0322265625, 8.35888671875, 8.685546875, 9.01220703125, 9.3388671875, 9.66552734375, 9.9921875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 13.0, 13.0, 20.0, 29.0, 38.0, 56.0, 76.0, 98.0, 151.0, 207.0, 309.0, 505.0, 823.0, 1227.0, 2008.0, 3481.0, 5679.0, 10004.0, 18349.0, 37423.0, 85794.0, 234171.0, 683432.0, 1393427.0, 1067402.0, 399270.0, 137379.0, 54919.0, 25681.0, 13169.0, 7413.0, 4373.0, 2712.0, 1614.0, 994.0, 687.0, 403.0, 269.0, 189.0, 145.0, 105.0, 72.0, 31.0, 30.0, 18.0, 23.0, 16.0, 9.0, 6.0, 6.0, 4.0, 5.0, 0.0, 0.0, 2.0], "bins": [-21.25, -20.60107421875, -19.9521484375, -19.30322265625, -18.654296875, -18.00537109375, -17.3564453125, -16.70751953125, -16.05859375, -15.40966796875, -14.7607421875, -14.11181640625, -13.462890625, -12.81396484375, -12.1650390625, -11.51611328125, -10.8671875, -10.21826171875, -9.5693359375, -8.92041015625, -8.271484375, -7.62255859375, -6.9736328125, -6.32470703125, -5.67578125, -5.02685546875, -4.3779296875, -3.72900390625, -3.080078125, -2.43115234375, -1.7822265625, -1.13330078125, -0.484375, 0.16455078125, 0.8134765625, 1.46240234375, 2.111328125, 2.76025390625, 3.4091796875, 4.05810546875, 4.70703125, 5.35595703125, 6.0048828125, 6.65380859375, 7.302734375, 7.95166015625, 8.6005859375, 9.24951171875, 9.8984375, 10.54736328125, 11.1962890625, 11.84521484375, 12.494140625, 13.14306640625, 13.7919921875, 14.44091796875, 15.08984375, 15.73876953125, 16.3876953125, 17.03662109375, 17.685546875, 18.33447265625, 18.9833984375, 19.63232421875, 20.28125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 15.0, 9.0, 20.0, 30.0, 39.0, 53.0, 53.0, 69.0, 84.0, 100.0, 139.0, 160.0, 219.0, 285.0, 318.0, 344.0, 321.0, 347.0, 291.0, 257.0, 214.0, 164.0, 135.0, 90.0, 66.0, 62.0, 34.0, 24.0, 23.0, 25.0, 10.0, 9.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.37109375, -7.177490234375, -6.98388671875, -6.790283203125, -6.5966796875, -6.403076171875, -6.20947265625, -6.015869140625, -5.822265625, -5.628662109375, -5.43505859375, -5.241455078125, -5.0478515625, -4.854248046875, -4.66064453125, -4.467041015625, -4.2734375, -4.079833984375, -3.88623046875, -3.692626953125, -3.4990234375, -3.305419921875, -3.11181640625, -2.918212890625, -2.724609375, -2.531005859375, -2.33740234375, -2.143798828125, -1.9501953125, -1.756591796875, -1.56298828125, -1.369384765625, -1.17578125, -0.982177734375, -0.78857421875, -0.594970703125, -0.4013671875, -0.207763671875, -0.01416015625, 0.179443359375, 0.373046875, 0.566650390625, 0.76025390625, 0.953857421875, 1.1474609375, 1.341064453125, 1.53466796875, 1.728271484375, 1.921875, 2.115478515625, 2.30908203125, 2.502685546875, 2.6962890625, 2.889892578125, 3.08349609375, 3.277099609375, 3.470703125, 3.664306640625, 3.85791015625, 4.051513671875, 4.2451171875, 4.438720703125, 4.63232421875, 4.825927734375, 5.01953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 6.0, 18.0, 7.0, 21.0, 31.0, 43.0, 56.0, 70.0, 110.0, 117.0, 114.0, 69.0, 118.0, 60.0, 39.0, 30.0, 27.0, 11.0, 14.0, 7.0, 8.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.934629440307617, -29.168359756469727, -28.40209197998047, -27.635822296142578, -26.86955451965332, -26.10328483581543, -25.337017059326172, -24.57074737548828, -23.80447769165039, -23.0382080078125, -22.271940231323242, -21.50567054748535, -20.739402770996094, -19.973133087158203, -19.206863403320312, -18.440595626831055, -17.674327850341797, -16.908058166503906, -16.14179039001465, -15.375520706176758, -14.6092529296875, -13.84298324584961, -13.076714515686035, -12.310445785522461, -11.544177055358887, -10.777908325195312, -10.011639595031738, -9.245370864868164, -8.479101181030273, -7.712832927703857, -6.946563720703125, -6.180294990539551, -5.414026260375977, -4.647757530212402, -3.881488561630249, -3.1152195930480957, -2.3489508628845215, -1.5826821327209473, -0.8164129257202148, -0.050144195556640625, 0.7161245346069336, 1.4823933839797974, 2.248662233352661, 3.0149312019348145, 3.7811999320983887, 4.547468662261963, 5.313737869262695, 6.0800065994262695, 6.846275329589844, 7.612544059753418, 8.378812789916992, 9.145082473754883, 9.91135025024414, 10.677619934082031, 11.443888664245605, 12.21015739440918, 12.976426124572754, 13.742694854736328, 14.508963584899902, 15.275232315063477, 16.041501998901367, 16.807769775390625, 17.574039459228516, 18.340309143066406, 19.106576919555664]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 9.0, 4.0, 5.0, 6.0, 17.0, 20.0, 16.0, 20.0, 30.0, 32.0, 19.0, 32.0, 34.0, 50.0, 35.0, 55.0, 33.0, 49.0, 38.0, 61.0, 48.0, 38.0, 47.0, 31.0, 46.0, 35.0, 29.0, 29.0, 22.0, 23.0, 21.0, 13.0, 12.0, 8.0, 12.0, 10.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.543462753295898, -15.096383094787598, -14.649303436279297, -14.20222282409668, -13.755143165588379, -13.308063507080078, -12.860983848571777, -12.413904190063477, -11.96682357788086, -11.519743919372559, -11.072664260864258, -10.62558364868164, -10.17850399017334, -9.731424331665039, -9.284344673156738, -8.837265014648438, -8.390185356140137, -7.943105697631836, -7.496025562286377, -7.048945903778076, -6.601865768432617, -6.154786109924316, -5.707706451416016, -5.260626792907715, -4.813546657562256, -4.366466999053955, -3.919386863708496, -3.4723072052001953, -3.0252273082733154, -2.5781474113464355, -2.1310677528381348, -1.6839878559112549, -1.2369070053100586, -0.7898271679878235, -0.3427473306655884, 0.10433244705200195, 0.5514123439788818, 0.9984922409057617, 1.4455718994140625, 1.8926517963409424, 2.3397316932678223, 2.786811590194702, 3.233891487121582, 3.680971145629883, 4.128050804138184, 4.575130939483643, 5.022210597991943, 5.469290733337402, 5.916370391845703, 6.363450050354004, 6.810530185699463, 7.257609844207764, 7.704689979553223, 8.151769638061523, 8.598849296569824, 9.045928955078125, 9.493009567260742, 9.940089225769043, 10.387168884277344, 10.834249496459961, 11.281329154968262, 11.728408813476562, 12.175488471984863, 12.622568130493164, 13.069647789001465]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 16.0, 20.0, 36.0, 39.0, 63.0, 98.0, 141.0, 202.0, 346.0, 442.0, 656.0, 1036.0, 1486.0, 2499.0, 3999.0, 6315.0, 10862.0, 18910.0, 34072.0, 62855.0, 115731.0, 188334.0, 219537.0, 165174.0, 95884.0, 51656.0, 27836.0, 15942.0, 9211.0, 5548.0, 3354.0, 2135.0, 1327.0, 945.0, 597.0, 364.0, 294.0, 190.0, 119.0, 89.0, 61.0, 50.0, 29.0, 20.0, 10.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.40625, -10.07421875, -9.7421875, -9.41015625, -9.078125, -8.74609375, -8.4140625, -8.08203125, -7.75, -7.41796875, -7.0859375, -6.75390625, -6.421875, -6.08984375, -5.7578125, -5.42578125, -5.09375, -4.76171875, -4.4296875, -4.09765625, -3.765625, -3.43359375, -3.1015625, -2.76953125, -2.4375, -2.10546875, -1.7734375, -1.44140625, -1.109375, -0.77734375, -0.4453125, -0.11328125, 0.21875, 0.55078125, 0.8828125, 1.21484375, 1.546875, 1.87890625, 2.2109375, 2.54296875, 2.875, 3.20703125, 3.5390625, 3.87109375, 4.203125, 4.53515625, 4.8671875, 5.19921875, 5.53125, 5.86328125, 6.1953125, 6.52734375, 6.859375, 7.19140625, 7.5234375, 7.85546875, 8.1875, 8.51953125, 8.8515625, 9.18359375, 9.515625, 9.84765625, 10.1796875, 10.51171875, 10.84375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 5.0, 4.0, 6.0, 12.0, 11.0, 13.0, 27.0, 26.0, 21.0, 27.0, 31.0, 35.0, 34.0, 38.0, 63.0, 60.0, 41.0, 40.0, 39.0, 53.0, 39.0, 39.0, 40.0, 42.0, 29.0, 41.0, 33.0, 22.0, 19.0, 22.0, 17.0, 13.0, 13.0, 5.0, 9.0, 10.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.0546875, -14.60107421875, -14.1474609375, -13.69384765625, -13.240234375, -12.78662109375, -12.3330078125, -11.87939453125, -11.42578125, -10.97216796875, -10.5185546875, -10.06494140625, -9.611328125, -9.15771484375, -8.7041015625, -8.25048828125, -7.796875, -7.34326171875, -6.8896484375, -6.43603515625, -5.982421875, -5.52880859375, -5.0751953125, -4.62158203125, -4.16796875, -3.71435546875, -3.2607421875, -2.80712890625, -2.353515625, -1.89990234375, -1.4462890625, -0.99267578125, -0.5390625, -0.08544921875, 0.3681640625, 0.82177734375, 1.275390625, 1.72900390625, 2.1826171875, 2.63623046875, 3.08984375, 3.54345703125, 3.9970703125, 4.45068359375, 4.904296875, 5.35791015625, 5.8115234375, 6.26513671875, 6.71875, 7.17236328125, 7.6259765625, 8.07958984375, 8.533203125, 8.98681640625, 9.4404296875, 9.89404296875, 10.34765625, 10.80126953125, 11.2548828125, 11.70849609375, 12.162109375, 12.61572265625, 13.0693359375, 13.52294921875, 13.9765625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 3.0, 9.0, 8.0, 10.0, 6.0, 17.0, 15.0, 17.0, 39.0, 35.0, 64.0, 71.0, 122.0, 134.0, 200.0, 281.0, 426.0, 587.0, 875.0, 1360.0, 2026.0, 3382.0, 5347.0, 9272.0, 16801.0, 31691.0, 64571.0, 135151.0, 252105.0, 251304.0, 135500.0, 64379.0, 31650.0, 16619.0, 9231.0, 5486.0, 3276.0, 2095.0, 1365.0, 872.0, 589.0, 454.0, 275.0, 238.0, 163.0, 118.0, 86.0, 52.0, 41.0, 42.0, 16.0, 23.0, 20.0, 8.0, 9.0, 7.0, 6.0, 6.0, 4.0, 4.0, 1.0], "bins": [-12.1796875, -11.799072265625, -11.41845703125, -11.037841796875, -10.6572265625, -10.276611328125, -9.89599609375, -9.515380859375, -9.134765625, -8.754150390625, -8.37353515625, -7.992919921875, -7.6123046875, -7.231689453125, -6.85107421875, -6.470458984375, -6.08984375, -5.709228515625, -5.32861328125, -4.947998046875, -4.5673828125, -4.186767578125, -3.80615234375, -3.425537109375, -3.044921875, -2.664306640625, -2.28369140625, -1.903076171875, -1.5224609375, -1.141845703125, -0.76123046875, -0.380615234375, 0.0, 0.380615234375, 0.76123046875, 1.141845703125, 1.5224609375, 1.903076171875, 2.28369140625, 2.664306640625, 3.044921875, 3.425537109375, 3.80615234375, 4.186767578125, 4.5673828125, 4.947998046875, 5.32861328125, 5.709228515625, 6.08984375, 6.470458984375, 6.85107421875, 7.231689453125, 7.6123046875, 7.992919921875, 8.37353515625, 8.754150390625, 9.134765625, 9.515380859375, 9.89599609375, 10.276611328125, 10.6572265625, 11.037841796875, 11.41845703125, 11.799072265625, 12.1796875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 6.0, 9.0, 9.0, 11.0, 11.0, 14.0, 12.0, 29.0, 19.0, 25.0, 26.0, 34.0, 27.0, 28.0, 29.0, 34.0, 48.0, 34.0, 61.0, 35.0, 51.0, 31.0, 39.0, 42.0, 36.0, 31.0, 27.0, 33.0, 35.0, 37.0, 23.0, 19.0, 11.0, 17.0, 21.0, 12.0, 4.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.2813720703125, -7.015869140625, -6.7503662109375, -6.48486328125, -6.2193603515625, -5.953857421875, -5.6883544921875, -5.4228515625, -5.1573486328125, -4.891845703125, -4.6263427734375, -4.36083984375, -4.0953369140625, -3.829833984375, -3.5643310546875, -3.298828125, -3.0333251953125, -2.767822265625, -2.5023193359375, -2.23681640625, -1.9713134765625, -1.705810546875, -1.4403076171875, -1.1748046875, -0.9093017578125, -0.643798828125, -0.3782958984375, -0.11279296875, 0.1527099609375, 0.418212890625, 0.6837158203125, 0.94921875, 1.2147216796875, 1.480224609375, 1.7457275390625, 2.01123046875, 2.2767333984375, 2.542236328125, 2.8077392578125, 3.0732421875, 3.3387451171875, 3.604248046875, 3.8697509765625, 4.13525390625, 4.4007568359375, 4.666259765625, 4.9317626953125, 5.197265625, 5.4627685546875, 5.728271484375, 5.9937744140625, 6.25927734375, 6.5247802734375, 6.790283203125, 7.0557861328125, 7.3212890625, 7.5867919921875, 7.852294921875, 8.1177978515625, 8.38330078125, 8.6488037109375, 8.914306640625, 9.1798095703125, 9.4453125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 13.0, 11.0, 12.0, 17.0, 32.0, 46.0, 58.0, 92.0, 160.0, 180.0, 270.0, 491.0, 807.0, 1344.0, 2444.0, 4869.0, 10488.0, 26145.0, 76071.0, 258401.0, 431373.0, 154381.0, 47594.0, 17528.0, 7514.0, 3506.0, 1852.0, 1024.0, 610.0, 392.0, 254.0, 185.0, 114.0, 82.0, 55.0, 42.0, 27.0, 14.0, 13.0, 17.0, 5.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.46875, -11.124267578125, -10.77978515625, -10.435302734375, -10.0908203125, -9.746337890625, -9.40185546875, -9.057373046875, -8.712890625, -8.368408203125, -8.02392578125, -7.679443359375, -7.3349609375, -6.990478515625, -6.64599609375, -6.301513671875, -5.95703125, -5.612548828125, -5.26806640625, -4.923583984375, -4.5791015625, -4.234619140625, -3.89013671875, -3.545654296875, -3.201171875, -2.856689453125, -2.51220703125, -2.167724609375, -1.8232421875, -1.478759765625, -1.13427734375, -0.789794921875, -0.4453125, -0.100830078125, 0.24365234375, 0.588134765625, 0.9326171875, 1.277099609375, 1.62158203125, 1.966064453125, 2.310546875, 2.655029296875, 2.99951171875, 3.343994140625, 3.6884765625, 4.032958984375, 4.37744140625, 4.721923828125, 5.06640625, 5.410888671875, 5.75537109375, 6.099853515625, 6.4443359375, 6.788818359375, 7.13330078125, 7.477783203125, 7.822265625, 8.166748046875, 8.51123046875, 8.855712890625, 9.2001953125, 9.544677734375, 9.88916015625, 10.233642578125, 10.578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 9.0, 9.0, 11.0, 10.0, 27.0, 24.0, 31.0, 58.0, 73.0, 88.0, 122.0, 113.0, 111.0, 82.0, 50.0, 47.0, 37.0, 19.0, 19.0, 12.0, 10.0, 4.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005164146423339844, -0.0005009956657886505, -0.00048557668924331665, -0.0004701577126979828, -0.0004547387361526489, -0.00043931975960731506, -0.0004239007830619812, -0.00040848180651664734, -0.0003930628299713135, -0.0003776438534259796, -0.00036222487688064575, -0.0003468059003353119, -0.00033138692378997803, -0.00031596794724464417, -0.0003005489706993103, -0.00028512999415397644, -0.0002697110176086426, -0.0002542920410633087, -0.00023887306451797485, -0.000223454087972641, -0.00020803511142730713, -0.00019261613488197327, -0.0001771971583366394, -0.00016177818179130554, -0.00014635920524597168, -0.00013094022870063782, -0.00011552125215530396, -0.00010010227560997009, -8.468329906463623e-05, -6.926432251930237e-05, -5.3845345973968506e-05, -3.8426369428634644e-05, -2.300739288330078e-05, -7.588416337966919e-06, 7.830560207366943e-06, 2.3249536752700806e-05, 3.866851329803467e-05, 5.408748984336853e-05, 6.950646638870239e-05, 8.492544293403625e-05, 0.00010034441947937012, 0.00011576339602470398, 0.00013118237257003784, 0.0001466013491153717, 0.00016202032566070557, 0.00017743930220603943, 0.0001928582787513733, 0.00020827725529670715, 0.00022369623184204102, 0.00023911520838737488, 0.00025453418493270874, 0.0002699531614780426, 0.00028537213802337646, 0.00030079111456871033, 0.0003162100911140442, 0.00033162906765937805, 0.0003470480442047119, 0.0003624670207500458, 0.00037788599729537964, 0.0003933049738407135, 0.00040872395038604736, 0.0004241429269313812, 0.0004395619034767151, 0.00045498088002204895, 0.0004703998565673828]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 12.0, 16.0, 19.0, 32.0, 72.0, 74.0, 121.0, 178.0, 298.0, 445.0, 667.0, 1094.0, 1887.0, 3534.0, 7021.0, 15322.0, 37000.0, 101098.0, 283413.0, 357514.0, 147192.0, 51466.0, 20510.0, 9288.0, 4405.0, 2320.0, 1316.0, 783.0, 481.0, 328.0, 212.0, 137.0, 90.0, 63.0, 44.0, 15.0, 22.0, 10.0, 9.0, 4.0, 10.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.484375, -9.1700439453125, -8.855712890625, -8.5413818359375, -8.22705078125, -7.9127197265625, -7.598388671875, -7.2840576171875, -6.9697265625, -6.6553955078125, -6.341064453125, -6.0267333984375, -5.71240234375, -5.3980712890625, -5.083740234375, -4.7694091796875, -4.455078125, -4.1407470703125, -3.826416015625, -3.5120849609375, -3.19775390625, -2.8834228515625, -2.569091796875, -2.2547607421875, -1.9404296875, -1.6260986328125, -1.311767578125, -0.9974365234375, -0.68310546875, -0.3687744140625, -0.054443359375, 0.2598876953125, 0.57421875, 0.8885498046875, 1.202880859375, 1.5172119140625, 1.83154296875, 2.1458740234375, 2.460205078125, 2.7745361328125, 3.0888671875, 3.4031982421875, 3.717529296875, 4.0318603515625, 4.34619140625, 4.6605224609375, 4.974853515625, 5.2891845703125, 5.603515625, 5.9178466796875, 6.232177734375, 6.5465087890625, 6.86083984375, 7.1751708984375, 7.489501953125, 7.8038330078125, 8.1181640625, 8.4324951171875, 8.746826171875, 9.0611572265625, 9.37548828125, 9.6898193359375, 10.004150390625, 10.3184814453125, 10.6328125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 2.0, 6.0, 9.0, 8.0, 12.0, 13.0, 20.0, 32.0, 34.0, 43.0, 50.0, 55.0, 73.0, 57.0, 75.0, 83.0, 80.0, 72.0, 51.0, 50.0, 47.0, 24.0, 19.0, 23.0, 16.0, 9.0, 11.0, 3.0, 3.0, 6.0, 1.0, 4.0, 0.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.9661865234375, -2.860107421875, -2.7540283203125, -2.64794921875, -2.5418701171875, -2.435791015625, -2.3297119140625, -2.2236328125, -2.1175537109375, -2.011474609375, -1.9053955078125, -1.79931640625, -1.6932373046875, -1.587158203125, -1.4810791015625, -1.375, -1.2689208984375, -1.162841796875, -1.0567626953125, -0.95068359375, -0.8446044921875, -0.738525390625, -0.6324462890625, -0.5263671875, -0.4202880859375, -0.314208984375, -0.2081298828125, -0.10205078125, 0.0040283203125, 0.110107421875, 0.2161865234375, 0.322265625, 0.4283447265625, 0.534423828125, 0.6405029296875, 0.74658203125, 0.8526611328125, 0.958740234375, 1.0648193359375, 1.1708984375, 1.2769775390625, 1.383056640625, 1.4891357421875, 1.59521484375, 1.7012939453125, 1.807373046875, 1.9134521484375, 2.01953125, 2.1256103515625, 2.231689453125, 2.3377685546875, 2.44384765625, 2.5499267578125, 2.656005859375, 2.7620849609375, 2.8681640625, 2.9742431640625, 3.080322265625, 3.1864013671875, 3.29248046875, 3.3985595703125, 3.504638671875, 3.6107177734375, 3.716796875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 0.0, 5.0, 8.0, 15.0, 15.0, 15.0, 30.0, 46.0, 67.0, 69.0, 108.0, 114.0, 105.0, 102.0, 79.0, 61.0, 45.0, 34.0, 20.0, 13.0, 13.0, 12.0, 5.0, 1.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.49533462524414, -27.763118743896484, -27.030900955200195, -26.29868507385254, -25.56646728515625, -24.834251403808594, -24.102035522460938, -23.36981773376465, -22.63759994506836, -21.905384063720703, -21.173166275024414, -20.440950393676758, -19.70873260498047, -18.976516723632812, -18.244300842285156, -17.512083053588867, -16.77986717224121, -16.047651290893555, -15.315433502197266, -14.58321762084961, -13.85099983215332, -13.118783950805664, -12.386567115783691, -11.654350280761719, -10.922133445739746, -10.189916610717773, -9.4576997756958, -8.725482940673828, -7.993266582489014, -7.261049747467041, -6.528833389282227, -5.796616554260254, -5.064399719238281, -4.332182884216309, -3.599966287612915, -2.8677496910095215, -2.135532855987549, -1.4033160209655762, -0.6710996627807617, 0.06111717224121094, 0.7933340072631836, 1.5255507230758667, 2.25776743888855, 2.9899840354919434, 3.722200870513916, 4.454417705535889, 5.186634063720703, 5.918850898742676, 6.651067733764648, 7.383284568786621, 8.115501403808594, 8.84771728515625, 9.579935073852539, 10.312150955200195, 11.044367790222168, 11.77658462524414, 12.508801460266113, 13.241018295288086, 13.973235130310059, 14.705451965332031, 15.437667846679688, 16.169885635375977, 16.902101516723633, 17.634319305419922, 18.366535186767578]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 3.0, 8.0, 7.0, 5.0, 12.0, 11.0, 15.0, 18.0, 19.0, 25.0, 35.0, 33.0, 27.0, 36.0, 42.0, 37.0, 49.0, 46.0, 42.0, 46.0, 44.0, 49.0, 48.0, 33.0, 33.0, 42.0, 38.0, 33.0, 23.0, 17.0, 21.0, 24.0, 15.0, 17.0, 13.0, 8.0, 9.0, 8.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-14.731971740722656, -14.319819450378418, -13.907666206359863, -13.495513916015625, -13.08336067199707, -12.671208381652832, -12.259056091308594, -11.846902847290039, -11.434749603271484, -11.022597312927246, -10.610444068908691, -10.198291778564453, -9.786138534545898, -9.37398624420166, -8.961833953857422, -8.549680709838867, -8.137528419494629, -7.725375652313232, -7.313222885131836, -6.901070594787598, -6.488917350769043, -6.076765060424805, -5.664612293243408, -5.252459526062012, -4.840306758880615, -4.428153991699219, -4.016001224517822, -3.603848695755005, -3.1916959285736084, -2.779543161392212, -2.3673906326293945, -1.955237865447998, -1.5430850982666016, -1.130932331085205, -0.7187796831130981, -0.3066270351409912, 0.10552573204040527, 0.5176784992218018, 0.9298310279846191, 1.3419837951660156, 1.754136562347412, 2.1662893295288086, 2.578442096710205, 2.9905946254730225, 3.402747392654419, 3.8149001598358154, 4.227052688598633, 4.639205455780029, 5.051358222961426, 5.463510990142822, 5.875663757324219, 6.287816047668457, 6.699969291687012, 7.11212158203125, 7.5242743492126465, 7.936427116394043, 8.348579406738281, 8.76073169708252, 9.172884941101074, 9.585037231445312, 9.997190475463867, 10.409342765808105, 10.821495056152344, 11.233648300170898, 11.645801544189453]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 10.0, 11.0, 24.0, 25.0, 41.0, 76.0, 83.0, 107.0, 190.0, 311.0, 422.0, 703.0, 1123.0, 1771.0, 2952.0, 5180.0, 9411.0, 17785.0, 34845.0, 70830.0, 138559.0, 220921.0, 230184.0, 151416.0, 79166.0, 38708.0, 19573.0, 10309.0, 5520.0, 3146.0, 1955.0, 1137.0, 703.0, 459.0, 316.0, 178.0, 118.0, 89.0, 65.0, 40.0, 36.0, 18.0, 17.0, 5.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.03125, -19.443359375, -18.85546875, -18.267578125, -17.6796875, -17.091796875, -16.50390625, -15.916015625, -15.328125, -14.740234375, -14.15234375, -13.564453125, -12.9765625, -12.388671875, -11.80078125, -11.212890625, -10.625, -10.037109375, -9.44921875, -8.861328125, -8.2734375, -7.685546875, -7.09765625, -6.509765625, -5.921875, -5.333984375, -4.74609375, -4.158203125, -3.5703125, -2.982421875, -2.39453125, -1.806640625, -1.21875, -0.630859375, -0.04296875, 0.544921875, 1.1328125, 1.720703125, 2.30859375, 2.896484375, 3.484375, 4.072265625, 4.66015625, 5.248046875, 5.8359375, 6.423828125, 7.01171875, 7.599609375, 8.1875, 8.775390625, 9.36328125, 9.951171875, 10.5390625, 11.126953125, 11.71484375, 12.302734375, 12.890625, 13.478515625, 14.06640625, 14.654296875, 15.2421875, 15.830078125, 16.41796875, 17.005859375, 17.59375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 9.0, 5.0, 10.0, 14.0, 13.0, 21.0, 33.0, 29.0, 30.0, 26.0, 28.0, 40.0, 38.0, 50.0, 35.0, 48.0, 45.0, 47.0, 45.0, 39.0, 46.0, 31.0, 33.0, 45.0, 34.0, 30.0, 21.0, 19.0, 18.0, 16.0, 17.0, 17.0, 16.0, 11.0, 7.0, 5.0, 4.0, 6.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-14.1796875, -13.7786865234375, -13.377685546875, -12.9766845703125, -12.57568359375, -12.1746826171875, -11.773681640625, -11.3726806640625, -10.9716796875, -10.5706787109375, -10.169677734375, -9.7686767578125, -9.36767578125, -8.9666748046875, -8.565673828125, -8.1646728515625, -7.763671875, -7.3626708984375, -6.961669921875, -6.5606689453125, -6.15966796875, -5.7586669921875, -5.357666015625, -4.9566650390625, -4.5556640625, -4.1546630859375, -3.753662109375, -3.3526611328125, -2.95166015625, -2.5506591796875, -2.149658203125, -1.7486572265625, -1.34765625, -0.9466552734375, -0.545654296875, -0.1446533203125, 0.25634765625, 0.6573486328125, 1.058349609375, 1.4593505859375, 1.8603515625, 2.2613525390625, 2.662353515625, 3.0633544921875, 3.46435546875, 3.8653564453125, 4.266357421875, 4.6673583984375, 5.068359375, 5.4693603515625, 5.870361328125, 6.2713623046875, 6.67236328125, 7.0733642578125, 7.474365234375, 7.8753662109375, 8.2763671875, 8.6773681640625, 9.078369140625, 9.4793701171875, 9.88037109375, 10.2813720703125, 10.682373046875, 11.0833740234375, 11.484375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 2.0, 8.0, 8.0, 14.0, 20.0, 22.0, 25.0, 58.0, 61.0, 105.0, 148.0, 204.0, 359.0, 549.0, 798.0, 1212.0, 1939.0, 2838.0, 4603.0, 7344.0, 12304.0, 20372.0, 34733.0, 59550.0, 100906.0, 156867.0, 193453.0, 169732.0, 113194.0, 68149.0, 38999.0, 22975.0, 14128.0, 8371.0, 5152.0, 3316.0, 2120.0, 1337.0, 839.0, 561.0, 380.0, 267.0, 171.0, 110.0, 73.0, 63.0, 34.0, 23.0, 14.0, 20.0, 19.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.046875, -13.588134765625, -13.12939453125, -12.670654296875, -12.2119140625, -11.753173828125, -11.29443359375, -10.835693359375, -10.376953125, -9.918212890625, -9.45947265625, -9.000732421875, -8.5419921875, -8.083251953125, -7.62451171875, -7.165771484375, -6.70703125, -6.248291015625, -5.78955078125, -5.330810546875, -4.8720703125, -4.413330078125, -3.95458984375, -3.495849609375, -3.037109375, -2.578369140625, -2.11962890625, -1.660888671875, -1.2021484375, -0.743408203125, -0.28466796875, 0.174072265625, 0.6328125, 1.091552734375, 1.55029296875, 2.009033203125, 2.4677734375, 2.926513671875, 3.38525390625, 3.843994140625, 4.302734375, 4.761474609375, 5.22021484375, 5.678955078125, 6.1376953125, 6.596435546875, 7.05517578125, 7.513916015625, 7.97265625, 8.431396484375, 8.89013671875, 9.348876953125, 9.8076171875, 10.266357421875, 10.72509765625, 11.183837890625, 11.642578125, 12.101318359375, 12.56005859375, 13.018798828125, 13.4775390625, 13.936279296875, 14.39501953125, 14.853759765625, 15.3125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 9.0, 11.0, 11.0, 11.0, 12.0, 9.0, 18.0, 22.0, 18.0, 18.0, 23.0, 25.0, 33.0, 32.0, 34.0, 34.0, 33.0, 35.0, 35.0, 39.0, 37.0, 32.0, 37.0, 33.0, 25.0, 35.0, 39.0, 28.0, 38.0, 38.0, 32.0, 17.0, 24.0, 15.0, 17.0, 11.0, 16.0, 12.0, 8.0, 8.0, 5.0, 2.0, 4.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.046875, -7.7847900390625, -7.522705078125, -7.2606201171875, -6.99853515625, -6.7364501953125, -6.474365234375, -6.2122802734375, -5.9501953125, -5.6881103515625, -5.426025390625, -5.1639404296875, -4.90185546875, -4.6397705078125, -4.377685546875, -4.1156005859375, -3.853515625, -3.5914306640625, -3.329345703125, -3.0672607421875, -2.80517578125, -2.5430908203125, -2.281005859375, -2.0189208984375, -1.7568359375, -1.4947509765625, -1.232666015625, -0.9705810546875, -0.70849609375, -0.4464111328125, -0.184326171875, 0.0777587890625, 0.33984375, 0.6019287109375, 0.864013671875, 1.1260986328125, 1.38818359375, 1.6502685546875, 1.912353515625, 2.1744384765625, 2.4365234375, 2.6986083984375, 2.960693359375, 3.2227783203125, 3.48486328125, 3.7469482421875, 4.009033203125, 4.2711181640625, 4.533203125, 4.7952880859375, 5.057373046875, 5.3194580078125, 5.58154296875, 5.8436279296875, 6.105712890625, 6.3677978515625, 6.6298828125, 6.8919677734375, 7.154052734375, 7.4161376953125, 7.67822265625, 7.9403076171875, 8.202392578125, 8.4644775390625, 8.7265625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 9.0, 14.0, 27.0, 50.0, 62.0, 97.0, 142.0, 198.0, 343.0, 597.0, 991.0, 1643.0, 2940.0, 5320.0, 10734.0, 24020.0, 64939.0, 215472.0, 439480.0, 182282.0, 55960.0, 21852.0, 9865.0, 4934.0, 2678.0, 1502.0, 913.0, 536.0, 341.0, 214.0, 146.0, 79.0, 55.0, 39.0, 23.0, 18.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.921875, -29.968505859375, -29.01513671875, -28.061767578125, -27.1083984375, -26.155029296875, -25.20166015625, -24.248291015625, -23.294921875, -22.341552734375, -21.38818359375, -20.434814453125, -19.4814453125, -18.528076171875, -17.57470703125, -16.621337890625, -15.66796875, -14.714599609375, -13.76123046875, -12.807861328125, -11.8544921875, -10.901123046875, -9.94775390625, -8.994384765625, -8.041015625, -7.087646484375, -6.13427734375, -5.180908203125, -4.2275390625, -3.274169921875, -2.32080078125, -1.367431640625, -0.4140625, 0.539306640625, 1.49267578125, 2.446044921875, 3.3994140625, 4.352783203125, 5.30615234375, 6.259521484375, 7.212890625, 8.166259765625, 9.11962890625, 10.072998046875, 11.0263671875, 11.979736328125, 12.93310546875, 13.886474609375, 14.83984375, 15.793212890625, 16.74658203125, 17.699951171875, 18.6533203125, 19.606689453125, 20.56005859375, 21.513427734375, 22.466796875, 23.420166015625, 24.37353515625, 25.326904296875, 26.2802734375, 27.233642578125, 28.18701171875, 29.140380859375, 30.09375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 6.0, 5.0, 6.0, 4.0, 7.0, 10.0, 9.0, 19.0, 8.0, 30.0, 37.0, 44.0, 65.0, 78.0, 104.0, 104.0, 96.0, 76.0, 63.0, 50.0, 40.0, 28.0, 19.0, 19.0, 9.0, 14.0, 8.0, 4.0, 8.0, 3.0, 8.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016937255859375, -0.001638263463973999, -0.001582801342010498, -0.001527339220046997, -0.001471877098083496, -0.0014164149761199951, -0.0013609528541564941, -0.0013054907321929932, -0.0012500286102294922, -0.0011945664882659912, -0.0011391043663024902, -0.0010836422443389893, -0.0010281801223754883, -0.0009727180004119873, -0.0009172558784484863, -0.0008617937564849854, -0.0008063316345214844, -0.0007508695125579834, -0.0006954073905944824, -0.0006399452686309814, -0.0005844831466674805, -0.0005290210247039795, -0.0004735589027404785, -0.00041809678077697754, -0.00036263465881347656, -0.0003071725368499756, -0.0002517104148864746, -0.00019624829292297363, -0.00014078617095947266, -8.532404899597168e-05, -2.9861927032470703e-05, 2.5600194931030273e-05, 8.106231689453125e-05, 0.00013652443885803223, 0.0001919865608215332, 0.0002474486827850342, 0.00030291080474853516, 0.00035837292671203613, 0.0004138350486755371, 0.0004692971706390381, 0.0005247592926025391, 0.00058022141456604, 0.000635683536529541, 0.000691145658493042, 0.000746607780456543, 0.0008020699024200439, 0.0008575320243835449, 0.0009129941463470459, 0.0009684562683105469, 0.0010239183902740479, 0.0010793805122375488, 0.0011348426342010498, 0.0011903047561645508, 0.0012457668781280518, 0.0013012290000915527, 0.0013566911220550537, 0.0014121532440185547, 0.0014676153659820557, 0.0015230774879455566, 0.0015785396099090576, 0.0016340017318725586, 0.0016894638538360596, 0.0017449259757995605, 0.0018003880977630615, 0.0018558502197265625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 27.0, 28.0, 50.0, 49.0, 71.0, 75.0, 146.0, 191.0, 262.0, 439.0, 685.0, 1038.0, 1658.0, 2756.0, 4522.0, 8054.0, 15867.0, 33336.0, 75227.0, 182761.0, 322338.0, 223451.0, 93592.0, 40106.0, 18791.0, 9537.0, 5128.0, 3060.0, 1796.0, 1176.0, 722.0, 493.0, 350.0, 231.0, 157.0, 124.0, 60.0, 55.0, 27.0, 29.0, 11.0, 11.0, 12.0, 12.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0], "bins": [-20.40625, -19.79931640625, -19.1923828125, -18.58544921875, -17.978515625, -17.37158203125, -16.7646484375, -16.15771484375, -15.55078125, -14.94384765625, -14.3369140625, -13.72998046875, -13.123046875, -12.51611328125, -11.9091796875, -11.30224609375, -10.6953125, -10.08837890625, -9.4814453125, -8.87451171875, -8.267578125, -7.66064453125, -7.0537109375, -6.44677734375, -5.83984375, -5.23291015625, -4.6259765625, -4.01904296875, -3.412109375, -2.80517578125, -2.1982421875, -1.59130859375, -0.984375, -0.37744140625, 0.2294921875, 0.83642578125, 1.443359375, 2.05029296875, 2.6572265625, 3.26416015625, 3.87109375, 4.47802734375, 5.0849609375, 5.69189453125, 6.298828125, 6.90576171875, 7.5126953125, 8.11962890625, 8.7265625, 9.33349609375, 9.9404296875, 10.54736328125, 11.154296875, 11.76123046875, 12.3681640625, 12.97509765625, 13.58203125, 14.18896484375, 14.7958984375, 15.40283203125, 16.009765625, 16.61669921875, 17.2236328125, 17.83056640625, 18.4375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 6.0, 2.0, 5.0, 11.0, 20.0, 23.0, 29.0, 37.0, 55.0, 71.0, 76.0, 77.0, 97.0, 94.0, 67.0, 73.0, 66.0, 47.0, 40.0, 23.0, 19.0, 20.0, 13.0, 8.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.625, -9.3397216796875, -9.054443359375, -8.7691650390625, -8.48388671875, -8.1986083984375, -7.913330078125, -7.6280517578125, -7.3427734375, -7.0574951171875, -6.772216796875, -6.4869384765625, -6.20166015625, -5.9163818359375, -5.631103515625, -5.3458251953125, -5.060546875, -4.7752685546875, -4.489990234375, -4.2047119140625, -3.91943359375, -3.6341552734375, -3.348876953125, -3.0635986328125, -2.7783203125, -2.4930419921875, -2.207763671875, -1.9224853515625, -1.63720703125, -1.3519287109375, -1.066650390625, -0.7813720703125, -0.49609375, -0.2108154296875, 0.074462890625, 0.3597412109375, 0.64501953125, 0.9302978515625, 1.215576171875, 1.5008544921875, 1.7861328125, 2.0714111328125, 2.356689453125, 2.6419677734375, 2.92724609375, 3.2125244140625, 3.497802734375, 3.7830810546875, 4.068359375, 4.3536376953125, 4.638916015625, 4.9241943359375, 5.20947265625, 5.4947509765625, 5.780029296875, 6.0653076171875, 6.3505859375, 6.6358642578125, 6.921142578125, 7.2064208984375, 7.49169921875, 7.7769775390625, 8.062255859375, 8.3475341796875, 8.6328125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 2.0, 7.0, 4.0, 5.0, 10.0, 19.0, 14.0, 25.0, 25.0, 29.0, 33.0, 55.0, 62.0, 75.0, 81.0, 74.0, 76.0, 70.0, 59.0, 55.0, 47.0, 33.0, 29.0, 30.0, 13.0, 12.0, 11.0, 11.0, 4.0, 8.0, 6.0, 2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.959487915039062, -18.40255355834961, -17.845619201660156, -17.28868293762207, -16.731748580932617, -16.174814224243164, -15.617879867553711, -15.060945510864258, -14.504010200500488, -13.947075843811035, -13.390140533447266, -12.833206176757812, -12.27627182006836, -11.71933650970459, -11.162402153015137, -10.605466842651367, -10.048532485961914, -9.491598129272461, -8.934662818908691, -8.377728462219238, -7.820793628692627, -7.263858795166016, -6.7069244384765625, -6.149989604949951, -5.59305477142334, -5.0361199378967285, -4.479185104370117, -3.922250747680664, -3.3653159141540527, -2.8083810806274414, -2.251446485519409, -1.694511890411377, -1.1375789642333984, -0.5806442499160767, -0.023709535598754883, 0.5332251787185669, 1.0901598930358887, 1.6470947265625, 2.2040293216705322, 2.7609639167785645, 3.317898750305176, 3.874833583831787, 4.431768417358398, 4.988702774047852, 5.545637607574463, 6.102572441101074, 6.659506797790527, 7.216441631317139, 7.77337646484375, 8.330310821533203, 8.887246131896973, 9.444180488586426, 10.001115798950195, 10.558050155639648, 11.114984512329102, 11.671918869018555, 12.228854179382324, 12.785788536071777, 13.342723846435547, 13.899658203125, 14.456592559814453, 15.013527870178223, 15.570462226867676, 16.127397537231445, 16.6843318939209]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 8.0, 3.0, 9.0, 8.0, 17.0, 12.0, 24.0, 32.0, 30.0, 42.0, 42.0, 35.0, 40.0, 44.0, 47.0, 38.0, 52.0, 42.0, 43.0, 58.0, 54.0, 35.0, 36.0, 31.0, 35.0, 36.0, 39.0, 21.0, 16.0, 15.0, 12.0, 9.0, 9.0, 5.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.434259414672852, -13.986702919006348, -13.539145469665527, -13.091588973999023, -12.644031524658203, -12.1964750289917, -11.748918533325195, -11.301361083984375, -10.853803634643555, -10.40624713897705, -9.95868968963623, -9.511133193969727, -9.063575744628906, -8.616019248962402, -8.168462753295898, -7.720905303955078, -7.273348808288574, -6.825791835784912, -6.37823486328125, -5.930678367614746, -5.483120918273926, -5.035564422607422, -4.58800745010376, -4.140450477600098, -3.6928935050964355, -3.2453365325927734, -2.7977795600891113, -2.3502228260040283, -1.9026658535003662, -1.455108880996704, -1.007552146911621, -0.559995174407959, -0.11243724822998047, 0.33511966466903687, 0.7826765775680542, 1.2302334308624268, 1.6777904033660889, 2.125347375869751, 2.572904109954834, 3.020461082458496, 3.468018054962158, 3.9155750274658203, 4.363131999969482, 4.8106889724731445, 5.258245468139648, 5.705802917480469, 6.153359413146973, 6.600916385650635, 7.048473358154297, 7.496030330657959, 7.943587303161621, 8.391143798828125, 8.838701248168945, 9.28625774383545, 9.733814239501953, 10.181371688842773, 10.628929138183594, 11.076485633850098, 11.524043083190918, 11.971599578857422, 12.419157028198242, 12.866713523864746, 13.31427001953125, 13.76182746887207, 14.209383964538574]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 11.0, 21.0, 29.0, 43.0, 85.0, 128.0, 189.0, 296.0, 523.0, 816.0, 1241.0, 2172.0, 3643.0, 6650.0, 12763.0, 26094.0, 61519.0, 170198.0, 533300.0, 1314840.0, 1287355.0, 502636.0, 157998.0, 57912.0, 25227.0, 12372.0, 6670.0, 3696.0, 2228.0, 1270.0, 790.0, 559.0, 362.0, 232.0, 134.0, 94.0, 58.0, 39.0, 19.0, 21.0, 9.0, 11.0, 5.0, 5.0, 3.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.34375, -15.759521484375, -15.17529296875, -14.591064453125, -14.0068359375, -13.422607421875, -12.83837890625, -12.254150390625, -11.669921875, -11.085693359375, -10.50146484375, -9.917236328125, -9.3330078125, -8.748779296875, -8.16455078125, -7.580322265625, -6.99609375, -6.411865234375, -5.82763671875, -5.243408203125, -4.6591796875, -4.074951171875, -3.49072265625, -2.906494140625, -2.322265625, -1.738037109375, -1.15380859375, -0.569580078125, 0.0146484375, 0.598876953125, 1.18310546875, 1.767333984375, 2.3515625, 2.935791015625, 3.52001953125, 4.104248046875, 4.6884765625, 5.272705078125, 5.85693359375, 6.441162109375, 7.025390625, 7.609619140625, 8.19384765625, 8.778076171875, 9.3623046875, 9.946533203125, 10.53076171875, 11.114990234375, 11.69921875, 12.283447265625, 12.86767578125, 13.451904296875, 14.0361328125, 14.620361328125, 15.20458984375, 15.788818359375, 16.373046875, 16.957275390625, 17.54150390625, 18.125732421875, 18.7099609375, 19.294189453125, 19.87841796875, 20.462646484375, 21.046875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 5.0, 11.0, 11.0, 7.0, 19.0, 16.0, 25.0, 25.0, 26.0, 35.0, 43.0, 42.0, 32.0, 38.0, 43.0, 50.0, 41.0, 46.0, 55.0, 47.0, 45.0, 42.0, 33.0, 35.0, 31.0, 32.0, 28.0, 26.0, 22.0, 16.0, 10.0, 15.0, 11.0, 11.0, 4.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.84375, -9.5634765625, -9.283203125, -9.0029296875, -8.72265625, -8.4423828125, -8.162109375, -7.8818359375, -7.6015625, -7.3212890625, -7.041015625, -6.7607421875, -6.48046875, -6.2001953125, -5.919921875, -5.6396484375, -5.359375, -5.0791015625, -4.798828125, -4.5185546875, -4.23828125, -3.9580078125, -3.677734375, -3.3974609375, -3.1171875, -2.8369140625, -2.556640625, -2.2763671875, -1.99609375, -1.7158203125, -1.435546875, -1.1552734375, -0.875, -0.5947265625, -0.314453125, -0.0341796875, 0.24609375, 0.5263671875, 0.806640625, 1.0869140625, 1.3671875, 1.6474609375, 1.927734375, 2.2080078125, 2.48828125, 2.7685546875, 3.048828125, 3.3291015625, 3.609375, 3.8896484375, 4.169921875, 4.4501953125, 4.73046875, 5.0107421875, 5.291015625, 5.5712890625, 5.8515625, 6.1318359375, 6.412109375, 6.6923828125, 6.97265625, 7.2529296875, 7.533203125, 7.8134765625, 8.09375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 7.0, 2.0, 6.0, 7.0, 14.0, 10.0, 20.0, 31.0, 45.0, 62.0, 70.0, 108.0, 156.0, 252.0, 393.0, 525.0, 808.0, 1109.0, 1743.0, 2594.0, 3908.0, 6407.0, 10915.0, 19682.0, 37867.0, 85687.0, 224441.0, 633143.0, 1318819.0, 1107770.0, 445303.0, 158657.0, 62905.0, 30102.0, 15698.0, 9051.0, 5550.0, 3492.0, 2249.0, 1516.0, 998.0, 667.0, 456.0, 329.0, 226.0, 159.0, 88.0, 82.0, 45.0, 31.0, 25.0, 22.0, 19.0, 10.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.984375, -15.448486328125, -14.91259765625, -14.376708984375, -13.8408203125, -13.304931640625, -12.76904296875, -12.233154296875, -11.697265625, -11.161376953125, -10.62548828125, -10.089599609375, -9.5537109375, -9.017822265625, -8.48193359375, -7.946044921875, -7.41015625, -6.874267578125, -6.33837890625, -5.802490234375, -5.2666015625, -4.730712890625, -4.19482421875, -3.658935546875, -3.123046875, -2.587158203125, -2.05126953125, -1.515380859375, -0.9794921875, -0.443603515625, 0.09228515625, 0.628173828125, 1.1640625, 1.699951171875, 2.23583984375, 2.771728515625, 3.3076171875, 3.843505859375, 4.37939453125, 4.915283203125, 5.451171875, 5.987060546875, 6.52294921875, 7.058837890625, 7.5947265625, 8.130615234375, 8.66650390625, 9.202392578125, 9.73828125, 10.274169921875, 10.81005859375, 11.345947265625, 11.8818359375, 12.417724609375, 12.95361328125, 13.489501953125, 14.025390625, 14.561279296875, 15.09716796875, 15.633056640625, 16.1689453125, 16.704833984375, 17.24072265625, 17.776611328125, 18.3125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 5.0, 9.0, 6.0, 15.0, 10.0, 13.0, 19.0, 21.0, 31.0, 44.0, 50.0, 69.0, 80.0, 102.0, 118.0, 181.0, 214.0, 261.0, 298.0, 299.0, 337.0, 335.0, 280.0, 278.0, 219.0, 165.0, 137.0, 123.0, 86.0, 60.0, 41.0, 42.0, 22.0, 18.0, 13.0, 13.0, 7.0, 7.0, 10.0, 9.0, 2.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-5.6015625, -5.44842529296875, -5.2952880859375, -5.14215087890625, -4.989013671875, -4.83587646484375, -4.6827392578125, -4.52960205078125, -4.37646484375, -4.22332763671875, -4.0701904296875, -3.91705322265625, -3.763916015625, -3.61077880859375, -3.4576416015625, -3.30450439453125, -3.1513671875, -2.99822998046875, -2.8450927734375, -2.69195556640625, -2.538818359375, -2.38568115234375, -2.2325439453125, -2.07940673828125, -1.92626953125, -1.77313232421875, -1.6199951171875, -1.46685791015625, -1.313720703125, -1.16058349609375, -1.0074462890625, -0.85430908203125, -0.701171875, -0.54803466796875, -0.3948974609375, -0.24176025390625, -0.088623046875, 0.06451416015625, 0.2176513671875, 0.37078857421875, 0.52392578125, 0.67706298828125, 0.8302001953125, 0.98333740234375, 1.136474609375, 1.28961181640625, 1.4427490234375, 1.59588623046875, 1.7490234375, 1.90216064453125, 2.0552978515625, 2.20843505859375, 2.361572265625, 2.51470947265625, 2.6678466796875, 2.82098388671875, 2.97412109375, 3.12725830078125, 3.2803955078125, 3.43353271484375, 3.586669921875, 3.73980712890625, 3.8929443359375, 4.04608154296875, 4.19921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 8.0, 6.0, 8.0, 14.0, 14.0, 22.0, 30.0, 30.0, 48.0, 48.0, 76.0, 82.0, 116.0, 93.0, 74.0, 69.0, 67.0, 53.0, 31.0, 23.0, 23.0, 17.0, 16.0, 3.0, 8.0, 7.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.927227020263672, -22.33791160583496, -21.74859619140625, -21.15928077697754, -20.569965362548828, -19.980649948120117, -19.391334533691406, -18.802019119262695, -18.212703704833984, -17.623388290405273, -17.034072875976562, -16.44475746154785, -15.85544204711914, -15.26612663269043, -14.676811218261719, -14.087495803833008, -13.498181343078613, -12.908865928649902, -12.319550514221191, -11.73023509979248, -11.14091968536377, -10.551604270935059, -9.962289810180664, -9.372974395751953, -8.783658981323242, -8.194343566894531, -7.60502815246582, -7.015712738037109, -6.426397323608398, -5.8370819091796875, -5.247766971588135, -4.658451557159424, -4.069136619567871, -3.47982120513916, -2.890505790710449, -2.3011906147003174, -1.7118752002716064, -1.1225597858428955, -0.5332446098327637, 0.056070804595947266, 0.6453862190246582, 1.2347016334533691, 1.8240169286727905, 2.413332223892212, 3.002647638320923, 3.591963052749634, 4.181278228759766, 4.770593643188477, 5.3599090576171875, 5.949224472045898, 6.538539886474609, 7.12785530090332, 7.717170715332031, 8.306486129760742, 8.895801544189453, 9.485116958618164, 10.074432373046875, 10.663747787475586, 11.253063201904297, 11.842378616333008, 12.431694030761719, 13.02100944519043, 13.61032485961914, 14.199640274047852, 14.788954734802246]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 9.0, 22.0, 16.0, 16.0, 26.0, 33.0, 40.0, 36.0, 31.0, 35.0, 43.0, 44.0, 63.0, 56.0, 56.0, 60.0, 47.0, 49.0, 43.0, 36.0, 34.0, 24.0, 37.0, 25.0, 27.0, 17.0, 15.0, 12.0, 6.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.667814254760742, -12.26236343383789, -11.856912612915039, -11.451460838317871, -11.04601001739502, -10.640559196472168, -10.235107421875, -9.829656600952148, -9.424205780029297, -9.018754959106445, -8.613304138183594, -8.207852363586426, -7.802401542663574, -7.396950721740723, -6.991499423980713, -6.586048126220703, -6.180597305297852, -5.775146484375, -5.36969518661499, -4.9642438888549805, -4.558793067932129, -4.153342247009277, -3.7478909492492676, -3.342439889907837, -2.9369888305664062, -2.5315377712249756, -2.126086711883545, -1.7206356525421143, -1.3151845932006836, -0.9097335338592529, -0.5042824745178223, -0.0988314151763916, 0.30661964416503906, 0.7120707035064697, 1.1175217628479004, 1.522972822189331, 1.9284238815307617, 2.3338749408721924, 2.739326000213623, 3.1447770595550537, 3.5502281188964844, 3.955679178237915, 4.361130237579346, 4.7665815353393555, 5.172032356262207, 5.577483177185059, 5.982934474945068, 6.388385772705078, 6.79383659362793, 7.199287414550781, 7.604738712310791, 8.0101900100708, 8.415640830993652, 8.821091651916504, 9.226543426513672, 9.631994247436523, 10.037445068359375, 10.442895889282227, 10.848346710205078, 11.253798484802246, 11.659249305725098, 12.06470012664795, 12.470151901245117, 12.875602722167969, 13.28105354309082]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 4.0, 6.0, 8.0, 13.0, 24.0, 33.0, 55.0, 82.0, 126.0, 171.0, 311.0, 460.0, 675.0, 1192.0, 2029.0, 3677.0, 6613.0, 12106.0, 23081.0, 44470.0, 84498.0, 152076.0, 220409.0, 207518.0, 134102.0, 73130.0, 38048.0, 19674.0, 10624.0, 5657.0, 3191.0, 1794.0, 1055.0, 561.0, 383.0, 244.0, 151.0, 107.0, 65.0, 47.0, 24.0, 19.0, 18.0, 12.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-8.59375, -8.354248046875, -8.11474609375, -7.875244140625, -7.6357421875, -7.396240234375, -7.15673828125, -6.917236328125, -6.677734375, -6.438232421875, -6.19873046875, -5.959228515625, -5.7197265625, -5.480224609375, -5.24072265625, -5.001220703125, -4.76171875, -4.522216796875, -4.28271484375, -4.043212890625, -3.8037109375, -3.564208984375, -3.32470703125, -3.085205078125, -2.845703125, -2.606201171875, -2.36669921875, -2.127197265625, -1.8876953125, -1.648193359375, -1.40869140625, -1.169189453125, -0.9296875, -0.690185546875, -0.45068359375, -0.211181640625, 0.0283203125, 0.267822265625, 0.50732421875, 0.746826171875, 0.986328125, 1.225830078125, 1.46533203125, 1.704833984375, 1.9443359375, 2.183837890625, 2.42333984375, 2.662841796875, 2.90234375, 3.141845703125, 3.38134765625, 3.620849609375, 3.8603515625, 4.099853515625, 4.33935546875, 4.578857421875, 4.818359375, 5.057861328125, 5.29736328125, 5.536865234375, 5.7763671875, 6.015869140625, 6.25537109375, 6.494873046875, 6.734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 11.0, 19.0, 21.0, 11.0, 29.0, 35.0, 33.0, 28.0, 45.0, 44.0, 39.0, 59.0, 49.0, 66.0, 52.0, 58.0, 54.0, 46.0, 38.0, 39.0, 37.0, 32.0, 26.0, 30.0, 14.0, 23.0, 12.0, 5.0, 9.0, 5.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0390625, -13.59765625, -13.15625, -12.71484375, -12.2734375, -11.83203125, -11.390625, -10.94921875, -10.5078125, -10.06640625, -9.625, -9.18359375, -8.7421875, -8.30078125, -7.859375, -7.41796875, -6.9765625, -6.53515625, -6.09375, -5.65234375, -5.2109375, -4.76953125, -4.328125, -3.88671875, -3.4453125, -3.00390625, -2.5625, -2.12109375, -1.6796875, -1.23828125, -0.796875, -0.35546875, 0.0859375, 0.52734375, 0.96875, 1.41015625, 1.8515625, 2.29296875, 2.734375, 3.17578125, 3.6171875, 4.05859375, 4.5, 4.94140625, 5.3828125, 5.82421875, 6.265625, 6.70703125, 7.1484375, 7.58984375, 8.03125, 8.47265625, 8.9140625, 9.35546875, 9.796875, 10.23828125, 10.6796875, 11.12109375, 11.5625, 12.00390625, 12.4453125, 12.88671875, 13.328125, 13.76953125, 14.2109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 18.0, 30.0, 33.0, 45.0, 67.0, 80.0, 149.0, 196.0, 262.0, 421.0, 599.0, 976.0, 1558.0, 2457.0, 3860.0, 6660.0, 11115.0, 19379.0, 36442.0, 70490.0, 139304.0, 239013.0, 233375.0, 133815.0, 66936.0, 34860.0, 19094.0, 10738.0, 6197.0, 3751.0, 2320.0, 1474.0, 948.0, 614.0, 391.0, 272.0, 175.0, 131.0, 81.0, 52.0, 40.0, 29.0, 28.0, 20.0, 10.0, 5.0, 10.0, 5.0, 2.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0], "bins": [-8.3046875, -8.0364990234375, -7.768310546875, -7.5001220703125, -7.23193359375, -6.9637451171875, -6.695556640625, -6.4273681640625, -6.1591796875, -5.8909912109375, -5.622802734375, -5.3546142578125, -5.08642578125, -4.8182373046875, -4.550048828125, -4.2818603515625, -4.013671875, -3.7454833984375, -3.477294921875, -3.2091064453125, -2.94091796875, -2.6727294921875, -2.404541015625, -2.1363525390625, -1.8681640625, -1.5999755859375, -1.331787109375, -1.0635986328125, -0.79541015625, -0.5272216796875, -0.259033203125, 0.0091552734375, 0.27734375, 0.5455322265625, 0.813720703125, 1.0819091796875, 1.35009765625, 1.6182861328125, 1.886474609375, 2.1546630859375, 2.4228515625, 2.6910400390625, 2.959228515625, 3.2274169921875, 3.49560546875, 3.7637939453125, 4.031982421875, 4.3001708984375, 4.568359375, 4.8365478515625, 5.104736328125, 5.3729248046875, 5.64111328125, 5.9093017578125, 6.177490234375, 6.4456787109375, 6.7138671875, 6.9820556640625, 7.250244140625, 7.5184326171875, 7.78662109375, 8.0548095703125, 8.322998046875, 8.5911865234375, 8.859375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 13.0, 14.0, 15.0, 21.0, 16.0, 21.0, 25.0, 34.0, 29.0, 34.0, 29.0, 42.0, 37.0, 35.0, 45.0, 43.0, 52.0, 51.0, 41.0, 35.0, 37.0, 54.0, 40.0, 23.0, 24.0, 28.0, 21.0, 29.0, 19.0, 11.0, 13.0, 13.0, 13.0, 7.0, 4.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.671875, -6.4432373046875, -6.214599609375, -5.9859619140625, -5.75732421875, -5.5286865234375, -5.300048828125, -5.0714111328125, -4.8427734375, -4.6141357421875, -4.385498046875, -4.1568603515625, -3.92822265625, -3.6995849609375, -3.470947265625, -3.2423095703125, -3.013671875, -2.7850341796875, -2.556396484375, -2.3277587890625, -2.09912109375, -1.8704833984375, -1.641845703125, -1.4132080078125, -1.1845703125, -0.9559326171875, -0.727294921875, -0.4986572265625, -0.27001953125, -0.0413818359375, 0.187255859375, 0.4158935546875, 0.64453125, 0.8731689453125, 1.101806640625, 1.3304443359375, 1.55908203125, 1.7877197265625, 2.016357421875, 2.2449951171875, 2.4736328125, 2.7022705078125, 2.930908203125, 3.1595458984375, 3.38818359375, 3.6168212890625, 3.845458984375, 4.0740966796875, 4.302734375, 4.5313720703125, 4.760009765625, 4.9886474609375, 5.21728515625, 5.4459228515625, 5.674560546875, 5.9031982421875, 6.1318359375, 6.3604736328125, 6.589111328125, 6.8177490234375, 7.04638671875, 7.2750244140625, 7.503662109375, 7.7322998046875, 7.9609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 12.0, 17.0, 29.0, 33.0, 53.0, 87.0, 153.0, 248.0, 385.0, 656.0, 1041.0, 1805.0, 3301.0, 5842.0, 11276.0, 23826.0, 55707.0, 147309.0, 358266.0, 265702.0, 97185.0, 38882.0, 17256.0, 8505.0, 4506.0, 2660.0, 1442.0, 922.0, 530.0, 329.0, 213.0, 152.0, 67.0, 49.0, 35.0, 29.0, 13.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.39886474609375, -6.1766357421875, -5.95440673828125, -5.732177734375, -5.50994873046875, -5.2877197265625, -5.06549072265625, -4.84326171875, -4.62103271484375, -4.3988037109375, -4.17657470703125, -3.954345703125, -3.73211669921875, -3.5098876953125, -3.28765869140625, -3.0654296875, -2.84320068359375, -2.6209716796875, -2.39874267578125, -2.176513671875, -1.95428466796875, -1.7320556640625, -1.50982666015625, -1.28759765625, -1.06536865234375, -0.8431396484375, -0.62091064453125, -0.398681640625, -0.17645263671875, 0.0457763671875, 0.26800537109375, 0.490234375, 0.71246337890625, 0.9346923828125, 1.15692138671875, 1.379150390625, 1.60137939453125, 1.8236083984375, 2.04583740234375, 2.26806640625, 2.49029541015625, 2.7125244140625, 2.93475341796875, 3.156982421875, 3.37921142578125, 3.6014404296875, 3.82366943359375, 4.0458984375, 4.26812744140625, 4.4903564453125, 4.71258544921875, 4.934814453125, 5.15704345703125, 5.3792724609375, 5.60150146484375, 5.82373046875, 6.04595947265625, 6.2681884765625, 6.49041748046875, 6.712646484375, 6.93487548828125, 7.1571044921875, 7.37933349609375, 7.6015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 15.0, 2.0, 7.0, 7.0, 9.0, 11.0, 22.0, 26.0, 26.0, 44.0, 53.0, 86.0, 101.0, 106.0, 122.0, 83.0, 93.0, 51.0, 34.0, 22.0, 20.0, 15.0, 9.0, 9.0, 8.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034165382385253906, -0.00033053383231163025, -0.00031941384077072144, -0.0003082938492298126, -0.0002971738576889038, -0.000286053866147995, -0.0002749338746070862, -0.00026381388306617737, -0.00025269389152526855, -0.00024157389998435974, -0.00023045390844345093, -0.00021933391690254211, -0.0002082139253616333, -0.0001970939338207245, -0.00018597394227981567, -0.00017485395073890686, -0.00016373395919799805, -0.00015261396765708923, -0.00014149397611618042, -0.0001303739845752716, -0.00011925399303436279, -0.00010813400149345398, -9.701400995254517e-05, -8.589401841163635e-05, -7.477402687072754e-05, -6.365403532981873e-05, -5.253404378890991e-05, -4.14140522480011e-05, -3.0294060707092285e-05, -1.917406916618347e-05, -8.054077625274658e-06, 3.0659139156341553e-06, 1.4185905456542969e-05, 2.5305896997451782e-05, 3.6425888538360596e-05, 4.754588007926941e-05, 5.866587162017822e-05, 6.978586316108704e-05, 8.090585470199585e-05, 9.202584624290466e-05, 0.00010314583778381348, 0.00011426582932472229, 0.0001253858208656311, 0.00013650581240653992, 0.00014762580394744873, 0.00015874579548835754, 0.00016986578702926636, 0.00018098577857017517, 0.00019210577011108398, 0.0002032257616519928, 0.0002143457531929016, 0.00022546574473381042, 0.00023658573627471924, 0.00024770572781562805, 0.00025882571935653687, 0.0002699457108974457, 0.0002810657024383545, 0.0002921856939792633, 0.0003033056855201721, 0.00031442567706108093, 0.00032554566860198975, 0.00033666566014289856, 0.0003477856516838074, 0.0003589056432247162, 0.000370025634765625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 9.0, 5.0, 11.0, 10.0, 16.0, 26.0, 23.0, 48.0, 58.0, 99.0, 124.0, 186.0, 263.0, 437.0, 629.0, 902.0, 1342.0, 2054.0, 3085.0, 4919.0, 7947.0, 12875.0, 22480.0, 39889.0, 74704.0, 138483.0, 221622.0, 216503.0, 133273.0, 71848.0, 38623.0, 21728.0, 12831.0, 7649.0, 4789.0, 3010.0, 1948.0, 1291.0, 879.0, 608.0, 393.0, 275.0, 201.0, 150.0, 99.0, 66.0, 48.0, 28.0, 26.0, 12.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-4.34765625, -4.207275390625, -4.06689453125, -3.926513671875, -3.7861328125, -3.645751953125, -3.50537109375, -3.364990234375, -3.224609375, -3.084228515625, -2.94384765625, -2.803466796875, -2.6630859375, -2.522705078125, -2.38232421875, -2.241943359375, -2.1015625, -1.961181640625, -1.82080078125, -1.680419921875, -1.5400390625, -1.399658203125, -1.25927734375, -1.118896484375, -0.978515625, -0.838134765625, -0.69775390625, -0.557373046875, -0.4169921875, -0.276611328125, -0.13623046875, 0.004150390625, 0.14453125, 0.284912109375, 0.42529296875, 0.565673828125, 0.7060546875, 0.846435546875, 0.98681640625, 1.127197265625, 1.267578125, 1.407958984375, 1.54833984375, 1.688720703125, 1.8291015625, 1.969482421875, 2.10986328125, 2.250244140625, 2.390625, 2.531005859375, 2.67138671875, 2.811767578125, 2.9521484375, 3.092529296875, 3.23291015625, 3.373291015625, 3.513671875, 3.654052734375, 3.79443359375, 3.934814453125, 4.0751953125, 4.215576171875, 4.35595703125, 4.496337890625, 4.63671875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 7.0, 8.0, 5.0, 13.0, 12.0, 8.0, 19.0, 19.0, 20.0, 22.0, 32.0, 37.0, 39.0, 47.0, 54.0, 60.0, 67.0, 64.0, 63.0, 45.0, 56.0, 30.0, 38.0, 41.0, 28.0, 30.0, 28.0, 12.0, 18.0, 9.0, 14.0, 6.0, 5.0, 11.0, 3.0, 5.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.968231201171875, -1.90716552734375, -1.846099853515625, -1.7850341796875, -1.723968505859375, -1.66290283203125, -1.601837158203125, -1.540771484375, -1.479705810546875, -1.41864013671875, -1.357574462890625, -1.2965087890625, -1.235443115234375, -1.17437744140625, -1.113311767578125, -1.05224609375, -0.991180419921875, -0.93011474609375, -0.869049072265625, -0.8079833984375, -0.746917724609375, -0.68585205078125, -0.624786376953125, -0.563720703125, -0.502655029296875, -0.44158935546875, -0.380523681640625, -0.3194580078125, -0.258392333984375, -0.19732666015625, -0.136260986328125, -0.0751953125, -0.014129638671875, 0.04693603515625, 0.108001708984375, 0.1690673828125, 0.230133056640625, 0.29119873046875, 0.352264404296875, 0.413330078125, 0.474395751953125, 0.53546142578125, 0.596527099609375, 0.6575927734375, 0.718658447265625, 0.77972412109375, 0.840789794921875, 0.90185546875, 0.962921142578125, 1.02398681640625, 1.085052490234375, 1.1461181640625, 1.207183837890625, 1.26824951171875, 1.329315185546875, 1.390380859375, 1.451446533203125, 1.51251220703125, 1.573577880859375, 1.6346435546875, 1.695709228515625, 1.75677490234375, 1.817840576171875, 1.87890625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 4.0, 5.0, 10.0, 17.0, 13.0, 18.0, 19.0, 39.0, 45.0, 68.0, 73.0, 83.0, 108.0, 96.0, 63.0, 85.0, 67.0, 42.0, 42.0, 23.0, 18.0, 15.0, 11.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.896865844726562, -22.305076599121094, -21.713285446166992, -21.121496200561523, -20.529706954956055, -19.937917709350586, -19.346126556396484, -18.754337310791016, -18.162548065185547, -17.570758819580078, -16.978967666625977, -16.387178421020508, -15.795389175415039, -15.203598976135254, -14.611808776855469, -14.02001953125, -13.428229331970215, -12.83643913269043, -12.244649887084961, -11.652859687805176, -11.061070442199707, -10.469280242919922, -9.877490997314453, -9.285700798034668, -8.693910598754883, -8.102120399475098, -7.510331153869629, -6.918540954589844, -6.326751708984375, -5.73496150970459, -5.143171787261963, -4.551382064819336, -3.9595937728881836, -3.3678040504455566, -2.7760143280029297, -2.1842243671417236, -1.5924346446990967, -1.0006449222564697, -0.40885496139526367, 0.18293476104736328, 0.7747244834899902, 1.3665142059326172, 1.9583040475845337, 2.55009388923645, 3.141883611679077, 3.733673334121704, 4.32546329498291, 4.917253017425537, 5.509042739868164, 6.100832462310791, 6.692622184753418, 7.284412384033203, 7.876201629638672, 8.467991828918457, 9.059782028198242, 9.651571273803711, 10.24336051940918, 10.835150718688965, 11.426939964294434, 12.018730163574219, 12.610519409179688, 13.202309608459473, 13.794099807739258, 14.385889053344727, 14.977679252624512]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 9.0, 11.0, 6.0, 24.0, 9.0, 25.0, 32.0, 28.0, 39.0, 29.0, 38.0, 31.0, 45.0, 54.0, 48.0, 67.0, 62.0, 41.0, 56.0, 50.0, 37.0, 45.0, 28.0, 35.0, 21.0, 29.0, 21.0, 19.0, 11.0, 12.0, 11.0, 10.0, 4.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.114065170288086, -11.72291088104248, -11.331755638122559, -10.940601348876953, -10.549447059631348, -10.158292770385742, -9.76713752746582, -9.375983238220215, -8.98482894897461, -8.593674659729004, -8.202519416809082, -7.811365127563477, -7.420210838317871, -7.029056072235107, -6.637901306152344, -6.246747016906738, -5.855591773986816, -5.464437007904053, -5.073282718658447, -4.682127952575684, -4.290973663330078, -3.8998188972473145, -3.508664131164551, -3.117509603500366, -2.7263550758361816, -2.335200548171997, -1.944045901298523, -1.5528912544250488, -1.1617367267608643, -0.7705821990966797, -0.379427433013916, 0.011727094650268555, 0.4028816223144531, 0.7940362095832825, 1.1851907968521118, 1.576345443725586, 1.9674999713897705, 2.358654499053955, 2.7498092651367188, 3.1409637928009033, 3.532118320465088, 3.9232728481292725, 4.314427375793457, 4.705582141876221, 5.096736907958984, 5.48789119720459, 5.8790459632873535, 6.270200729370117, 6.661355018615723, 7.052509784698486, 7.443664073944092, 7.8348188400268555, 8.225973129272461, 8.617128372192383, 9.008282661437988, 9.399436950683594, 9.790592193603516, 10.181746482849121, 10.572901725769043, 10.964056015014648, 11.355210304260254, 11.74636459350586, 12.137519836425781, 12.528674125671387, 12.919828414916992]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 9.0, 4.0, 16.0, 16.0, 26.0, 28.0, 37.0, 55.0, 76.0, 129.0, 169.0, 238.0, 381.0, 722.0, 1201.0, 2250.0, 4220.0, 8947.0, 20436.0, 51196.0, 135708.0, 290831.0, 295448.0, 142065.0, 54191.0, 21313.0, 9190.0, 4361.0, 2169.0, 1195.0, 678.0, 408.0, 260.0, 176.0, 115.0, 81.0, 48.0, 40.0, 27.0, 36.0, 14.0, 11.0, 15.0, 9.0, 9.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-22.265625, -21.5703125, -20.875, -20.1796875, -19.484375, -18.7890625, -18.09375, -17.3984375, -16.703125, -16.0078125, -15.3125, -14.6171875, -13.921875, -13.2265625, -12.53125, -11.8359375, -11.140625, -10.4453125, -9.75, -9.0546875, -8.359375, -7.6640625, -6.96875, -6.2734375, -5.578125, -4.8828125, -4.1875, -3.4921875, -2.796875, -2.1015625, -1.40625, -0.7109375, -0.015625, 0.6796875, 1.375, 2.0703125, 2.765625, 3.4609375, 4.15625, 4.8515625, 5.546875, 6.2421875, 6.9375, 7.6328125, 8.328125, 9.0234375, 9.71875, 10.4140625, 11.109375, 11.8046875, 12.5, 13.1953125, 13.890625, 14.5859375, 15.28125, 15.9765625, 16.671875, 17.3671875, 18.0625, 18.7578125, 19.453125, 20.1484375, 20.84375, 21.5390625, 22.234375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 2.0, 5.0, 10.0, 14.0, 14.0, 18.0, 18.0, 29.0, 28.0, 29.0, 42.0, 29.0, 34.0, 49.0, 48.0, 46.0, 53.0, 52.0, 59.0, 74.0, 41.0, 36.0, 35.0, 40.0, 33.0, 30.0, 24.0, 19.0, 23.0, 19.0, 14.0, 7.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.36328125, -10.9765625, -10.58984375, -10.203125, -9.81640625, -9.4296875, -9.04296875, -8.65625, -8.26953125, -7.8828125, -7.49609375, -7.109375, -6.72265625, -6.3359375, -5.94921875, -5.5625, -5.17578125, -4.7890625, -4.40234375, -4.015625, -3.62890625, -3.2421875, -2.85546875, -2.46875, -2.08203125, -1.6953125, -1.30859375, -0.921875, -0.53515625, -0.1484375, 0.23828125, 0.625, 1.01171875, 1.3984375, 1.78515625, 2.171875, 2.55859375, 2.9453125, 3.33203125, 3.71875, 4.10546875, 4.4921875, 4.87890625, 5.265625, 5.65234375, 6.0390625, 6.42578125, 6.8125, 7.19921875, 7.5859375, 7.97265625, 8.359375, 8.74609375, 9.1328125, 9.51953125, 9.90625, 10.29296875, 10.6796875, 11.06640625, 11.453125, 11.83984375, 12.2265625, 12.61328125, 13.0]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 8.0, 16.0, 27.0, 32.0, 33.0, 65.0, 79.0, 142.0, 197.0, 288.0, 445.0, 649.0, 948.0, 1462.0, 2354.0, 3449.0, 5337.0, 8570.0, 13948.0, 23329.0, 39533.0, 65831.0, 108448.0, 159207.0, 184174.0, 157685.0, 107068.0, 65662.0, 38547.0, 23110.0, 13981.0, 8519.0, 5284.0, 3477.0, 2254.0, 1525.0, 920.0, 610.0, 444.0, 282.0, 191.0, 141.0, 86.0, 62.0, 36.0, 30.0, 20.0, 9.0, 11.0, 8.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.296875, -10.9381103515625, -10.579345703125, -10.2205810546875, -9.86181640625, -9.5030517578125, -9.144287109375, -8.7855224609375, -8.4267578125, -8.0679931640625, -7.709228515625, -7.3504638671875, -6.99169921875, -6.6329345703125, -6.274169921875, -5.9154052734375, -5.556640625, -5.1978759765625, -4.839111328125, -4.4803466796875, -4.12158203125, -3.7628173828125, -3.404052734375, -3.0452880859375, -2.6865234375, -2.3277587890625, -1.968994140625, -1.6102294921875, -1.25146484375, -0.8927001953125, -0.533935546875, -0.1751708984375, 0.18359375, 0.5423583984375, 0.901123046875, 1.2598876953125, 1.61865234375, 1.9774169921875, 2.336181640625, 2.6949462890625, 3.0537109375, 3.4124755859375, 3.771240234375, 4.1300048828125, 4.48876953125, 4.8475341796875, 5.206298828125, 5.5650634765625, 5.923828125, 6.2825927734375, 6.641357421875, 7.0001220703125, 7.35888671875, 7.7176513671875, 8.076416015625, 8.4351806640625, 8.7939453125, 9.1527099609375, 9.511474609375, 9.8702392578125, 10.22900390625, 10.5877685546875, 10.946533203125, 11.3052978515625, 11.6640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 6.0, 5.0, 11.0, 6.0, 19.0, 15.0, 29.0, 23.0, 24.0, 33.0, 36.0, 19.0, 40.0, 49.0, 39.0, 47.0, 34.0, 40.0, 50.0, 39.0, 41.0, 43.0, 36.0, 47.0, 26.0, 38.0, 34.0, 25.0, 22.0, 21.0, 12.0, 13.0, 20.0, 9.0, 5.0, 11.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-8.7109375, -8.47357177734375, -8.2362060546875, -7.99884033203125, -7.761474609375, -7.52410888671875, -7.2867431640625, -7.04937744140625, -6.81201171875, -6.57464599609375, -6.3372802734375, -6.09991455078125, -5.862548828125, -5.62518310546875, -5.3878173828125, -5.15045166015625, -4.9130859375, -4.67572021484375, -4.4383544921875, -4.20098876953125, -3.963623046875, -3.72625732421875, -3.4888916015625, -3.25152587890625, -3.01416015625, -2.77679443359375, -2.5394287109375, -2.30206298828125, -2.064697265625, -1.82733154296875, -1.5899658203125, -1.35260009765625, -1.115234375, -0.87786865234375, -0.6405029296875, -0.40313720703125, -0.165771484375, 0.07159423828125, 0.3089599609375, 0.54632568359375, 0.78369140625, 1.02105712890625, 1.2584228515625, 1.49578857421875, 1.733154296875, 1.97052001953125, 2.2078857421875, 2.44525146484375, 2.6826171875, 2.91998291015625, 3.1573486328125, 3.39471435546875, 3.632080078125, 3.86944580078125, 4.1068115234375, 4.34417724609375, 4.58154296875, 4.81890869140625, 5.0562744140625, 5.29364013671875, 5.531005859375, 5.76837158203125, 6.0057373046875, 6.24310302734375, 6.48046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 1.0, 2.0, 3.0, 6.0, 12.0, 17.0, 29.0, 31.0, 53.0, 111.0, 138.0, 194.0, 302.0, 472.0, 692.0, 1020.0, 1713.0, 2819.0, 4733.0, 8347.0, 15167.0, 28809.0, 56098.0, 116518.0, 234271.0, 271465.0, 153128.0, 72193.0, 35969.0, 18949.0, 10344.0, 5850.0, 3467.0, 2055.0, 1295.0, 810.0, 476.0, 330.0, 238.0, 136.0, 92.0, 70.0, 41.0, 29.0, 29.0, 9.0, 13.0, 4.0, 2.0, 4.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.2265625, -13.770263671875, -13.31396484375, -12.857666015625, -12.4013671875, -11.945068359375, -11.48876953125, -11.032470703125, -10.576171875, -10.119873046875, -9.66357421875, -9.207275390625, -8.7509765625, -8.294677734375, -7.83837890625, -7.382080078125, -6.92578125, -6.469482421875, -6.01318359375, -5.556884765625, -5.1005859375, -4.644287109375, -4.18798828125, -3.731689453125, -3.275390625, -2.819091796875, -2.36279296875, -1.906494140625, -1.4501953125, -0.993896484375, -0.53759765625, -0.081298828125, 0.375, 0.831298828125, 1.28759765625, 1.743896484375, 2.2001953125, 2.656494140625, 3.11279296875, 3.569091796875, 4.025390625, 4.481689453125, 4.93798828125, 5.394287109375, 5.8505859375, 6.306884765625, 6.76318359375, 7.219482421875, 7.67578125, 8.132080078125, 8.58837890625, 9.044677734375, 9.5009765625, 9.957275390625, 10.41357421875, 10.869873046875, 11.326171875, 11.782470703125, 12.23876953125, 12.695068359375, 13.1513671875, 13.607666015625, 14.06396484375, 14.520263671875, 14.9765625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 8.0, 9.0, 22.0, 41.0, 66.0, 119.0, 211.0, 191.0, 140.0, 75.0, 40.0, 28.0, 13.0, 12.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032520294189453125, -0.003156810998916626, -0.0030615925788879395, -0.002966374158859253, -0.0028711557388305664, -0.00277593731880188, -0.0026807188987731934, -0.002585500478744507, -0.0024902820587158203, -0.002395063638687134, -0.0022998452186584473, -0.0022046267986297607, -0.0021094083786010742, -0.0020141899585723877, -0.0019189715385437012, -0.0018237531185150146, -0.0017285346984863281, -0.0016333162784576416, -0.001538097858428955, -0.0014428794384002686, -0.001347661018371582, -0.0012524425983428955, -0.001157224178314209, -0.0010620057582855225, -0.0009667873382568359, -0.0008715689182281494, -0.0007763504981994629, -0.0006811320781707764, -0.0005859136581420898, -0.0004906952381134033, -0.0003954768180847168, -0.0003002583980560303, -0.00020503997802734375, -0.00010982155799865723, -1.4603137969970703e-05, 8.061528205871582e-05, 0.00017583370208740234, 0.00027105212211608887, 0.0003662705421447754, 0.0004614889621734619, 0.0005567073822021484, 0.000651925802230835, 0.0007471442222595215, 0.000842362642288208, 0.0009375810623168945, 0.001032799482345581, 0.0011280179023742676, 0.001223236322402954, 0.0013184547424316406, 0.0014136731624603271, 0.0015088915824890137, 0.0016041100025177002, 0.0016993284225463867, 0.0017945468425750732, 0.0018897652626037598, 0.0019849836826324463, 0.002080202102661133, 0.0021754205226898193, 0.002270638942718506, 0.0023658573627471924, 0.002461075782775879, 0.0025562942028045654, 0.002651512622833252, 0.0027467310428619385, 0.002841949462890625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 0.0, 4.0, 2.0, 5.0, 8.0, 7.0, 16.0, 24.0, 27.0, 34.0, 47.0, 76.0, 105.0, 147.0, 208.0, 320.0, 408.0, 695.0, 1043.0, 1670.0, 2823.0, 4781.0, 8687.0, 16421.0, 31078.0, 61176.0, 120849.0, 216285.0, 248167.0, 160613.0, 82283.0, 42082.0, 21088.0, 11492.0, 6227.0, 3683.0, 2118.0, 1304.0, 801.0, 574.0, 366.0, 240.0, 157.0, 132.0, 78.0, 76.0, 44.0, 30.0, 16.0, 14.0, 14.0, 8.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.4273681640625, -10.057861328125, -9.6883544921875, -9.31884765625, -8.9493408203125, -8.579833984375, -8.2103271484375, -7.8408203125, -7.4713134765625, -7.101806640625, -6.7322998046875, -6.36279296875, -5.9932861328125, -5.623779296875, -5.2542724609375, -4.884765625, -4.5152587890625, -4.145751953125, -3.7762451171875, -3.40673828125, -3.0372314453125, -2.667724609375, -2.2982177734375, -1.9287109375, -1.5592041015625, -1.189697265625, -0.8201904296875, -0.45068359375, -0.0811767578125, 0.288330078125, 0.6578369140625, 1.02734375, 1.3968505859375, 1.766357421875, 2.1358642578125, 2.50537109375, 2.8748779296875, 3.244384765625, 3.6138916015625, 3.9833984375, 4.3529052734375, 4.722412109375, 5.0919189453125, 5.46142578125, 5.8309326171875, 6.200439453125, 6.5699462890625, 6.939453125, 7.3089599609375, 7.678466796875, 8.0479736328125, 8.41748046875, 8.7869873046875, 9.156494140625, 9.5260009765625, 9.8955078125, 10.2650146484375, 10.634521484375, 11.0040283203125, 11.37353515625, 11.7430419921875, 12.112548828125, 12.4820556640625, 12.8515625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 7.0, 10.0, 14.0, 15.0, 15.0, 31.0, 26.0, 36.0, 30.0, 33.0, 59.0, 53.0, 66.0, 52.0, 65.0, 59.0, 57.0, 50.0, 50.0, 43.0, 41.0, 35.0, 28.0, 22.0, 16.0, 9.0, 12.0, 6.0, 9.0, 13.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.9578857421875, -3.814208984375, -3.6705322265625, -3.52685546875, -3.3831787109375, -3.239501953125, -3.0958251953125, -2.9521484375, -2.8084716796875, -2.664794921875, -2.5211181640625, -2.37744140625, -2.2337646484375, -2.090087890625, -1.9464111328125, -1.802734375, -1.6590576171875, -1.515380859375, -1.3717041015625, -1.22802734375, -1.0843505859375, -0.940673828125, -0.7969970703125, -0.6533203125, -0.5096435546875, -0.365966796875, -0.2222900390625, -0.07861328125, 0.0650634765625, 0.208740234375, 0.3524169921875, 0.49609375, 0.6397705078125, 0.783447265625, 0.9271240234375, 1.07080078125, 1.2144775390625, 1.358154296875, 1.5018310546875, 1.6455078125, 1.7891845703125, 1.932861328125, 2.0765380859375, 2.22021484375, 2.3638916015625, 2.507568359375, 2.6512451171875, 2.794921875, 2.9385986328125, 3.082275390625, 3.2259521484375, 3.36962890625, 3.5133056640625, 3.656982421875, 3.8006591796875, 3.9443359375, 4.0880126953125, 4.231689453125, 4.3753662109375, 4.51904296875, 4.6627197265625, 4.806396484375, 4.9500732421875, 5.09375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 8.0, 7.0, 13.0, 22.0, 27.0, 28.0, 39.0, 55.0, 72.0, 79.0, 81.0, 96.0, 92.0, 76.0, 73.0, 49.0, 43.0, 32.0, 29.0, 18.0, 11.0, 10.0, 7.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0], "bins": [-25.841167449951172, -25.240509033203125, -24.639850616455078, -24.03919219970703, -23.438533782958984, -22.837873458862305, -22.237215042114258, -21.63655662536621, -21.035898208618164, -20.435239791870117, -19.83458137512207, -19.233922958374023, -18.633262634277344, -18.032604217529297, -17.43194580078125, -16.831287384033203, -16.230628967285156, -15.62997055053711, -15.029312133789062, -14.4286527633667, -13.827994346618652, -13.227335929870605, -12.626676559448242, -12.026018142700195, -11.425359725952148, -10.824701309204102, -10.224042892456055, -9.623383522033691, -9.022725105285645, -8.422066688537598, -7.821407794952393, -7.2207489013671875, -6.620092391967773, -6.019433975219727, -5.4187750816345215, -4.818116188049316, -4.2174577713012695, -3.6167991161346436, -3.0161404609680176, -2.4154815673828125, -1.8148231506347656, -1.2141644954681396, -0.6135058403015137, -0.012847185134887695, 0.5878114700317383, 1.1884701251983643, 1.7891287803649902, 2.3897876739501953, 2.990446090698242, 3.591104745864868, 4.191763401031494, 4.792422294616699, 5.393080711364746, 5.993739128112793, 6.594398021697998, 7.195056915283203, 7.79571533203125, 8.396373748779297, 8.997032165527344, 9.597691535949707, 10.198349952697754, 10.7990083694458, 11.399667739868164, 12.000326156616211, 12.600984573364258]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 12.0, 12.0, 17.0, 19.0, 25.0, 24.0, 37.0, 37.0, 36.0, 36.0, 54.0, 46.0, 52.0, 54.0, 43.0, 53.0, 47.0, 37.0, 47.0, 41.0, 35.0, 32.0, 28.0, 30.0, 28.0, 17.0, 20.0, 13.0, 7.0, 14.0, 6.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.295372009277344, -9.920835494995117, -9.546298027038574, -9.171761512756348, -8.797224044799805, -8.422687530517578, -8.048151016235352, -7.673613548278809, -7.299076557159424, -6.924539566040039, -6.550002574920654, -6.1754655838012695, -5.800929069519043, -5.4263916015625, -5.051855087280273, -4.677318096160889, -4.302781105041504, -3.928244113922119, -3.5537071228027344, -3.1791703701019287, -2.804633378982544, -2.430096387863159, -2.0555596351623535, -1.6810226440429688, -1.306485652923584, -0.931948721408844, -0.557411789894104, -0.1828749179840088, 0.19166207313537598, 0.5661990642547607, 0.9407358169555664, 1.3152728080749512, 1.6898088455200195, 2.0643458366394043, 2.438882827758789, 2.8134195804595947, 3.1879565715789795, 3.5624935626983643, 3.93703031539917, 4.311567306518555, 4.6861042976379395, 5.060641288757324, 5.435178279876709, 5.809715270996094, 6.18425178527832, 6.558789253234863, 6.93332576751709, 7.307862758636475, 7.682399749755859, 8.056936264038086, 8.431473731994629, 8.806010246276855, 9.180547714233398, 9.555084228515625, 9.929620742797852, 10.304158210754395, 10.678695678710938, 11.053232192993164, 11.427769660949707, 11.802306175231934, 12.176843643188477, 12.551380157470703, 12.92591667175293, 13.300454139709473, 13.6749906539917]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 17.0, 32.0, 42.0, 61.0, 121.0, 171.0, 281.0, 432.0, 693.0, 1089.0, 1863.0, 2904.0, 4685.0, 8345.0, 15506.0, 31468.0, 73631.0, 198259.0, 585573.0, 1322488.0, 1198663.0, 470127.0, 156635.0, 59323.0, 27081.0, 13832.0, 7924.0, 4823.0, 2886.0, 1807.0, 1243.0, 733.0, 519.0, 349.0, 203.0, 137.0, 107.0, 61.0, 37.0, 26.0, 26.0, 12.0, 24.0, 8.0, 6.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.625, -12.1376953125, -11.650390625, -11.1630859375, -10.67578125, -10.1884765625, -9.701171875, -9.2138671875, -8.7265625, -8.2392578125, -7.751953125, -7.2646484375, -6.77734375, -6.2900390625, -5.802734375, -5.3154296875, -4.828125, -4.3408203125, -3.853515625, -3.3662109375, -2.87890625, -2.3916015625, -1.904296875, -1.4169921875, -0.9296875, -0.4423828125, 0.044921875, 0.5322265625, 1.01953125, 1.5068359375, 1.994140625, 2.4814453125, 2.96875, 3.4560546875, 3.943359375, 4.4306640625, 4.91796875, 5.4052734375, 5.892578125, 6.3798828125, 6.8671875, 7.3544921875, 7.841796875, 8.3291015625, 8.81640625, 9.3037109375, 9.791015625, 10.2783203125, 10.765625, 11.2529296875, 11.740234375, 12.2275390625, 12.71484375, 13.2021484375, 13.689453125, 14.1767578125, 14.6640625, 15.1513671875, 15.638671875, 16.1259765625, 16.61328125, 17.1005859375, 17.587890625, 18.0751953125, 18.5625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 7.0, 12.0, 26.0, 9.0, 21.0, 20.0, 19.0, 20.0, 38.0, 37.0, 41.0, 44.0, 47.0, 43.0, 55.0, 46.0, 59.0, 43.0, 44.0, 46.0, 34.0, 45.0, 34.0, 43.0, 30.0, 27.0, 19.0, 18.0, 16.0, 11.0, 12.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.60546875, -6.37115478515625, -6.1368408203125, -5.90252685546875, -5.668212890625, -5.43389892578125, -5.1995849609375, -4.96527099609375, -4.73095703125, -4.49664306640625, -4.2623291015625, -4.02801513671875, -3.793701171875, -3.55938720703125, -3.3250732421875, -3.09075927734375, -2.8564453125, -2.62213134765625, -2.3878173828125, -2.15350341796875, -1.919189453125, -1.68487548828125, -1.4505615234375, -1.21624755859375, -0.98193359375, -0.74761962890625, -0.5133056640625, -0.27899169921875, -0.044677734375, 0.18963623046875, 0.4239501953125, 0.65826416015625, 0.892578125, 1.12689208984375, 1.3612060546875, 1.59552001953125, 1.829833984375, 2.06414794921875, 2.2984619140625, 2.53277587890625, 2.76708984375, 3.00140380859375, 3.2357177734375, 3.47003173828125, 3.704345703125, 3.93865966796875, 4.1729736328125, 4.40728759765625, 4.6416015625, 4.87591552734375, 5.1102294921875, 5.34454345703125, 5.578857421875, 5.81317138671875, 6.0474853515625, 6.28179931640625, 6.51611328125, 6.75042724609375, 6.9847412109375, 7.21905517578125, 7.453369140625, 7.68768310546875, 7.9219970703125, 8.15631103515625, 8.390625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 15.0, 13.0, 12.0, 25.0, 28.0, 45.0, 59.0, 81.0, 121.0, 164.0, 220.0, 278.0, 436.0, 664.0, 920.0, 1384.0, 2090.0, 3160.0, 5056.0, 8349.0, 14509.0, 26638.0, 53499.0, 120344.0, 300798.0, 739296.0, 1237663.0, 949442.0, 416959.0, 163327.0, 69959.0, 33600.0, 17791.0, 10161.0, 6001.0, 3693.0, 2398.0, 1599.0, 1096.0, 696.0, 501.0, 352.0, 236.0, 157.0, 125.0, 82.0, 60.0, 51.0, 29.0, 29.0, 15.0, 13.0, 9.0, 14.0, 5.0, 2.0, 3.0, 5.0], "bins": [-13.8359375, -13.4124755859375, -12.989013671875, -12.5655517578125, -12.14208984375, -11.7186279296875, -11.295166015625, -10.8717041015625, -10.4482421875, -10.0247802734375, -9.601318359375, -9.1778564453125, -8.75439453125, -8.3309326171875, -7.907470703125, -7.4840087890625, -7.060546875, -6.6370849609375, -6.213623046875, -5.7901611328125, -5.36669921875, -4.9432373046875, -4.519775390625, -4.0963134765625, -3.6728515625, -3.2493896484375, -2.825927734375, -2.4024658203125, -1.97900390625, -1.5555419921875, -1.132080078125, -0.7086181640625, -0.28515625, 0.1383056640625, 0.561767578125, 0.9852294921875, 1.40869140625, 1.8321533203125, 2.255615234375, 2.6790771484375, 3.1025390625, 3.5260009765625, 3.949462890625, 4.3729248046875, 4.79638671875, 5.2198486328125, 5.643310546875, 6.0667724609375, 6.490234375, 6.9136962890625, 7.337158203125, 7.7606201171875, 8.18408203125, 8.6075439453125, 9.031005859375, 9.4544677734375, 9.8779296875, 10.3013916015625, 10.724853515625, 11.1483154296875, 11.57177734375, 11.9952392578125, 12.418701171875, 12.8421630859375, 13.265625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 7.0, 12.0, 9.0, 13.0, 17.0, 19.0, 39.0, 44.0, 38.0, 44.0, 63.0, 78.0, 91.0, 119.0, 164.0, 179.0, 219.0, 224.0, 292.0, 300.0, 322.0, 308.0, 284.0, 242.0, 231.0, 168.0, 123.0, 102.0, 76.0, 55.0, 43.0, 35.0, 29.0, 22.0, 13.0, 12.0, 6.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.97265625, -3.848297119140625, -3.72393798828125, -3.599578857421875, -3.4752197265625, -3.350860595703125, -3.22650146484375, -3.102142333984375, -2.977783203125, -2.853424072265625, -2.72906494140625, -2.604705810546875, -2.4803466796875, -2.355987548828125, -2.23162841796875, -2.107269287109375, -1.98291015625, -1.858551025390625, -1.73419189453125, -1.609832763671875, -1.4854736328125, -1.361114501953125, -1.23675537109375, -1.112396240234375, -0.988037109375, -0.863677978515625, -0.73931884765625, -0.614959716796875, -0.4906005859375, -0.366241455078125, -0.24188232421875, -0.117523193359375, 0.0068359375, 0.131195068359375, 0.25555419921875, 0.379913330078125, 0.5042724609375, 0.628631591796875, 0.75299072265625, 0.877349853515625, 1.001708984375, 1.126068115234375, 1.25042724609375, 1.374786376953125, 1.4991455078125, 1.623504638671875, 1.74786376953125, 1.872222900390625, 1.99658203125, 2.120941162109375, 2.24530029296875, 2.369659423828125, 2.4940185546875, 2.618377685546875, 2.74273681640625, 2.867095947265625, 2.991455078125, 3.115814208984375, 3.24017333984375, 3.364532470703125, 3.4888916015625, 3.613250732421875, 3.73760986328125, 3.861968994140625, 3.986328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 2.0, 5.0, 4.0, 8.0, 16.0, 21.0, 28.0, 24.0, 29.0, 38.0, 60.0, 95.0, 79.0, 95.0, 94.0, 81.0, 66.0, 62.0, 50.0, 38.0, 24.0, 17.0, 15.0, 14.0, 8.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.773818969726562, -19.277854919433594, -18.781892776489258, -18.28592872619629, -17.789966583251953, -17.294002532958984, -16.798038482666016, -16.30207633972168, -15.806112289428711, -15.310149192810059, -14.814186096191406, -14.318222045898438, -13.822258949279785, -13.326295852661133, -12.830331802368164, -12.334368705749512, -11.83840560913086, -11.342442512512207, -10.846479415893555, -10.350515365600586, -9.854552268981934, -9.358589172363281, -8.862625122070312, -8.36666202545166, -7.870698928833008, -7.3747358322143555, -6.878772258758545, -6.382808685302734, -5.886845588684082, -5.39088249206543, -4.894918918609619, -4.398955345153809, -3.90299129486084, -3.4070279598236084, -2.911064624786377, -2.4151012897491455, -1.919137954711914, -1.4231746196746826, -0.9272112846374512, -0.4312479496002197, 0.06471538543701172, 0.5606787204742432, 1.0566420555114746, 1.552605390548706, 2.0485687255859375, 2.544532060623169, 3.0404953956604004, 3.536458730697632, 4.032422065734863, 4.528385162353516, 5.024348735809326, 5.520312309265137, 6.016275405883789, 6.512238502502441, 7.008202075958252, 7.5041656494140625, 8.000128746032715, 8.496091842651367, 8.992055892944336, 9.488018989562988, 9.98398208618164, 10.479945182800293, 10.975908279418945, 11.471872329711914, 11.967835426330566]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 7.0, 3.0, 5.0, 11.0, 12.0, 14.0, 10.0, 28.0, 22.0, 23.0, 36.0, 32.0, 47.0, 37.0, 39.0, 59.0, 39.0, 50.0, 55.0, 35.0, 52.0, 50.0, 45.0, 43.0, 39.0, 31.0, 36.0, 26.0, 24.0, 23.0, 13.0, 15.0, 12.0, 11.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.06433391571045, -7.751862525939941, -7.439391136169434, -7.126920223236084, -6.814448833465576, -6.501977443695068, -6.189506530761719, -5.877035140991211, -5.564563751220703, -5.252092361450195, -4.9396209716796875, -4.627150058746338, -4.31467866897583, -4.002207279205322, -3.6897361278533936, -3.377264976501465, -3.064793586730957, -2.752322196960449, -2.4398510456085205, -2.127379894256592, -1.814908504486084, -1.5024372339248657, -1.1899659633636475, -0.8774948120117188, -0.5650234222412109, -0.2525521516799927, 0.059919118881225586, 0.37239038944244385, 0.6848616600036621, 0.9973329305648804, 1.3098042011260986, 1.6222753524780273, 1.9347476959228516, 2.2472190856933594, 2.559690237045288, 2.872161388397217, 3.1846327781677246, 3.4971041679382324, 3.809575319290161, 4.12204647064209, 4.434517860412598, 4.7469892501831055, 5.059460639953613, 5.371931552886963, 5.684402942657471, 5.9968743324279785, 6.309345245361328, 6.621816635131836, 6.934288024902344, 7.246759414672852, 7.559230804443359, 7.871701717376709, 8.184173583984375, 8.496644020080566, 8.809115409851074, 9.121586799621582, 9.43405818939209, 9.746529579162598, 10.059000968933105, 10.371472358703613, 10.683942794799805, 10.996414184570312, 11.30888557434082, 11.621356964111328, 11.933828353881836]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 6.0, 7.0, 6.0, 12.0, 22.0, 37.0, 56.0, 82.0, 165.0, 275.0, 466.0, 859.0, 1379.0, 2560.0, 4849.0, 9978.0, 20139.0, 42353.0, 89061.0, 173141.0, 250691.0, 215615.0, 121925.0, 58782.0, 27933.0, 13622.0, 6626.0, 3481.0, 1910.0, 1078.0, 579.0, 337.0, 213.0, 118.0, 63.0, 36.0, 27.0, 26.0, 14.0, 14.0, 5.0, 4.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.26171875, -6.0643310546875, -5.866943359375, -5.6695556640625, -5.47216796875, -5.2747802734375, -5.077392578125, -4.8800048828125, -4.6826171875, -4.4852294921875, -4.287841796875, -4.0904541015625, -3.89306640625, -3.6956787109375, -3.498291015625, -3.3009033203125, -3.103515625, -2.9061279296875, -2.708740234375, -2.5113525390625, -2.31396484375, -2.1165771484375, -1.919189453125, -1.7218017578125, -1.5244140625, -1.3270263671875, -1.129638671875, -0.9322509765625, -0.73486328125, -0.5374755859375, -0.340087890625, -0.1427001953125, 0.0546875, 0.2520751953125, 0.449462890625, 0.6468505859375, 0.84423828125, 1.0416259765625, 1.239013671875, 1.4364013671875, 1.6337890625, 1.8311767578125, 2.028564453125, 2.2259521484375, 2.42333984375, 2.6207275390625, 2.818115234375, 3.0155029296875, 3.212890625, 3.4102783203125, 3.607666015625, 3.8050537109375, 4.00244140625, 4.1998291015625, 4.397216796875, 4.5946044921875, 4.7919921875, 4.9893798828125, 5.186767578125, 5.3841552734375, 5.58154296875, 5.7789306640625, 5.976318359375, 6.1737060546875, 6.37109375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 6.0, 8.0, 10.0, 8.0, 13.0, 22.0, 17.0, 23.0, 21.0, 25.0, 29.0, 47.0, 44.0, 54.0, 38.0, 54.0, 54.0, 42.0, 57.0, 46.0, 60.0, 41.0, 40.0, 34.0, 38.0, 27.0, 29.0, 20.0, 21.0, 26.0, 12.0, 7.0, 5.0, 4.0, 5.0, 2.0, 4.0, 6.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.2431640625, -7.908203125, -7.5732421875, -7.23828125, -6.9033203125, -6.568359375, -6.2333984375, -5.8984375, -5.5634765625, -5.228515625, -4.8935546875, -4.55859375, -4.2236328125, -3.888671875, -3.5537109375, -3.21875, -2.8837890625, -2.548828125, -2.2138671875, -1.87890625, -1.5439453125, -1.208984375, -0.8740234375, -0.5390625, -0.2041015625, 0.130859375, 0.4658203125, 0.80078125, 1.1357421875, 1.470703125, 1.8056640625, 2.140625, 2.4755859375, 2.810546875, 3.1455078125, 3.48046875, 3.8154296875, 4.150390625, 4.4853515625, 4.8203125, 5.1552734375, 5.490234375, 5.8251953125, 6.16015625, 6.4951171875, 6.830078125, 7.1650390625, 7.5, 7.8349609375, 8.169921875, 8.5048828125, 8.83984375, 9.1748046875, 9.509765625, 9.8447265625, 10.1796875, 10.5146484375, 10.849609375, 11.1845703125, 11.51953125, 11.8544921875, 12.189453125, 12.5244140625, 12.859375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 9.0, 12.0, 17.0, 25.0, 38.0, 51.0, 78.0, 129.0, 180.0, 284.0, 433.0, 710.0, 1117.0, 1830.0, 2931.0, 5138.0, 8590.0, 15624.0, 29895.0, 57690.0, 114596.0, 206387.0, 249978.0, 167959.0, 87880.0, 44559.0, 22858.0, 12448.0, 6851.0, 3930.0, 2296.0, 1487.0, 917.0, 515.0, 346.0, 258.0, 164.0, 105.0, 84.0, 54.0, 23.0, 21.0, 19.0, 11.0, 14.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.23046875, -6.04339599609375, -5.8563232421875, -5.66925048828125, -5.482177734375, -5.29510498046875, -5.1080322265625, -4.92095947265625, -4.73388671875, -4.54681396484375, -4.3597412109375, -4.17266845703125, -3.985595703125, -3.79852294921875, -3.6114501953125, -3.42437744140625, -3.2373046875, -3.05023193359375, -2.8631591796875, -2.67608642578125, -2.489013671875, -2.30194091796875, -2.1148681640625, -1.92779541015625, -1.74072265625, -1.55364990234375, -1.3665771484375, -1.17950439453125, -0.992431640625, -0.80535888671875, -0.6182861328125, -0.43121337890625, -0.244140625, -0.05706787109375, 0.1300048828125, 0.31707763671875, 0.504150390625, 0.69122314453125, 0.8782958984375, 1.06536865234375, 1.25244140625, 1.43951416015625, 1.6265869140625, 1.81365966796875, 2.000732421875, 2.18780517578125, 2.3748779296875, 2.56195068359375, 2.7490234375, 2.93609619140625, 3.1231689453125, 3.31024169921875, 3.497314453125, 3.68438720703125, 3.8714599609375, 4.05853271484375, 4.24560546875, 4.43267822265625, 4.6197509765625, 4.80682373046875, 4.993896484375, 5.18096923828125, 5.3680419921875, 5.55511474609375, 5.7421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 6.0, 7.0, 12.0, 15.0, 12.0, 17.0, 11.0, 23.0, 13.0, 19.0, 24.0, 40.0, 37.0, 37.0, 24.0, 52.0, 53.0, 41.0, 46.0, 38.0, 38.0, 50.0, 36.0, 28.0, 30.0, 35.0, 39.0, 28.0, 21.0, 31.0, 18.0, 17.0, 14.0, 12.0, 16.0, 15.0, 12.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.328125, -5.1619873046875, -4.995849609375, -4.8297119140625, -4.66357421875, -4.4974365234375, -4.331298828125, -4.1651611328125, -3.9990234375, -3.8328857421875, -3.666748046875, -3.5006103515625, -3.33447265625, -3.1683349609375, -3.002197265625, -2.8360595703125, -2.669921875, -2.5037841796875, -2.337646484375, -2.1715087890625, -2.00537109375, -1.8392333984375, -1.673095703125, -1.5069580078125, -1.3408203125, -1.1746826171875, -1.008544921875, -0.8424072265625, -0.67626953125, -0.5101318359375, -0.343994140625, -0.1778564453125, -0.01171875, 0.1544189453125, 0.320556640625, 0.4866943359375, 0.65283203125, 0.8189697265625, 0.985107421875, 1.1512451171875, 1.3173828125, 1.4835205078125, 1.649658203125, 1.8157958984375, 1.98193359375, 2.1480712890625, 2.314208984375, 2.4803466796875, 2.646484375, 2.8126220703125, 2.978759765625, 3.1448974609375, 3.31103515625, 3.4771728515625, 3.643310546875, 3.8094482421875, 3.9755859375, 4.1417236328125, 4.307861328125, 4.4739990234375, 4.64013671875, 4.8062744140625, 4.972412109375, 5.1385498046875, 5.3046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 8.0, 7.0, 12.0, 16.0, 31.0, 50.0, 72.0, 112.0, 167.0, 245.0, 394.0, 487.0, 770.0, 1156.0, 1839.0, 2797.0, 4496.0, 7144.0, 11698.0, 19852.0, 34367.0, 61421.0, 109790.0, 187446.0, 229966.0, 160415.0, 90937.0, 50373.0, 28657.0, 16728.0, 10045.0, 6201.0, 3890.0, 2357.0, 1528.0, 1042.0, 633.0, 445.0, 325.0, 191.0, 136.0, 97.0, 66.0, 50.0, 39.0, 20.0, 14.0, 11.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-2.708984375, -2.625213623046875, -2.54144287109375, -2.457672119140625, -2.3739013671875, -2.290130615234375, -2.20635986328125, -2.122589111328125, -2.038818359375, -1.955047607421875, -1.87127685546875, -1.787506103515625, -1.7037353515625, -1.619964599609375, -1.53619384765625, -1.452423095703125, -1.36865234375, -1.284881591796875, -1.20111083984375, -1.117340087890625, -1.0335693359375, -0.949798583984375, -0.86602783203125, -0.782257080078125, -0.698486328125, -0.614715576171875, -0.53094482421875, -0.447174072265625, -0.3634033203125, -0.279632568359375, -0.19586181640625, -0.112091064453125, -0.0283203125, 0.055450439453125, 0.13922119140625, 0.222991943359375, 0.3067626953125, 0.390533447265625, 0.47430419921875, 0.558074951171875, 0.641845703125, 0.725616455078125, 0.80938720703125, 0.893157958984375, 0.9769287109375, 1.060699462890625, 1.14447021484375, 1.228240966796875, 1.31201171875, 1.395782470703125, 1.47955322265625, 1.563323974609375, 1.6470947265625, 1.730865478515625, 1.81463623046875, 1.898406982421875, 1.982177734375, 2.065948486328125, 2.14971923828125, 2.233489990234375, 2.3172607421875, 2.401031494140625, 2.48480224609375, 2.568572998046875, 2.65234375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 5.0, 8.0, 17.0, 20.0, 26.0, 32.0, 26.0, 32.0, 44.0, 58.0, 52.0, 76.0, 72.0, 77.0, 73.0, 77.0, 70.0, 51.0, 47.0, 27.0, 26.0, 23.0, 13.0, 12.0, 9.0, 4.0, 3.0, 5.0, 1.0, 4.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013399124145507812, -0.00012907013297080994, -0.00012414902448654175, -0.00011922791600227356, -0.00011430680751800537, -0.00010938569903373718, -0.000104464590549469, -9.95434820652008e-05, -9.462237358093262e-05, -8.970126509666443e-05, -8.478015661239624e-05, -7.985904812812805e-05, -7.493793964385986e-05, -7.001683115959167e-05, -6.509572267532349e-05, -6.01746141910553e-05, -5.525350570678711e-05, -5.033239722251892e-05, -4.541128873825073e-05, -4.0490180253982544e-05, -3.5569071769714355e-05, -3.064796328544617e-05, -2.572685480117798e-05, -2.080574631690979e-05, -1.58846378326416e-05, -1.0963529348373413e-05, -6.042420864105225e-06, -1.1213123798370361e-06, 3.7997961044311523e-06, 8.72090458869934e-06, 1.364201307296753e-05, 1.8563121557235718e-05, 2.3484230041503906e-05, 2.8405338525772095e-05, 3.332644701004028e-05, 3.824755549430847e-05, 4.316866397857666e-05, 4.808977246284485e-05, 5.301088094711304e-05, 5.7931989431381226e-05, 6.285309791564941e-05, 6.77742063999176e-05, 7.269531488418579e-05, 7.761642336845398e-05, 8.253753185272217e-05, 8.745864033699036e-05, 9.237974882125854e-05, 9.730085730552673e-05, 0.00010222196578979492, 0.00010714307427406311, 0.0001120641827583313, 0.00011698529124259949, 0.00012190639972686768, 0.00012682750821113586, 0.00013174861669540405, 0.00013666972517967224, 0.00014159083366394043, 0.00014651194214820862, 0.0001514330506324768, 0.000156354159116745, 0.00016127526760101318, 0.00016619637608528137, 0.00017111748456954956, 0.00017603859305381775, 0.00018095970153808594]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 3.0, 6.0, 6.0, 8.0, 17.0, 20.0, 22.0, 46.0, 42.0, 61.0, 89.0, 124.0, 178.0, 255.0, 346.0, 489.0, 782.0, 1096.0, 1629.0, 2572.0, 4186.0, 7087.0, 11940.0, 21176.0, 38071.0, 69708.0, 125017.0, 193593.0, 211403.0, 154513.0, 89675.0, 48628.0, 27048.0, 15170.0, 8678.0, 5340.0, 3238.0, 2067.0, 1293.0, 887.0, 603.0, 403.0, 298.0, 211.0, 142.0, 102.0, 74.0, 63.0, 39.0, 32.0, 19.0, 26.0, 11.0, 9.0, 6.0, 7.0, 6.0, 1.0, 4.0, 2.0, 2.0], "bins": [-2.58984375, -2.506866455078125, -2.42388916015625, -2.340911865234375, -2.2579345703125, -2.174957275390625, -2.09197998046875, -2.009002685546875, -1.926025390625, -1.843048095703125, -1.76007080078125, -1.677093505859375, -1.5941162109375, -1.511138916015625, -1.42816162109375, -1.345184326171875, -1.26220703125, -1.179229736328125, -1.09625244140625, -1.013275146484375, -0.9302978515625, -0.847320556640625, -0.76434326171875, -0.681365966796875, -0.598388671875, -0.515411376953125, -0.43243408203125, -0.349456787109375, -0.2664794921875, -0.183502197265625, -0.10052490234375, -0.017547607421875, 0.0654296875, 0.148406982421875, 0.23138427734375, 0.314361572265625, 0.3973388671875, 0.480316162109375, 0.56329345703125, 0.646270751953125, 0.729248046875, 0.812225341796875, 0.89520263671875, 0.978179931640625, 1.0611572265625, 1.144134521484375, 1.22711181640625, 1.310089111328125, 1.39306640625, 1.476043701171875, 1.55902099609375, 1.641998291015625, 1.7249755859375, 1.807952880859375, 1.89093017578125, 1.973907470703125, 2.056884765625, 2.139862060546875, 2.22283935546875, 2.305816650390625, 2.3887939453125, 2.471771240234375, 2.55474853515625, 2.637725830078125, 2.720703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 6.0, 7.0, 7.0, 17.0, 16.0, 18.0, 28.0, 32.0, 46.0, 43.0, 49.0, 44.0, 50.0, 59.0, 70.0, 65.0, 70.0, 63.0, 48.0, 37.0, 36.0, 34.0, 27.0, 26.0, 18.0, 14.0, 11.0, 14.0, 5.0, 3.0, 3.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.953125, -0.920989990234375, -0.88885498046875, -0.856719970703125, -0.8245849609375, -0.792449951171875, -0.76031494140625, -0.728179931640625, -0.696044921875, -0.663909912109375, -0.63177490234375, -0.599639892578125, -0.5675048828125, -0.535369873046875, -0.50323486328125, -0.471099853515625, -0.43896484375, -0.406829833984375, -0.37469482421875, -0.342559814453125, -0.3104248046875, -0.278289794921875, -0.24615478515625, -0.214019775390625, -0.181884765625, -0.149749755859375, -0.11761474609375, -0.085479736328125, -0.0533447265625, -0.021209716796875, 0.01092529296875, 0.043060302734375, 0.0751953125, 0.107330322265625, 0.13946533203125, 0.171600341796875, 0.2037353515625, 0.235870361328125, 0.26800537109375, 0.300140380859375, 0.332275390625, 0.364410400390625, 0.39654541015625, 0.428680419921875, 0.4608154296875, 0.492950439453125, 0.52508544921875, 0.557220458984375, 0.58935546875, 0.621490478515625, 0.65362548828125, 0.685760498046875, 0.7178955078125, 0.750030517578125, 0.78216552734375, 0.814300537109375, 0.846435546875, 0.878570556640625, 0.91070556640625, 0.942840576171875, 0.9749755859375, 1.007110595703125, 1.03924560546875, 1.071380615234375, 1.103515625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 3.0, 11.0, 15.0, 15.0, 29.0, 17.0, 34.0, 39.0, 53.0, 77.0, 76.0, 89.0, 84.0, 94.0, 73.0, 56.0, 49.0, 48.0, 32.0, 19.0, 17.0, 13.0, 18.0, 9.0, 7.0, 1.0, 6.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.91670036315918, -18.446056365966797, -17.975412368774414, -17.504770278930664, -17.03412628173828, -16.5634822845459, -16.092838287353516, -15.62219524383545, -15.151552200317383, -14.680908203125, -14.210265159606934, -13.73962116241455, -13.268978118896484, -12.798334121704102, -12.327690124511719, -11.857047080993652, -11.38640308380127, -10.915759086608887, -10.44511604309082, -9.974472045898438, -9.503829002380371, -9.033185005187988, -8.562541961669922, -8.091897964477539, -7.6212544441223145, -7.15061092376709, -6.679967403411865, -6.209323883056641, -5.738679885864258, -5.268036842346191, -4.797392845153809, -4.326749324798584, -3.856106758117676, -3.385463237762451, -2.9148197174072266, -2.444175958633423, -1.9735324382781982, -1.5028889179229736, -1.03224515914917, -0.5616016387939453, -0.0909581184387207, 0.3796854615211487, 0.8503290414810181, 1.3209726810455322, 1.7916162014007568, 2.2622597217559814, 2.732903480529785, 3.2035470008850098, 3.6741905212402344, 4.144834041595459, 4.615477561950684, 5.086121559143066, 5.556764602661133, 6.027408599853516, 6.49805212020874, 6.968695640563965, 7.4393391609191895, 7.909982681274414, 8.380626678466797, 8.851269721984863, 9.321913719177246, 9.792556762695312, 10.263200759887695, 10.733844757080078, 11.204487800598145]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 9.0, 12.0, 11.0, 26.0, 14.0, 24.0, 33.0, 30.0, 42.0, 32.0, 41.0, 52.0, 52.0, 44.0, 42.0, 44.0, 42.0, 52.0, 51.0, 42.0, 42.0, 36.0, 31.0, 36.0, 19.0, 25.0, 19.0, 22.0, 12.0, 12.0, 14.0, 4.0, 5.0, 1.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.915238380432129, -7.616649150848389, -7.31805944442749, -7.01947021484375, -6.720880508422852, -6.422291278839111, -6.123702049255371, -5.825112342834473, -5.526523113250732, -5.227933883666992, -4.929344177246094, -4.6307549476623535, -4.332165718078613, -4.033576011657715, -3.7349867820739746, -3.4363973140716553, -3.137807846069336, -2.8392183780670166, -2.5406289100646973, -2.242039680480957, -1.9434502124786377, -1.6448607444763184, -1.3462713956832886, -1.0476820468902588, -0.7490925788879395, -0.4505031704902649, -0.15191376209259033, 0.14667564630508423, 0.4452650547027588, 0.7438545227050781, 1.042443871498108, 1.3410332202911377, 1.6396217346191406, 1.93821120262146, 2.2368006706237793, 2.5353899002075195, 2.833979368209839, 3.132568836212158, 3.4311580657958984, 3.7297475337982178, 4.028337001800537, 4.326926231384277, 4.625515937805176, 4.924105167388916, 5.222694396972656, 5.521284103393555, 5.819873332977295, 6.118462562561035, 6.417052268981934, 6.715641498565674, 7.014231204986572, 7.3128204345703125, 7.611410140991211, 7.909999370574951, 8.208588600158691, 8.50717830657959, 8.805767059326172, 9.10435676574707, 9.402945518493652, 9.70153522491455, 10.00012493133545, 10.298713684082031, 10.59730339050293, 10.895893096923828, 11.194482803344727]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 16.0, 17.0, 22.0, 39.0, 61.0, 77.0, 106.0, 168.0, 212.0, 339.0, 510.0, 822.0, 1365.0, 2355.0, 4180.0, 7801.0, 15534.0, 30372.0, 63036.0, 127715.0, 222245.0, 245273.0, 161568.0, 82468.0, 40066.0, 19482.0, 9901.0, 5306.0, 2975.0, 1685.0, 977.0, 636.0, 377.0, 284.0, 172.0, 112.0, 89.0, 53.0, 46.0, 22.0, 15.0, 9.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.34375, -13.9114990234375, -13.479248046875, -13.0469970703125, -12.61474609375, -12.1824951171875, -11.750244140625, -11.3179931640625, -10.8857421875, -10.4534912109375, -10.021240234375, -9.5889892578125, -9.15673828125, -8.7244873046875, -8.292236328125, -7.8599853515625, -7.427734375, -6.9954833984375, -6.563232421875, -6.1309814453125, -5.69873046875, -5.2664794921875, -4.834228515625, -4.4019775390625, -3.9697265625, -3.5374755859375, -3.105224609375, -2.6729736328125, -2.24072265625, -1.8084716796875, -1.376220703125, -0.9439697265625, -0.51171875, -0.0794677734375, 0.352783203125, 0.7850341796875, 1.21728515625, 1.6495361328125, 2.081787109375, 2.5140380859375, 2.9462890625, 3.3785400390625, 3.810791015625, 4.2430419921875, 4.67529296875, 5.1075439453125, 5.539794921875, 5.9720458984375, 6.404296875, 6.8365478515625, 7.268798828125, 7.7010498046875, 8.13330078125, 8.5655517578125, 8.997802734375, 9.4300537109375, 9.8623046875, 10.2945556640625, 10.726806640625, 11.1590576171875, 11.59130859375, 12.0235595703125, 12.455810546875, 12.8880615234375, 13.3203125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 4.0, 9.0, 13.0, 17.0, 21.0, 20.0, 22.0, 19.0, 26.0, 31.0, 38.0, 33.0, 39.0, 51.0, 38.0, 50.0, 38.0, 54.0, 44.0, 49.0, 46.0, 33.0, 44.0, 29.0, 25.0, 31.0, 35.0, 15.0, 20.0, 17.0, 15.0, 20.0, 8.0, 6.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.22882080078125, -6.9537353515625, -6.67864990234375, -6.403564453125, -6.12847900390625, -5.8533935546875, -5.57830810546875, -5.30322265625, -5.02813720703125, -4.7530517578125, -4.47796630859375, -4.202880859375, -3.92779541015625, -3.6527099609375, -3.37762451171875, -3.1025390625, -2.82745361328125, -2.5523681640625, -2.27728271484375, -2.002197265625, -1.72711181640625, -1.4520263671875, -1.17694091796875, -0.90185546875, -0.62677001953125, -0.3516845703125, -0.07659912109375, 0.198486328125, 0.47357177734375, 0.7486572265625, 1.02374267578125, 1.298828125, 1.57391357421875, 1.8489990234375, 2.12408447265625, 2.399169921875, 2.67425537109375, 2.9493408203125, 3.22442626953125, 3.49951171875, 3.77459716796875, 4.0496826171875, 4.32476806640625, 4.599853515625, 4.87493896484375, 5.1500244140625, 5.42510986328125, 5.7001953125, 5.97528076171875, 6.2503662109375, 6.52545166015625, 6.800537109375, 7.07562255859375, 7.3507080078125, 7.62579345703125, 7.90087890625, 8.17596435546875, 8.4510498046875, 8.72613525390625, 9.001220703125, 9.27630615234375, 9.5513916015625, 9.82647705078125, 10.1015625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 16.0, 20.0, 24.0, 29.0, 49.0, 66.0, 110.0, 121.0, 207.0, 366.0, 572.0, 834.0, 1457.0, 2435.0, 4351.0, 7806.0, 14861.0, 30503.0, 65238.0, 136089.0, 235478.0, 248071.0, 153392.0, 74359.0, 34994.0, 17006.0, 8631.0, 4684.0, 2604.0, 1607.0, 956.0, 550.0, 382.0, 231.0, 129.0, 89.0, 72.0, 41.0, 30.0, 25.0, 20.0, 14.0, 6.0, 8.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-14.1484375, -13.7208251953125, -13.293212890625, -12.8656005859375, -12.43798828125, -12.0103759765625, -11.582763671875, -11.1551513671875, -10.7275390625, -10.2999267578125, -9.872314453125, -9.4447021484375, -9.01708984375, -8.5894775390625, -8.161865234375, -7.7342529296875, -7.306640625, -6.8790283203125, -6.451416015625, -6.0238037109375, -5.59619140625, -5.1685791015625, -4.740966796875, -4.3133544921875, -3.8857421875, -3.4581298828125, -3.030517578125, -2.6029052734375, -2.17529296875, -1.7476806640625, -1.320068359375, -0.8924560546875, -0.46484375, -0.0372314453125, 0.390380859375, 0.8179931640625, 1.24560546875, 1.6732177734375, 2.100830078125, 2.5284423828125, 2.9560546875, 3.3836669921875, 3.811279296875, 4.2388916015625, 4.66650390625, 5.0941162109375, 5.521728515625, 5.9493408203125, 6.376953125, 6.8045654296875, 7.232177734375, 7.6597900390625, 8.08740234375, 8.5150146484375, 8.942626953125, 9.3702392578125, 9.7978515625, 10.2254638671875, 10.653076171875, 11.0806884765625, 11.50830078125, 11.9359130859375, 12.363525390625, 12.7911376953125, 13.21875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 7.0, 8.0, 13.0, 21.0, 18.0, 21.0, 32.0, 22.0, 38.0, 39.0, 41.0, 47.0, 40.0, 47.0, 61.0, 58.0, 46.0, 47.0, 46.0, 46.0, 41.0, 42.0, 40.0, 40.0, 23.0, 20.0, 17.0, 16.0, 8.0, 13.0, 9.0, 4.0, 9.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.76348876953125, -5.5543212890625, -5.34515380859375, -5.135986328125, -4.92681884765625, -4.7176513671875, -4.50848388671875, -4.29931640625, -4.09014892578125, -3.8809814453125, -3.67181396484375, -3.462646484375, -3.25347900390625, -3.0443115234375, -2.83514404296875, -2.6259765625, -2.41680908203125, -2.2076416015625, -1.99847412109375, -1.789306640625, -1.58013916015625, -1.3709716796875, -1.16180419921875, -0.95263671875, -0.74346923828125, -0.5343017578125, -0.32513427734375, -0.115966796875, 0.09320068359375, 0.3023681640625, 0.51153564453125, 0.720703125, 0.92987060546875, 1.1390380859375, 1.34820556640625, 1.557373046875, 1.76654052734375, 1.9757080078125, 2.18487548828125, 2.39404296875, 2.60321044921875, 2.8123779296875, 3.02154541015625, 3.230712890625, 3.43988037109375, 3.6490478515625, 3.85821533203125, 4.0673828125, 4.27655029296875, 4.4857177734375, 4.69488525390625, 4.904052734375, 5.11322021484375, 5.3223876953125, 5.53155517578125, 5.74072265625, 5.94989013671875, 6.1590576171875, 6.36822509765625, 6.577392578125, 6.78656005859375, 6.9957275390625, 7.20489501953125, 7.4140625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 9.0, 15.0, 19.0, 20.0, 29.0, 52.0, 57.0, 93.0, 125.0, 206.0, 285.0, 381.0, 587.0, 823.0, 1340.0, 1933.0, 3023.0, 4672.0, 7564.0, 12540.0, 21208.0, 37520.0, 68896.0, 126420.0, 205030.0, 219139.0, 148047.0, 81190.0, 43976.0, 24822.0, 14380.0, 8794.0, 5252.0, 3437.0, 2204.0, 1408.0, 955.0, 636.0, 422.0, 329.0, 219.0, 150.0, 115.0, 68.0, 46.0, 47.0, 29.0, 14.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-8.3046875, -8.0379638671875, -7.771240234375, -7.5045166015625, -7.23779296875, -6.9710693359375, -6.704345703125, -6.4376220703125, -6.1708984375, -5.9041748046875, -5.637451171875, -5.3707275390625, -5.10400390625, -4.8372802734375, -4.570556640625, -4.3038330078125, -4.037109375, -3.7703857421875, -3.503662109375, -3.2369384765625, -2.97021484375, -2.7034912109375, -2.436767578125, -2.1700439453125, -1.9033203125, -1.6365966796875, -1.369873046875, -1.1031494140625, -0.83642578125, -0.5697021484375, -0.302978515625, -0.0362548828125, 0.23046875, 0.4971923828125, 0.763916015625, 1.0306396484375, 1.29736328125, 1.5640869140625, 1.830810546875, 2.0975341796875, 2.3642578125, 2.6309814453125, 2.897705078125, 3.1644287109375, 3.43115234375, 3.6978759765625, 3.964599609375, 4.2313232421875, 4.498046875, 4.7647705078125, 5.031494140625, 5.2982177734375, 5.56494140625, 5.8316650390625, 6.098388671875, 6.3651123046875, 6.6318359375, 6.8985595703125, 7.165283203125, 7.4320068359375, 7.69873046875, 7.9654541015625, 8.232177734375, 8.4989013671875, 8.765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 4.0, 7.0, 11.0, 8.0, 12.0, 18.0, 10.0, 32.0, 28.0, 67.0, 74.0, 84.0, 77.0, 105.0, 97.0, 76.0, 73.0, 68.0, 47.0, 31.0, 29.0, 13.0, 3.0, 7.0, 8.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013284683227539062, -0.001292213797569275, -0.0012559592723846436, -0.0012197047472000122, -0.0011834502220153809, -0.0011471956968307495, -0.0011109411716461182, -0.0010746866464614868, -0.0010384321212768555, -0.0010021775960922241, -0.0009659230709075928, -0.0009296685457229614, -0.0008934140205383301, -0.0008571594953536987, -0.0008209049701690674, -0.000784650444984436, -0.0007483959197998047, -0.0007121413946151733, -0.000675886869430542, -0.0006396323442459106, -0.0006033778190612793, -0.000567123293876648, -0.0005308687686920166, -0.0004946142435073853, -0.0004583597183227539, -0.00042210519313812256, -0.0003858506679534912, -0.00034959614276885986, -0.0003133416175842285, -0.00027708709239959717, -0.00024083256721496582, -0.00020457804203033447, -0.00016832351684570312, -0.00013206899166107178, -9.581446647644043e-05, -5.955994129180908e-05, -2.3305416107177734e-05, 1.2949109077453613e-05, 4.920363426208496e-05, 8.545815944671631e-05, 0.00012171268463134766, 0.000157967209815979, 0.00019422173500061035, 0.0002304762601852417, 0.00026673078536987305, 0.0003029853105545044, 0.00033923983573913574, 0.0003754943609237671, 0.00041174888610839844, 0.0004480034112930298, 0.00048425793647766113, 0.0005205124616622925, 0.0005567669868469238, 0.0005930215120315552, 0.0006292760372161865, 0.0006655305624008179, 0.0007017850875854492, 0.0007380396127700806, 0.0007742941379547119, 0.0008105486631393433, 0.0008468031883239746, 0.000883057713508606, 0.0009193122386932373, 0.0009555667638778687, 0.0009918212890625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 5.0, 5.0, 10.0, 10.0, 18.0, 16.0, 37.0, 49.0, 63.0, 83.0, 115.0, 150.0, 231.0, 272.0, 404.0, 595.0, 887.0, 1265.0, 1804.0, 2687.0, 4326.0, 6681.0, 10943.0, 18730.0, 33817.0, 61366.0, 111070.0, 179707.0, 214825.0, 167832.0, 100293.0, 54776.0, 30140.0, 17298.0, 9919.0, 6269.0, 3803.0, 2497.0, 1667.0, 1161.0, 761.0, 584.0, 413.0, 283.0, 207.0, 138.0, 113.0, 78.0, 47.0, 39.0, 23.0, 20.0, 11.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-7.28515625, -7.06036376953125, -6.8355712890625, -6.61077880859375, -6.385986328125, -6.16119384765625, -5.9364013671875, -5.71160888671875, -5.48681640625, -5.26202392578125, -5.0372314453125, -4.81243896484375, -4.587646484375, -4.36285400390625, -4.1380615234375, -3.91326904296875, -3.6884765625, -3.46368408203125, -3.2388916015625, -3.01409912109375, -2.789306640625, -2.56451416015625, -2.3397216796875, -2.11492919921875, -1.89013671875, -1.66534423828125, -1.4405517578125, -1.21575927734375, -0.990966796875, -0.76617431640625, -0.5413818359375, -0.31658935546875, -0.091796875, 0.13299560546875, 0.3577880859375, 0.58258056640625, 0.807373046875, 1.03216552734375, 1.2569580078125, 1.48175048828125, 1.70654296875, 1.93133544921875, 2.1561279296875, 2.38092041015625, 2.605712890625, 2.83050537109375, 3.0552978515625, 3.28009033203125, 3.5048828125, 3.72967529296875, 3.9544677734375, 4.17926025390625, 4.404052734375, 4.62884521484375, 4.8536376953125, 5.07843017578125, 5.30322265625, 5.52801513671875, 5.7528076171875, 5.97760009765625, 6.202392578125, 6.42718505859375, 6.6519775390625, 6.87677001953125, 7.1015625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 4.0, 11.0, 7.0, 11.0, 12.0, 12.0, 19.0, 25.0, 36.0, 51.0, 50.0, 63.0, 75.0, 64.0, 78.0, 95.0, 83.0, 56.0, 44.0, 39.0, 26.0, 26.0, 23.0, 12.0, 21.0, 17.0, 7.0, 6.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.0625, -3.94134521484375, -3.8201904296875, -3.69903564453125, -3.577880859375, -3.45672607421875, -3.3355712890625, -3.21441650390625, -3.09326171875, -2.97210693359375, -2.8509521484375, -2.72979736328125, -2.608642578125, -2.48748779296875, -2.3663330078125, -2.24517822265625, -2.1240234375, -2.00286865234375, -1.8817138671875, -1.76055908203125, -1.639404296875, -1.51824951171875, -1.3970947265625, -1.27593994140625, -1.15478515625, -1.03363037109375, -0.9124755859375, -0.79132080078125, -0.670166015625, -0.54901123046875, -0.4278564453125, -0.30670166015625, -0.185546875, -0.06439208984375, 0.0567626953125, 0.17791748046875, 0.299072265625, 0.42022705078125, 0.5413818359375, 0.66253662109375, 0.78369140625, 0.90484619140625, 1.0260009765625, 1.14715576171875, 1.268310546875, 1.38946533203125, 1.5106201171875, 1.63177490234375, 1.7529296875, 1.87408447265625, 1.9952392578125, 2.11639404296875, 2.237548828125, 2.35870361328125, 2.4798583984375, 2.60101318359375, 2.72216796875, 2.84332275390625, 2.9644775390625, 3.08563232421875, 3.206787109375, 3.32794189453125, 3.4490966796875, 3.57025146484375, 3.69140625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 10.0, 11.0, 11.0, 20.0, 32.0, 33.0, 37.0, 65.0, 69.0, 90.0, 89.0, 97.0, 88.0, 69.0, 65.0, 55.0, 40.0, 26.0, 23.0, 16.0, 17.0, 6.0, 2.0, 5.0, 3.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-21.103822708129883, -20.61128044128418, -20.118736267089844, -19.62619400024414, -19.133651733398438, -18.641109466552734, -18.1485652923584, -17.656023025512695, -17.163480758666992, -16.67093849182129, -16.178394317626953, -15.68585205078125, -15.193309783935547, -14.700766563415527, -14.208223342895508, -13.715681076049805, -13.223136901855469, -12.73059368133545, -12.238051414489746, -11.745508193969727, -11.252965927124023, -10.760422706604004, -10.267879486083984, -9.775337219238281, -9.282794952392578, -8.790251731872559, -8.297709465026855, -7.805166244506836, -7.312623500823975, -6.820080757141113, -6.327538013458252, -5.834995269775391, -5.342452049255371, -4.84990930557251, -4.357366561889648, -3.864823579788208, -3.3722805976867676, -2.8797378540039062, -2.387195110321045, -1.8946521282196045, -1.4021093845367432, -0.9095665216445923, -0.4170237183570862, 0.07551908493041992, 0.5680619478225708, 1.0606048107147217, 1.553147554397583, 2.0456905364990234, 2.5382332801818848, 3.030776023864746, 3.5233190059661865, 4.015861511230469, 4.508404731750488, 5.00094747543335, 5.493490219116211, 5.9860334396362305, 6.478575706481934, 6.971118450164795, 7.463661193847656, 7.956204414367676, 8.448746681213379, 8.941289901733398, 9.433832168579102, 9.926375389099121, 10.41891860961914]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 7.0, 9.0, 12.0, 9.0, 29.0, 17.0, 42.0, 36.0, 29.0, 50.0, 42.0, 55.0, 51.0, 43.0, 60.0, 56.0, 52.0, 54.0, 46.0, 42.0, 42.0, 33.0, 33.0, 27.0, 25.0, 25.0, 19.0, 5.0, 14.0, 2.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.959763526916504, -7.626382827758789, -7.293002605438232, -6.959622383117676, -6.626241683959961, -6.292860984802246, -5.9594807624816895, -5.626100540161133, -5.292719841003418, -4.959339141845703, -4.6259589195251465, -4.29257869720459, -3.959197998046875, -3.6258175373077393, -3.2924370765686035, -2.9590566158294678, -2.625676155090332, -2.2922956943511963, -1.9589152336120605, -1.6255347728729248, -1.292154312133789, -0.9587738513946533, -0.6253933906555176, -0.29201292991638184, 0.041367530822753906, 0.37474799156188965, 0.7081284523010254, 1.0415089130401611, 1.3748893737792969, 1.7082698345184326, 2.0416502952575684, 2.375030755996704, 2.7084102630615234, 3.041790723800659, 3.375171184539795, 3.7085516452789307, 4.041932106018066, 4.375312805175781, 4.708693027496338, 5.0420732498168945, 5.375453948974609, 5.708834648132324, 6.042214870452881, 6.3755950927734375, 6.708975791931152, 7.042356491088867, 7.375736713409424, 7.7091169357299805, 8.042497634887695, 8.37587833404541, 8.709259033203125, 9.042638778686523, 9.376019477844238, 9.709400177001953, 10.042779922485352, 10.376160621643066, 10.709541320800781, 11.042922019958496, 11.376302719116211, 11.70968246459961, 12.043063163757324, 12.376443862915039, 12.709823608398438, 13.043204307556152, 13.376585006713867]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 17.0, 17.0, 27.0, 56.0, 96.0, 138.0, 233.0, 452.0, 793.0, 1408.0, 2541.0, 4609.0, 9246.0, 20977.0, 55162.0, 184988.0, 759341.0, 1785325.0, 1004664.0, 244679.0, 68288.0, 25350.0, 11690.0, 6073.0, 3291.0, 1918.0, 1096.0, 671.0, 390.0, 238.0, 163.0, 104.0, 82.0, 42.0, 32.0, 15.0, 20.0, 11.0, 17.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -12.9139404296875, -12.366943359375, -11.8199462890625, -11.27294921875, -10.7259521484375, -10.178955078125, -9.6319580078125, -9.0849609375, -8.5379638671875, -7.990966796875, -7.4439697265625, -6.89697265625, -6.3499755859375, -5.802978515625, -5.2559814453125, -4.708984375, -4.1619873046875, -3.614990234375, -3.0679931640625, -2.52099609375, -1.9739990234375, -1.427001953125, -0.8800048828125, -0.3330078125, 0.2139892578125, 0.760986328125, 1.3079833984375, 1.85498046875, 2.4019775390625, 2.948974609375, 3.4959716796875, 4.04296875, 4.5899658203125, 5.136962890625, 5.6839599609375, 6.23095703125, 6.7779541015625, 7.324951171875, 7.8719482421875, 8.4189453125, 8.9659423828125, 9.512939453125, 10.0599365234375, 10.60693359375, 11.1539306640625, 11.700927734375, 12.2479248046875, 12.794921875, 13.3419189453125, 13.888916015625, 14.4359130859375, 14.98291015625, 15.5299072265625, 16.076904296875, 16.6239013671875, 17.1708984375, 17.7178955078125, 18.264892578125, 18.8118896484375, 19.35888671875, 19.9058837890625, 20.452880859375, 20.9998779296875, 21.546875]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 2.0, 2.0, 7.0, 9.0, 9.0, 19.0, 11.0, 13.0, 14.0, 23.0, 39.0, 37.0, 24.0, 36.0, 50.0, 35.0, 59.0, 52.0, 46.0, 51.0, 57.0, 40.0, 53.0, 47.0, 48.0, 32.0, 23.0, 24.0, 25.0, 21.0, 21.0, 15.0, 21.0, 10.0, 9.0, 6.0, 3.0, 3.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.61785888671875, -5.4036865234375, -5.18951416015625, -4.975341796875, -4.76116943359375, -4.5469970703125, -4.33282470703125, -4.11865234375, -3.90447998046875, -3.6903076171875, -3.47613525390625, -3.261962890625, -3.04779052734375, -2.8336181640625, -2.61944580078125, -2.4052734375, -2.19110107421875, -1.9769287109375, -1.76275634765625, -1.548583984375, -1.33441162109375, -1.1202392578125, -0.90606689453125, -0.69189453125, -0.47772216796875, -0.2635498046875, -0.04937744140625, 0.164794921875, 0.37896728515625, 0.5931396484375, 0.80731201171875, 1.021484375, 1.23565673828125, 1.4498291015625, 1.66400146484375, 1.878173828125, 2.09234619140625, 2.3065185546875, 2.52069091796875, 2.73486328125, 2.94903564453125, 3.1632080078125, 3.37738037109375, 3.591552734375, 3.80572509765625, 4.0198974609375, 4.23406982421875, 4.4482421875, 4.66241455078125, 4.8765869140625, 5.09075927734375, 5.304931640625, 5.51910400390625, 5.7332763671875, 5.94744873046875, 6.16162109375, 6.37579345703125, 6.5899658203125, 6.80413818359375, 7.018310546875, 7.23248291015625, 7.4466552734375, 7.66082763671875, 7.875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 9.0, 13.0, 11.0, 21.0, 24.0, 42.0, 60.0, 91.0, 126.0, 225.0, 279.0, 423.0, 707.0, 1015.0, 1593.0, 2438.0, 4033.0, 6499.0, 11341.0, 20916.0, 42291.0, 98135.0, 264602.0, 750351.0, 1408421.0, 974687.0, 361524.0, 130288.0, 54245.0, 25694.0, 13824.0, 7870.0, 4606.0, 2857.0, 1691.0, 1153.0, 723.0, 463.0, 381.0, 190.0, 138.0, 93.0, 59.0, 42.0, 22.0, 30.0, 15.0, 5.0, 10.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9296875, -12.5078125, -12.0859375, -11.6640625, -11.2421875, -10.8203125, -10.3984375, -9.9765625, -9.5546875, -9.1328125, -8.7109375, -8.2890625, -7.8671875, -7.4453125, -7.0234375, -6.6015625, -6.1796875, -5.7578125, -5.3359375, -4.9140625, -4.4921875, -4.0703125, -3.6484375, -3.2265625, -2.8046875, -2.3828125, -1.9609375, -1.5390625, -1.1171875, -0.6953125, -0.2734375, 0.1484375, 0.5703125, 0.9921875, 1.4140625, 1.8359375, 2.2578125, 2.6796875, 3.1015625, 3.5234375, 3.9453125, 4.3671875, 4.7890625, 5.2109375, 5.6328125, 6.0546875, 6.4765625, 6.8984375, 7.3203125, 7.7421875, 8.1640625, 8.5859375, 9.0078125, 9.4296875, 9.8515625, 10.2734375, 10.6953125, 11.1171875, 11.5390625, 11.9609375, 12.3828125, 12.8046875, 13.2265625, 13.6484375, 14.0703125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 13.0, 12.0, 13.0, 23.0, 28.0, 29.0, 35.0, 31.0, 69.0, 73.0, 91.0, 135.0, 183.0, 214.0, 258.0, 281.0, 342.0, 359.0, 327.0, 281.0, 285.0, 235.0, 198.0, 135.0, 98.0, 71.0, 53.0, 47.0, 33.0, 17.0, 24.0, 13.0, 9.0, 14.0, 6.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53515625, -3.4158935546875, -3.296630859375, -3.1773681640625, -3.05810546875, -2.9388427734375, -2.819580078125, -2.7003173828125, -2.5810546875, -2.4617919921875, -2.342529296875, -2.2232666015625, -2.10400390625, -1.9847412109375, -1.865478515625, -1.7462158203125, -1.626953125, -1.5076904296875, -1.388427734375, -1.2691650390625, -1.14990234375, -1.0306396484375, -0.911376953125, -0.7921142578125, -0.6728515625, -0.5535888671875, -0.434326171875, -0.3150634765625, -0.19580078125, -0.0765380859375, 0.042724609375, 0.1619873046875, 0.28125, 0.4005126953125, 0.519775390625, 0.6390380859375, 0.75830078125, 0.8775634765625, 0.996826171875, 1.1160888671875, 1.2353515625, 1.3546142578125, 1.473876953125, 1.5931396484375, 1.71240234375, 1.8316650390625, 1.950927734375, 2.0701904296875, 2.189453125, 2.3087158203125, 2.427978515625, 2.5472412109375, 2.66650390625, 2.7857666015625, 2.905029296875, 3.0242919921875, 3.1435546875, 3.2628173828125, 3.382080078125, 3.5013427734375, 3.62060546875, 3.7398681640625, 3.859130859375, 3.9783935546875, 4.09765625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 2.0, 7.0, 8.0, 7.0, 20.0, 15.0, 34.0, 37.0, 64.0, 76.0, 92.0, 100.0, 131.0, 108.0, 87.0, 52.0, 49.0, 33.0, 36.0, 14.0, 7.0, 5.0, 10.0, 2.0, 2.0, 8.0, 1.0, 2.0], "bins": [-27.16619300842285, -26.602209091186523, -26.038225173950195, -25.4742431640625, -24.910259246826172, -24.346275329589844, -23.782291412353516, -23.218307495117188, -22.65432357788086, -22.09033966064453, -21.526355743408203, -20.962371826171875, -20.39838981628418, -19.83440589904785, -19.270421981811523, -18.706438064575195, -18.1424560546875, -17.578472137451172, -17.014488220214844, -16.450504302978516, -15.886521339416504, -15.322538375854492, -14.758554458618164, -14.194570541381836, -13.630586624145508, -13.06660270690918, -12.502619743347168, -11.93863582611084, -11.374651908874512, -10.8106689453125, -10.246685028076172, -9.682701110839844, -9.118718147277832, -8.554734230041504, -7.990750789642334, -7.426767349243164, -6.862783432006836, -6.298799991607666, -5.734816551208496, -5.170832633972168, -4.606849193572998, -4.042865753173828, -3.4788818359375, -2.91489839553833, -2.350914716720581, -1.786931037902832, -1.222947597503662, -0.6589639186859131, -0.09498023986816406, 0.4690033793449402, 1.0329869985580444, 1.596970558166504, 2.160954236984253, 2.724937915802002, 3.288921356201172, 3.852905035018921, 4.41688871383667, 4.98087215423584, 5.544856071472168, 6.108839511871338, 6.672822952270508, 7.236806869506836, 7.800790309906006, 8.364773750305176, 8.928757667541504]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 4.0, 2.0, 7.0, 12.0, 9.0, 23.0, 22.0, 12.0, 40.0, 38.0, 40.0, 43.0, 36.0, 38.0, 45.0, 43.0, 43.0, 46.0, 38.0, 54.0, 43.0, 42.0, 43.0, 37.0, 35.0, 36.0, 34.0, 22.0, 22.0, 21.0, 14.0, 13.0, 6.0, 9.0, 8.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.928322792053223, -6.660472393035889, -6.3926215171813965, -6.1247711181640625, -5.8569207191467285, -5.5890703201293945, -5.321219444274902, -5.053369045257568, -4.785518646240234, -4.5176682472229, -4.249817371368408, -3.981966972351074, -3.7141165733337402, -3.446265935897827, -3.178415298461914, -2.91056489944458, -2.642714023590088, -2.374863386154175, -2.107012987136841, -1.8391623497009277, -1.5713118314743042, -1.3034613132476807, -1.0356106758117676, -0.767760157585144, -0.4999096393585205, -0.23205909132957458, 0.03579145669937134, 0.30364203453063965, 0.5714925527572632, 0.8393430709838867, 1.1071937084197998, 1.3750442266464233, 1.6428947448730469, 1.9107452630996704, 2.178595781326294, 2.446446418762207, 2.714296817779541, 2.982147455215454, 3.249998092651367, 3.517848491668701, 3.7856991291046143, 4.053549766540527, 4.321400165557861, 4.589250564575195, 4.8571014404296875, 5.1249518394470215, 5.3928022384643555, 5.660653114318848, 5.928503513336182, 6.196353912353516, 6.464204788208008, 6.732055187225342, 6.999905586242676, 7.267756462097168, 7.535606861114502, 7.803457260131836, 8.071308135986328, 8.33915901184082, 8.607008934020996, 8.874859809875488, 9.14271068572998, 9.410560607910156, 9.678411483764648, 9.94626235961914, 10.214112281799316]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 3.0, 4.0, 4.0, 11.0, 11.0, 16.0, 24.0, 43.0, 51.0, 67.0, 95.0, 128.0, 247.0, 291.0, 502.0, 683.0, 1069.0, 1573.0, 2775.0, 4581.0, 8499.0, 16815.0, 34681.0, 76604.0, 164416.0, 268300.0, 233550.0, 122469.0, 55753.0, 25693.0, 12724.0, 6691.0, 3871.0, 2252.0, 1361.0, 856.0, 569.0, 388.0, 271.0, 210.0, 130.0, 76.0, 54.0, 55.0, 29.0, 20.0, 15.0, 8.0, 7.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.671875, -6.46844482421875, -6.2650146484375, -6.06158447265625, -5.858154296875, -5.65472412109375, -5.4512939453125, -5.24786376953125, -5.04443359375, -4.84100341796875, -4.6375732421875, -4.43414306640625, -4.230712890625, -4.02728271484375, -3.8238525390625, -3.62042236328125, -3.4169921875, -3.21356201171875, -3.0101318359375, -2.80670166015625, -2.603271484375, -2.39984130859375, -2.1964111328125, -1.99298095703125, -1.78955078125, -1.58612060546875, -1.3826904296875, -1.17926025390625, -0.975830078125, -0.77239990234375, -0.5689697265625, -0.36553955078125, -0.162109375, 0.04132080078125, 0.2447509765625, 0.44818115234375, 0.651611328125, 0.85504150390625, 1.0584716796875, 1.26190185546875, 1.46533203125, 1.66876220703125, 1.8721923828125, 2.07562255859375, 2.279052734375, 2.48248291015625, 2.6859130859375, 2.88934326171875, 3.0927734375, 3.29620361328125, 3.4996337890625, 3.70306396484375, 3.906494140625, 4.10992431640625, 4.3133544921875, 4.51678466796875, 4.72021484375, 4.92364501953125, 5.1270751953125, 5.33050537109375, 5.533935546875, 5.73736572265625, 5.9407958984375, 6.14422607421875, 6.34765625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 5.0, 3.0, 4.0, 12.0, 14.0, 16.0, 30.0, 16.0, 27.0, 28.0, 33.0, 43.0, 28.0, 29.0, 55.0, 53.0, 37.0, 44.0, 49.0, 44.0, 43.0, 45.0, 35.0, 38.0, 24.0, 34.0, 28.0, 40.0, 25.0, 23.0, 17.0, 20.0, 10.0, 6.0, 7.0, 2.0, 8.0, 1.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.296875, -7.031982421875, -6.76708984375, -6.502197265625, -6.2373046875, -5.972412109375, -5.70751953125, -5.442626953125, -5.177734375, -4.912841796875, -4.64794921875, -4.383056640625, -4.1181640625, -3.853271484375, -3.58837890625, -3.323486328125, -3.05859375, -2.793701171875, -2.52880859375, -2.263916015625, -1.9990234375, -1.734130859375, -1.46923828125, -1.204345703125, -0.939453125, -0.674560546875, -0.40966796875, -0.144775390625, 0.1201171875, 0.385009765625, 0.64990234375, 0.914794921875, 1.1796875, 1.444580078125, 1.70947265625, 1.974365234375, 2.2392578125, 2.504150390625, 2.76904296875, 3.033935546875, 3.298828125, 3.563720703125, 3.82861328125, 4.093505859375, 4.3583984375, 4.623291015625, 4.88818359375, 5.153076171875, 5.41796875, 5.682861328125, 5.94775390625, 6.212646484375, 6.4775390625, 6.742431640625, 7.00732421875, 7.272216796875, 7.537109375, 7.802001953125, 8.06689453125, 8.331787109375, 8.5966796875, 8.861572265625, 9.12646484375, 9.391357421875, 9.65625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 11.0, 23.0, 32.0, 39.0, 48.0, 65.0, 105.0, 141.0, 211.0, 330.0, 468.0, 797.0, 1249.0, 2088.0, 3933.0, 7563.0, 16684.0, 41342.0, 117416.0, 310971.0, 331507.0, 131268.0, 45780.0, 18216.0, 8173.0, 4146.0, 2296.0, 1289.0, 784.0, 477.0, 310.0, 230.0, 157.0, 100.0, 80.0, 60.0, 36.0, 38.0, 25.0, 20.0, 10.0, 9.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.165771484375, -7.89404296875, -7.622314453125, -7.3505859375, -7.078857421875, -6.80712890625, -6.535400390625, -6.263671875, -5.991943359375, -5.72021484375, -5.448486328125, -5.1767578125, -4.905029296875, -4.63330078125, -4.361572265625, -4.08984375, -3.818115234375, -3.54638671875, -3.274658203125, -3.0029296875, -2.731201171875, -2.45947265625, -2.187744140625, -1.916015625, -1.644287109375, -1.37255859375, -1.100830078125, -0.8291015625, -0.557373046875, -0.28564453125, -0.013916015625, 0.2578125, 0.529541015625, 0.80126953125, 1.072998046875, 1.3447265625, 1.616455078125, 1.88818359375, 2.159912109375, 2.431640625, 2.703369140625, 2.97509765625, 3.246826171875, 3.5185546875, 3.790283203125, 4.06201171875, 4.333740234375, 4.60546875, 4.877197265625, 5.14892578125, 5.420654296875, 5.6923828125, 5.964111328125, 6.23583984375, 6.507568359375, 6.779296875, 7.051025390625, 7.32275390625, 7.594482421875, 7.8662109375, 8.137939453125, 8.40966796875, 8.681396484375, 8.953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 5.0, 12.0, 14.0, 12.0, 17.0, 26.0, 26.0, 26.0, 29.0, 47.0, 27.0, 36.0, 31.0, 49.0, 38.0, 44.0, 47.0, 55.0, 40.0, 43.0, 49.0, 51.0, 30.0, 27.0, 33.0, 21.0, 21.0, 24.0, 22.0, 21.0, 11.0, 5.0, 13.0, 5.0, 4.0, 8.0, 3.0, 4.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.8880615234375, -4.733154296875, -4.5782470703125, -4.42333984375, -4.2684326171875, -4.113525390625, -3.9586181640625, -3.8037109375, -3.6488037109375, -3.493896484375, -3.3389892578125, -3.18408203125, -3.0291748046875, -2.874267578125, -2.7193603515625, -2.564453125, -2.4095458984375, -2.254638671875, -2.0997314453125, -1.94482421875, -1.7899169921875, -1.635009765625, -1.4801025390625, -1.3251953125, -1.1702880859375, -1.015380859375, -0.8604736328125, -0.70556640625, -0.5506591796875, -0.395751953125, -0.2408447265625, -0.0859375, 0.0689697265625, 0.223876953125, 0.3787841796875, 0.53369140625, 0.6885986328125, 0.843505859375, 0.9984130859375, 1.1533203125, 1.3082275390625, 1.463134765625, 1.6180419921875, 1.77294921875, 1.9278564453125, 2.082763671875, 2.2376708984375, 2.392578125, 2.5474853515625, 2.702392578125, 2.8572998046875, 3.01220703125, 3.1671142578125, 3.322021484375, 3.4769287109375, 3.6318359375, 3.7867431640625, 3.941650390625, 4.0965576171875, 4.25146484375, 4.4063720703125, 4.561279296875, 4.7161865234375, 4.87109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 7.0, 4.0, 10.0, 10.0, 15.0, 31.0, 34.0, 47.0, 65.0, 102.0, 145.0, 189.0, 299.0, 419.0, 556.0, 875.0, 1296.0, 1842.0, 2930.0, 4738.0, 8068.0, 13717.0, 24765.0, 46898.0, 92712.0, 184641.0, 271072.0, 188673.0, 95111.0, 47937.0, 25217.0, 14065.0, 8047.0, 4913.0, 3034.0, 1928.0, 1295.0, 869.0, 594.0, 414.0, 278.0, 189.0, 164.0, 99.0, 85.0, 52.0, 26.0, 29.0, 19.0, 16.0, 7.0, 7.0, 8.0, 3.0, 0.0, 2.0, 2.0], "bins": [-2.888671875, -2.802490234375, -2.71630859375, -2.630126953125, -2.5439453125, -2.457763671875, -2.37158203125, -2.285400390625, -2.19921875, -2.113037109375, -2.02685546875, -1.940673828125, -1.8544921875, -1.768310546875, -1.68212890625, -1.595947265625, -1.509765625, -1.423583984375, -1.33740234375, -1.251220703125, -1.1650390625, -1.078857421875, -0.99267578125, -0.906494140625, -0.8203125, -0.734130859375, -0.64794921875, -0.561767578125, -0.4755859375, -0.389404296875, -0.30322265625, -0.217041015625, -0.130859375, -0.044677734375, 0.04150390625, 0.127685546875, 0.2138671875, 0.300048828125, 0.38623046875, 0.472412109375, 0.55859375, 0.644775390625, 0.73095703125, 0.817138671875, 0.9033203125, 0.989501953125, 1.07568359375, 1.161865234375, 1.248046875, 1.334228515625, 1.42041015625, 1.506591796875, 1.5927734375, 1.678955078125, 1.76513671875, 1.851318359375, 1.9375, 2.023681640625, 2.10986328125, 2.196044921875, 2.2822265625, 2.368408203125, 2.45458984375, 2.540771484375, 2.626953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 3.0, 9.0, 17.0, 17.0, 35.0, 50.0, 79.0, 109.0, 147.0, 135.0, 133.0, 78.0, 45.0, 37.0, 19.0, 21.0, 13.0, 10.0, 6.0, 7.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00033473968505859375, -0.00032637640833854675, -0.00031801313161849976, -0.00030964985489845276, -0.00030128657817840576, -0.00029292330145835876, -0.00028456002473831177, -0.00027619674801826477, -0.0002678334712982178, -0.0002594701945781708, -0.0002511069178581238, -0.00024274364113807678, -0.00023438036441802979, -0.0002260170876979828, -0.0002176538109779358, -0.0002092905342578888, -0.0002009272575378418, -0.0001925639808177948, -0.0001842007040977478, -0.0001758374273777008, -0.0001674741506576538, -0.0001591108739376068, -0.00015074759721755981, -0.00014238432049751282, -0.00013402104377746582, -0.00012565776705741882, -0.00011729449033737183, -0.00010893121361732483, -0.00010056793689727783, -9.220466017723083e-05, -8.384138345718384e-05, -7.547810673713684e-05, -6.711483001708984e-05, -5.875155329704285e-05, -5.038827657699585e-05, -4.202499985694885e-05, -3.3661723136901855e-05, -2.529844641685486e-05, -1.693516969680786e-05, -8.571892976760864e-06, -2.086162567138672e-07, 8.15466046333313e-06, 1.6517937183380127e-05, 2.4881213903427124e-05, 3.324449062347412e-05, 4.160776734352112e-05, 4.9971044063568115e-05, 5.833432078361511e-05, 6.669759750366211e-05, 7.50608742237091e-05, 8.34241509437561e-05, 9.17874276638031e-05, 0.0001001507043838501, 0.0001085139811038971, 0.00011687725782394409, 0.0001252405345439911, 0.00013360381126403809, 0.00014196708798408508, 0.00015033036470413208, 0.00015869364142417908, 0.00016705691814422607, 0.00017542019486427307, 0.00018378347158432007, 0.00019214674830436707, 0.00020051002502441406]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 8.0, 13.0, 19.0, 22.0, 28.0, 37.0, 55.0, 89.0, 134.0, 190.0, 257.0, 389.0, 636.0, 1064.0, 1683.0, 2857.0, 4840.0, 8473.0, 15461.0, 29517.0, 58471.0, 116942.0, 207675.0, 245904.0, 169182.0, 89026.0, 44298.0, 22551.0, 11964.0, 6690.0, 3979.0, 2253.0, 1355.0, 858.0, 550.0, 365.0, 219.0, 138.0, 109.0, 79.0, 51.0, 35.0, 23.0, 14.0, 10.0, 12.0, 9.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.470367431640625, -2.38604736328125, -2.301727294921875, -2.2174072265625, -2.133087158203125, -2.04876708984375, -1.964447021484375, -1.880126953125, -1.795806884765625, -1.71148681640625, -1.627166748046875, -1.5428466796875, -1.458526611328125, -1.37420654296875, -1.289886474609375, -1.20556640625, -1.121246337890625, -1.03692626953125, -0.952606201171875, -0.8682861328125, -0.783966064453125, -0.69964599609375, -0.615325927734375, -0.531005859375, -0.446685791015625, -0.36236572265625, -0.278045654296875, -0.1937255859375, -0.109405517578125, -0.02508544921875, 0.059234619140625, 0.1435546875, 0.227874755859375, 0.31219482421875, 0.396514892578125, 0.4808349609375, 0.565155029296875, 0.64947509765625, 0.733795166015625, 0.818115234375, 0.902435302734375, 0.98675537109375, 1.071075439453125, 1.1553955078125, 1.239715576171875, 1.32403564453125, 1.408355712890625, 1.49267578125, 1.576995849609375, 1.66131591796875, 1.745635986328125, 1.8299560546875, 1.914276123046875, 1.99859619140625, 2.082916259765625, 2.167236328125, 2.251556396484375, 2.33587646484375, 2.420196533203125, 2.5045166015625, 2.588836669921875, 2.67315673828125, 2.757476806640625, 2.841796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 4.0, 8.0, 11.0, 8.0, 13.0, 14.0, 12.0, 20.0, 19.0, 47.0, 39.0, 54.0, 43.0, 56.0, 50.0, 64.0, 74.0, 71.0, 70.0, 58.0, 43.0, 42.0, 35.0, 37.0, 19.0, 18.0, 12.0, 12.0, 14.0, 7.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.984375, -0.9542999267578125, -0.924224853515625, -0.8941497802734375, -0.86407470703125, -0.8339996337890625, -0.803924560546875, -0.7738494873046875, -0.7437744140625, -0.7136993408203125, -0.683624267578125, -0.6535491943359375, -0.62347412109375, -0.5933990478515625, -0.563323974609375, -0.5332489013671875, -0.503173828125, -0.4730987548828125, -0.443023681640625, -0.4129486083984375, -0.38287353515625, -0.3527984619140625, -0.322723388671875, -0.2926483154296875, -0.2625732421875, -0.2324981689453125, -0.202423095703125, -0.1723480224609375, -0.14227294921875, -0.1121978759765625, -0.082122802734375, -0.0520477294921875, -0.02197265625, 0.0081024169921875, 0.038177490234375, 0.0682525634765625, 0.09832763671875, 0.1284027099609375, 0.158477783203125, 0.1885528564453125, 0.2186279296875, 0.2487030029296875, 0.278778076171875, 0.3088531494140625, 0.33892822265625, 0.3690032958984375, 0.399078369140625, 0.4291534423828125, 0.459228515625, 0.4893035888671875, 0.519378662109375, 0.5494537353515625, 0.57952880859375, 0.6096038818359375, 0.639678955078125, 0.6697540283203125, 0.6998291015625, 0.7299041748046875, 0.759979248046875, 0.7900543212890625, 0.82012939453125, 0.8502044677734375, 0.880279541015625, 0.9103546142578125, 0.9404296875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 8.0, 11.0, 9.0, 16.0, 37.0, 29.0, 51.0, 71.0, 87.0, 100.0, 113.0, 112.0, 93.0, 67.0, 54.0, 35.0, 37.0, 23.0, 13.0, 8.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0], "bins": [-25.433486938476562, -24.898591995239258, -24.363698959350586, -23.82880401611328, -23.293909072875977, -22.759014129638672, -22.22412109375, -21.689226150512695, -21.15433120727539, -20.619436264038086, -20.084543228149414, -19.54964828491211, -19.014753341674805, -18.4798583984375, -17.944965362548828, -17.410070419311523, -16.87517547607422, -16.340280532836914, -15.805386543273926, -15.270492553710938, -14.735597610473633, -14.200703620910645, -13.665809631347656, -13.130914688110352, -12.59602165222168, -12.061127662658691, -11.526232719421387, -10.991338729858398, -10.456443786621094, -9.921549797058105, -9.386655807495117, -8.851760864257812, -8.316866874694824, -7.781972408294678, -7.247077941894531, -6.712183952331543, -6.177289009094238, -5.64239501953125, -5.1075005531311035, -4.572606086730957, -4.0377116203308105, -3.502817153930664, -2.9679226875305176, -2.43302845954895, -1.8981339931488037, -1.3632395267486572, -0.8283452987670898, -0.29345083236694336, 0.24144363403320312, 0.7763380408287048, 1.3112324476242065, 1.8461267948150635, 2.38102126121521, 2.9159157276153564, 3.450809955596924, 3.9857044219970703, 4.520598888397217, 5.055493354797363, 5.59038782119751, 6.125282287597656, 6.6601762771606445, 7.195071220397949, 7.7299652099609375, 8.264860153198242, 8.79975414276123]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 6.0, 1.0, 7.0, 7.0, 14.0, 20.0, 22.0, 18.0, 24.0, 47.0, 36.0, 43.0, 34.0, 40.0, 34.0, 56.0, 47.0, 35.0, 49.0, 43.0, 44.0, 43.0, 42.0, 37.0, 46.0, 29.0, 37.0, 23.0, 26.0, 11.0, 22.0, 13.0, 7.0, 11.0, 4.0, 5.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.845996856689453, -6.58424711227417, -6.3224968910217285, -6.060747146606445, -5.798996925354004, -5.537247180938721, -5.2754974365234375, -5.013747215270996, -4.751996994018555, -4.4902472496032715, -4.22849702835083, -3.966747283935547, -3.7049970626831055, -3.4432473182678223, -3.18149733543396, -2.9197473526000977, -2.6579976081848145, -2.396247625350952, -2.13449764251709, -1.872747778892517, -1.6109977960586548, -1.3492478132247925, -1.0874979496002197, -0.8257479667663574, -0.5639979839324951, -0.3022480309009552, -0.04049807786941528, 0.22125184535980225, 0.48300182819366455, 0.7447518110275269, 1.0065016746520996, 1.268251657485962, 1.5300016403198242, 1.7917516231536865, 2.053501605987549, 2.315251350402832, 2.5770015716552734, 2.8387513160705566, 3.100501298904419, 3.3622512817382812, 3.6240012645721436, 3.885751247406006, 4.147500991821289, 4.4092512130737305, 4.671000957489014, 4.932751178741455, 5.194500923156738, 5.45625114440918, 5.718000888824463, 5.979750633239746, 6.2415008544921875, 6.503250598907471, 6.765000820159912, 7.026750564575195, 7.288500785827637, 7.55025053024292, 7.812000274658203, 8.073750495910645, 8.33549976348877, 8.597249984741211, 8.859000205993652, 9.120750427246094, 9.382499694824219, 9.64424991607666, 9.906000137329102]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 8.0, 18.0, 24.0, 25.0, 61.0, 71.0, 111.0, 181.0, 248.0, 418.0, 677.0, 1051.0, 1732.0, 3022.0, 5077.0, 9310.0, 16698.0, 30940.0, 59182.0, 108461.0, 175261.0, 213872.0, 177737.0, 111084.0, 61038.0, 32403.0, 17479.0, 9371.0, 5291.0, 2876.0, 1767.0, 1105.0, 760.0, 396.0, 271.0, 169.0, 126.0, 62.0, 44.0, 38.0, 31.0, 13.0, 7.0, 10.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.45361328125, -8.1572265625, -7.86083984375, -7.564453125, -7.26806640625, -6.9716796875, -6.67529296875, -6.37890625, -6.08251953125, -5.7861328125, -5.48974609375, -5.193359375, -4.89697265625, -4.6005859375, -4.30419921875, -4.0078125, -3.71142578125, -3.4150390625, -3.11865234375, -2.822265625, -2.52587890625, -2.2294921875, -1.93310546875, -1.63671875, -1.34033203125, -1.0439453125, -0.74755859375, -0.451171875, -0.15478515625, 0.1416015625, 0.43798828125, 0.734375, 1.03076171875, 1.3271484375, 1.62353515625, 1.919921875, 2.21630859375, 2.5126953125, 2.80908203125, 3.10546875, 3.40185546875, 3.6982421875, 3.99462890625, 4.291015625, 4.58740234375, 4.8837890625, 5.18017578125, 5.4765625, 5.77294921875, 6.0693359375, 6.36572265625, 6.662109375, 6.95849609375, 7.2548828125, 7.55126953125, 7.84765625, 8.14404296875, 8.4404296875, 8.73681640625, 9.033203125, 9.32958984375, 9.6259765625, 9.92236328125, 10.21875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 7.0, 3.0, 12.0, 10.0, 11.0, 26.0, 22.0, 26.0, 26.0, 26.0, 52.0, 35.0, 47.0, 49.0, 42.0, 50.0, 45.0, 48.0, 45.0, 58.0, 36.0, 42.0, 30.0, 36.0, 47.0, 37.0, 20.0, 26.0, 17.0, 20.0, 11.0, 7.0, 6.0, 6.0, 11.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.46875, -7.185791015625, -6.90283203125, -6.619873046875, -6.3369140625, -6.053955078125, -5.77099609375, -5.488037109375, -5.205078125, -4.922119140625, -4.63916015625, -4.356201171875, -4.0732421875, -3.790283203125, -3.50732421875, -3.224365234375, -2.94140625, -2.658447265625, -2.37548828125, -2.092529296875, -1.8095703125, -1.526611328125, -1.24365234375, -0.960693359375, -0.677734375, -0.394775390625, -0.11181640625, 0.171142578125, 0.4541015625, 0.737060546875, 1.02001953125, 1.302978515625, 1.5859375, 1.868896484375, 2.15185546875, 2.434814453125, 2.7177734375, 3.000732421875, 3.28369140625, 3.566650390625, 3.849609375, 4.132568359375, 4.41552734375, 4.698486328125, 4.9814453125, 5.264404296875, 5.54736328125, 5.830322265625, 6.11328125, 6.396240234375, 6.67919921875, 6.962158203125, 7.2451171875, 7.528076171875, 7.81103515625, 8.093994140625, 8.376953125, 8.659912109375, 8.94287109375, 9.225830078125, 9.5087890625, 9.791748046875, 10.07470703125, 10.357666015625, 10.640625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 16.0, 19.0, 26.0, 50.0, 62.0, 107.0, 152.0, 209.0, 265.0, 468.0, 687.0, 1007.0, 1466.0, 2450.0, 3775.0, 5633.0, 9077.0, 13986.0, 22380.0, 35907.0, 55373.0, 84791.0, 119623.0, 148684.0, 151731.0, 127512.0, 92697.0, 61784.0, 39696.0, 24961.0, 15834.0, 9940.0, 6450.0, 3956.0, 2591.0, 1773.0, 1159.0, 763.0, 467.0, 339.0, 220.0, 156.0, 97.0, 71.0, 49.0, 28.0, 21.0, 15.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.265625, -6.06427001953125, -5.8629150390625, -5.66156005859375, -5.460205078125, -5.25885009765625, -5.0574951171875, -4.85614013671875, -4.65478515625, -4.45343017578125, -4.2520751953125, -4.05072021484375, -3.849365234375, -3.64801025390625, -3.4466552734375, -3.24530029296875, -3.0439453125, -2.84259033203125, -2.6412353515625, -2.43988037109375, -2.238525390625, -2.03717041015625, -1.8358154296875, -1.63446044921875, -1.43310546875, -1.23175048828125, -1.0303955078125, -0.82904052734375, -0.627685546875, -0.42633056640625, -0.2249755859375, -0.02362060546875, 0.177734375, 0.37908935546875, 0.5804443359375, 0.78179931640625, 0.983154296875, 1.18450927734375, 1.3858642578125, 1.58721923828125, 1.78857421875, 1.98992919921875, 2.1912841796875, 2.39263916015625, 2.593994140625, 2.79534912109375, 2.9967041015625, 3.19805908203125, 3.3994140625, 3.60076904296875, 3.8021240234375, 4.00347900390625, 4.204833984375, 4.40618896484375, 4.6075439453125, 4.80889892578125, 5.01025390625, 5.21160888671875, 5.4129638671875, 5.61431884765625, 5.815673828125, 6.01702880859375, 6.2183837890625, 6.41973876953125, 6.62109375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 4.0, 5.0, 10.0, 4.0, 16.0, 12.0, 15.0, 18.0, 13.0, 25.0, 28.0, 36.0, 28.0, 34.0, 33.0, 42.0, 34.0, 41.0, 26.0, 45.0, 35.0, 46.0, 47.0, 44.0, 38.0, 40.0, 45.0, 28.0, 39.0, 28.0, 27.0, 23.0, 15.0, 9.0, 13.0, 5.0, 13.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-5.703125, -5.5421142578125, -5.381103515625, -5.2200927734375, -5.05908203125, -4.8980712890625, -4.737060546875, -4.5760498046875, -4.4150390625, -4.2540283203125, -4.093017578125, -3.9320068359375, -3.77099609375, -3.6099853515625, -3.448974609375, -3.2879638671875, -3.126953125, -2.9659423828125, -2.804931640625, -2.6439208984375, -2.48291015625, -2.3218994140625, -2.160888671875, -1.9998779296875, -1.8388671875, -1.6778564453125, -1.516845703125, -1.3558349609375, -1.19482421875, -1.0338134765625, -0.872802734375, -0.7117919921875, -0.55078125, -0.3897705078125, -0.228759765625, -0.0677490234375, 0.09326171875, 0.2542724609375, 0.415283203125, 0.5762939453125, 0.7373046875, 0.8983154296875, 1.059326171875, 1.2203369140625, 1.38134765625, 1.5423583984375, 1.703369140625, 1.8643798828125, 2.025390625, 2.1864013671875, 2.347412109375, 2.5084228515625, 2.66943359375, 2.8304443359375, 2.991455078125, 3.1524658203125, 3.3134765625, 3.4744873046875, 3.635498046875, 3.7965087890625, 3.95751953125, 4.1185302734375, 4.279541015625, 4.4405517578125, 4.6015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 8.0, 9.0, 12.0, 24.0, 21.0, 44.0, 32.0, 73.0, 100.0, 126.0, 209.0, 272.0, 392.0, 649.0, 989.0, 1437.0, 2313.0, 3578.0, 5931.0, 10159.0, 18480.0, 37698.0, 84099.0, 198554.0, 313097.0, 201003.0, 85660.0, 37973.0, 19083.0, 10254.0, 5927.0, 3509.0, 2315.0, 1493.0, 968.0, 640.0, 415.0, 299.0, 211.0, 156.0, 108.0, 70.0, 48.0, 28.0, 31.0, 15.0, 14.0, 6.0, 12.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.2890625, -8.9942626953125, -8.699462890625, -8.4046630859375, -8.10986328125, -7.8150634765625, -7.520263671875, -7.2254638671875, -6.9306640625, -6.6358642578125, -6.341064453125, -6.0462646484375, -5.75146484375, -5.4566650390625, -5.161865234375, -4.8670654296875, -4.572265625, -4.2774658203125, -3.982666015625, -3.6878662109375, -3.39306640625, -3.0982666015625, -2.803466796875, -2.5086669921875, -2.2138671875, -1.9190673828125, -1.624267578125, -1.3294677734375, -1.03466796875, -0.7398681640625, -0.445068359375, -0.1502685546875, 0.14453125, 0.4393310546875, 0.734130859375, 1.0289306640625, 1.32373046875, 1.6185302734375, 1.913330078125, 2.2081298828125, 2.5029296875, 2.7977294921875, 3.092529296875, 3.3873291015625, 3.68212890625, 3.9769287109375, 4.271728515625, 4.5665283203125, 4.861328125, 5.1561279296875, 5.450927734375, 5.7457275390625, 6.04052734375, 6.3353271484375, 6.630126953125, 6.9249267578125, 7.2197265625, 7.5145263671875, 7.809326171875, 8.1041259765625, 8.39892578125, 8.6937255859375, 8.988525390625, 9.2833251953125, 9.578125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 8.0, 9.0, 12.0, 20.0, 15.0, 29.0, 34.0, 52.0, 58.0, 84.0, 113.0, 97.0, 96.0, 77.0, 63.0, 54.0, 43.0, 37.0, 21.0, 20.0, 12.0, 12.0, 6.0, 8.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000797271728515625, -0.0007695257663726807, -0.0007417798042297363, -0.000714033842086792, -0.0006862878799438477, -0.0006585419178009033, -0.000630795955657959, -0.0006030499935150146, -0.0005753040313720703, -0.000547558069229126, -0.0005198121070861816, -0.0004920661449432373, -0.00046432018280029297, -0.00043657422065734863, -0.0004088282585144043, -0.00038108229637145996, -0.0003533363342285156, -0.0003255903720855713, -0.00029784440994262695, -0.0002700984477996826, -0.00024235248565673828, -0.00021460652351379395, -0.0001868605613708496, -0.00015911459922790527, -0.00013136863708496094, -0.0001036226749420166, -7.587671279907227e-05, -4.813075065612793e-05, -2.0384788513183594e-05, 7.361173629760742e-06, 3.510713577270508e-05, 6.285309791564941e-05, 9.059906005859375e-05, 0.00011834502220153809, 0.00014609098434448242, 0.00017383694648742676, 0.0002015829086303711, 0.00022932887077331543, 0.00025707483291625977, 0.0002848207950592041, 0.00031256675720214844, 0.0003403127193450928, 0.0003680586814880371, 0.00039580464363098145, 0.0004235506057739258, 0.0004512965679168701, 0.00047904253005981445, 0.0005067884922027588, 0.0005345344543457031, 0.0005622804164886475, 0.0005900263786315918, 0.0006177723407745361, 0.0006455183029174805, 0.0006732642650604248, 0.0007010102272033691, 0.0007287561893463135, 0.0007565021514892578, 0.0007842481136322021, 0.0008119940757751465, 0.0008397400379180908, 0.0008674860000610352, 0.0008952319622039795, 0.0009229779243469238, 0.0009507238864898682, 0.0009784698486328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 7.0, 14.0, 13.0, 23.0, 38.0, 50.0, 66.0, 106.0, 140.0, 252.0, 334.0, 536.0, 882.0, 1299.0, 2337.0, 3796.0, 6771.0, 12865.0, 24882.0, 52954.0, 121479.0, 251597.0, 282534.0, 153842.0, 66757.0, 30372.0, 15127.0, 8064.0, 4461.0, 2575.0, 1628.0, 947.0, 644.0, 389.0, 257.0, 179.0, 101.0, 79.0, 59.0, 34.0, 19.0, 16.0, 7.0, 6.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6015625, -7.3406982421875, -7.079833984375, -6.8189697265625, -6.55810546875, -6.2972412109375, -6.036376953125, -5.7755126953125, -5.5146484375, -5.2537841796875, -4.992919921875, -4.7320556640625, -4.47119140625, -4.2103271484375, -3.949462890625, -3.6885986328125, -3.427734375, -3.1668701171875, -2.906005859375, -2.6451416015625, -2.38427734375, -2.1234130859375, -1.862548828125, -1.6016845703125, -1.3408203125, -1.0799560546875, -0.819091796875, -0.5582275390625, -0.29736328125, -0.0364990234375, 0.224365234375, 0.4852294921875, 0.74609375, 1.0069580078125, 1.267822265625, 1.5286865234375, 1.78955078125, 2.0504150390625, 2.311279296875, 2.5721435546875, 2.8330078125, 3.0938720703125, 3.354736328125, 3.6156005859375, 3.87646484375, 4.1373291015625, 4.398193359375, 4.6590576171875, 4.919921875, 5.1807861328125, 5.441650390625, 5.7025146484375, 5.96337890625, 6.2242431640625, 6.485107421875, 6.7459716796875, 7.0068359375, 7.2677001953125, 7.528564453125, 7.7894287109375, 8.05029296875, 8.3111572265625, 8.572021484375, 8.8328857421875, 9.09375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 10.0, 5.0, 6.0, 14.0, 23.0, 21.0, 32.0, 34.0, 27.0, 41.0, 54.0, 72.0, 74.0, 54.0, 77.0, 78.0, 50.0, 47.0, 41.0, 51.0, 40.0, 26.0, 23.0, 22.0, 11.0, 9.0, 7.0, 5.0, 6.0, 5.0, 8.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.025390625, -2.93170166015625, -2.8380126953125, -2.74432373046875, -2.650634765625, -2.55694580078125, -2.4632568359375, -2.36956787109375, -2.27587890625, -2.18218994140625, -2.0885009765625, -1.99481201171875, -1.901123046875, -1.80743408203125, -1.7137451171875, -1.62005615234375, -1.5263671875, -1.43267822265625, -1.3389892578125, -1.24530029296875, -1.151611328125, -1.05792236328125, -0.9642333984375, -0.87054443359375, -0.77685546875, -0.68316650390625, -0.5894775390625, -0.49578857421875, -0.402099609375, -0.30841064453125, -0.2147216796875, -0.12103271484375, -0.02734375, 0.06634521484375, 0.1600341796875, 0.25372314453125, 0.347412109375, 0.44110107421875, 0.5347900390625, 0.62847900390625, 0.72216796875, 0.81585693359375, 0.9095458984375, 1.00323486328125, 1.096923828125, 1.19061279296875, 1.2843017578125, 1.37799072265625, 1.4716796875, 1.56536865234375, 1.6590576171875, 1.75274658203125, 1.846435546875, 1.94012451171875, 2.0338134765625, 2.12750244140625, 2.22119140625, 2.31488037109375, 2.4085693359375, 2.50225830078125, 2.595947265625, 2.68963623046875, 2.7833251953125, 2.87701416015625, 2.970703125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 11.0, 13.0, 28.0, 34.0, 48.0, 63.0, 97.0, 128.0, 126.0, 128.0, 83.0, 72.0, 50.0, 28.0, 39.0, 22.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.0544490814209, -27.434873580932617, -26.815296173095703, -26.195720672607422, -25.57614517211914, -24.956567764282227, -24.336992263793945, -23.71741485595703, -23.09783935546875, -22.47826385498047, -21.858686447143555, -21.239110946655273, -20.619535446166992, -19.999958038330078, -19.380382537841797, -18.760807037353516, -18.141231536865234, -17.521656036376953, -16.90207862854004, -16.282503128051758, -15.66292667388916, -15.043350219726562, -14.423774719238281, -13.804198265075684, -13.184621810913086, -12.565045356750488, -11.945469856262207, -11.32589340209961, -10.706316947937012, -10.086740493774414, -9.467164993286133, -8.847588539123535, -8.228013038635254, -7.6084370613098145, -6.988860607147217, -6.369284629821777, -5.74970817565918, -5.13013219833374, -4.510556221008301, -3.890979766845703, -3.2714037895202637, -2.651827573776245, -2.0322513580322266, -1.412675380706787, -0.7930991649627686, -0.17352294921875, 0.44605302810668945, 1.065629482269287, 1.6852054595947266, 2.304781675338745, 2.9243578910827637, 3.543933868408203, 4.163510322570801, 4.78308629989624, 5.40266227722168, 6.022238731384277, 6.641814708709717, 7.261390686035156, 7.880967140197754, 8.500543594360352, 9.120119094848633, 9.73969554901123, 10.359272003173828, 10.97884750366211, 11.598423957824707]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 2.0, 3.0, 6.0, 6.0, 14.0, 14.0, 10.0, 12.0, 25.0, 19.0, 32.0, 36.0, 40.0, 38.0, 43.0, 37.0, 53.0, 44.0, 44.0, 42.0, 54.0, 43.0, 33.0, 41.0, 41.0, 39.0, 25.0, 44.0, 33.0, 27.0, 30.0, 12.0, 10.0, 9.0, 9.0, 5.0, 5.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.750573635101318, -7.480526447296143, -7.210478782653809, -6.940431594848633, -6.670384407043457, -6.400337219238281, -6.130289554595947, -5.8602423667907715, -5.5901947021484375, -5.320147514343262, -5.050099849700928, -4.780052661895752, -4.510005474090576, -4.239957809448242, -3.9699106216430664, -3.6998634338378906, -3.429816246032715, -3.15976881980896, -2.889721632003784, -2.6196742057800293, -2.3496270179748535, -2.0795795917510986, -1.8095321655273438, -1.5394848585128784, -1.269437551498413, -0.9993902444839478, -0.7293428778648376, -0.45929551124572754, -0.1892482042312622, 0.08079910278320312, 0.350846529006958, 0.6208938360214233, 0.8909406661987305, 1.1609879732131958, 1.4310352802276611, 1.701082706451416, 1.9711300134658813, 2.2411773204803467, 2.5112247467041016, 2.7812719345092773, 3.0513193607330322, 3.321366786956787, 3.591413974761963, 3.8614614009857178, 4.131508827209473, 4.401556015014648, 4.671603202819824, 4.941650867462158, 5.211698055267334, 5.48174524307251, 5.751792907714844, 6.0218400955200195, 6.291887283325195, 6.561934471130371, 6.831982135772705, 7.102029323577881, 7.372076988220215, 7.642124176025391, 7.912171840667725, 8.182218551635742, 8.452266693115234, 8.72231388092041, 8.992361068725586, 9.262408256530762, 9.532455444335938]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 3.0, 13.0, 12.0, 26.0, 24.0, 36.0, 69.0, 117.0, 159.0, 219.0, 368.0, 542.0, 887.0, 1180.0, 1825.0, 2742.0, 4020.0, 6135.0, 9636.0, 16096.0, 28944.0, 59459.0, 138556.0, 368594.0, 929145.0, 1326848.0, 783901.0, 294085.0, 110893.0, 47914.0, 23810.0, 13381.0, 8167.0, 5259.0, 3480.0, 2252.0, 1597.0, 1033.0, 768.0, 556.0, 435.0, 296.0, 213.0, 168.0, 106.0, 86.0, 51.0, 58.0, 42.0, 36.0, 16.0, 11.0, 7.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.0625, -9.7200927734375, -9.377685546875, -9.0352783203125, -8.69287109375, -8.3504638671875, -8.008056640625, -7.6656494140625, -7.3232421875, -6.9808349609375, -6.638427734375, -6.2960205078125, -5.95361328125, -5.6112060546875, -5.268798828125, -4.9263916015625, -4.583984375, -4.2415771484375, -3.899169921875, -3.5567626953125, -3.21435546875, -2.8719482421875, -2.529541015625, -2.1871337890625, -1.8447265625, -1.5023193359375, -1.159912109375, -0.8175048828125, -0.47509765625, -0.1326904296875, 0.209716796875, 0.5521240234375, 0.89453125, 1.2369384765625, 1.579345703125, 1.9217529296875, 2.26416015625, 2.6065673828125, 2.948974609375, 3.2913818359375, 3.6337890625, 3.9761962890625, 4.318603515625, 4.6610107421875, 5.00341796875, 5.3458251953125, 5.688232421875, 6.0306396484375, 6.373046875, 6.7154541015625, 7.057861328125, 7.4002685546875, 7.74267578125, 8.0850830078125, 8.427490234375, 8.7698974609375, 9.1123046875, 9.4547119140625, 9.797119140625, 10.1395263671875, 10.48193359375, 10.8243408203125, 11.166748046875, 11.5091552734375, 11.8515625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 9.0, 20.0, 13.0, 14.0, 32.0, 21.0, 43.0, 42.0, 42.0, 42.0, 45.0, 38.0, 41.0, 44.0, 40.0, 50.0, 48.0, 48.0, 53.0, 41.0, 41.0, 38.0, 31.0, 22.0, 24.0, 22.0, 20.0, 12.0, 9.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.7952880859375, -4.610107421875, -4.4249267578125, -4.23974609375, -4.0545654296875, -3.869384765625, -3.6842041015625, -3.4990234375, -3.3138427734375, -3.128662109375, -2.9434814453125, -2.75830078125, -2.5731201171875, -2.387939453125, -2.2027587890625, -2.017578125, -1.8323974609375, -1.647216796875, -1.4620361328125, -1.27685546875, -1.0916748046875, -0.906494140625, -0.7213134765625, -0.5361328125, -0.3509521484375, -0.165771484375, 0.0194091796875, 0.20458984375, 0.3897705078125, 0.574951171875, 0.7601318359375, 0.9453125, 1.1304931640625, 1.315673828125, 1.5008544921875, 1.68603515625, 1.8712158203125, 2.056396484375, 2.2415771484375, 2.4267578125, 2.6119384765625, 2.797119140625, 2.9822998046875, 3.16748046875, 3.3526611328125, 3.537841796875, 3.7230224609375, 3.908203125, 4.0933837890625, 4.278564453125, 4.4637451171875, 4.64892578125, 4.8341064453125, 5.019287109375, 5.2044677734375, 5.3896484375, 5.5748291015625, 5.760009765625, 5.9451904296875, 6.13037109375, 6.3155517578125, 6.500732421875, 6.6859130859375, 6.87109375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 4.0, 11.0, 17.0, 31.0, 29.0, 53.0, 61.0, 104.0, 153.0, 252.0, 387.0, 546.0, 881.0, 1320.0, 2122.0, 3431.0, 5768.0, 10085.0, 18962.0, 37517.0, 83033.0, 215724.0, 614281.0, 1326252.0, 1130829.0, 451278.0, 159922.0, 64512.0, 29838.0, 15452.0, 8467.0, 4850.0, 2934.0, 1765.0, 1203.0, 751.0, 496.0, 311.0, 209.0, 142.0, 92.0, 65.0, 68.0, 23.0, 11.0, 13.0, 10.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -12.0318603515625, -11.641845703125, -11.2518310546875, -10.86181640625, -10.4718017578125, -10.081787109375, -9.6917724609375, -9.3017578125, -8.9117431640625, -8.521728515625, -8.1317138671875, -7.74169921875, -7.3516845703125, -6.961669921875, -6.5716552734375, -6.181640625, -5.7916259765625, -5.401611328125, -5.0115966796875, -4.62158203125, -4.2315673828125, -3.841552734375, -3.4515380859375, -3.0615234375, -2.6715087890625, -2.281494140625, -1.8914794921875, -1.50146484375, -1.1114501953125, -0.721435546875, -0.3314208984375, 0.05859375, 0.4486083984375, 0.838623046875, 1.2286376953125, 1.61865234375, 2.0086669921875, 2.398681640625, 2.7886962890625, 3.1787109375, 3.5687255859375, 3.958740234375, 4.3487548828125, 4.73876953125, 5.1287841796875, 5.518798828125, 5.9088134765625, 6.298828125, 6.6888427734375, 7.078857421875, 7.4688720703125, 7.85888671875, 8.2489013671875, 8.638916015625, 9.0289306640625, 9.4189453125, 9.8089599609375, 10.198974609375, 10.5889892578125, 10.97900390625, 11.3690185546875, 11.759033203125, 12.1490478515625, 12.5390625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 5.0, 4.0, 5.0, 9.0, 9.0, 8.0, 20.0, 30.0, 23.0, 38.0, 53.0, 68.0, 71.0, 88.0, 115.0, 142.0, 191.0, 238.0, 267.0, 318.0, 353.0, 340.0, 295.0, 257.0, 258.0, 200.0, 170.0, 123.0, 84.0, 83.0, 60.0, 36.0, 24.0, 20.0, 17.0, 18.0, 10.0, 9.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.4964599609375, -3.387451171875, -3.2784423828125, -3.16943359375, -3.0604248046875, -2.951416015625, -2.8424072265625, -2.7333984375, -2.6243896484375, -2.515380859375, -2.4063720703125, -2.29736328125, -2.1883544921875, -2.079345703125, -1.9703369140625, -1.861328125, -1.7523193359375, -1.643310546875, -1.5343017578125, -1.42529296875, -1.3162841796875, -1.207275390625, -1.0982666015625, -0.9892578125, -0.8802490234375, -0.771240234375, -0.6622314453125, -0.55322265625, -0.4442138671875, -0.335205078125, -0.2261962890625, -0.1171875, -0.0081787109375, 0.100830078125, 0.2098388671875, 0.31884765625, 0.4278564453125, 0.536865234375, 0.6458740234375, 0.7548828125, 0.8638916015625, 0.972900390625, 1.0819091796875, 1.19091796875, 1.2999267578125, 1.408935546875, 1.5179443359375, 1.626953125, 1.7359619140625, 1.844970703125, 1.9539794921875, 2.06298828125, 2.1719970703125, 2.281005859375, 2.3900146484375, 2.4990234375, 2.6080322265625, 2.717041015625, 2.8260498046875, 2.93505859375, 3.0440673828125, 3.153076171875, 3.2620849609375, 3.37109375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 7.0, 10.0, 17.0, 19.0, 23.0, 35.0, 54.0, 65.0, 76.0, 102.0, 117.0, 124.0, 93.0, 72.0, 48.0, 41.0, 31.0, 21.0, 10.0, 12.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-20.712648391723633, -20.2382755279541, -19.76390266418457, -19.28952980041504, -18.815156936645508, -18.340784072875977, -17.866411209106445, -17.39203643798828, -16.91766357421875, -16.44329071044922, -15.968917846679688, -15.494544982910156, -15.020172119140625, -14.545799255371094, -14.071425437927246, -13.597052574157715, -13.1226806640625, -12.648307800292969, -12.173934936523438, -11.699562072753906, -11.225189208984375, -10.750816345214844, -10.276442527770996, -9.802069664001465, -9.327696800231934, -8.853323936462402, -8.378951072692871, -7.904577732086182, -7.43020486831665, -6.955832004547119, -6.48145866394043, -6.007085800170898, -5.532713890075684, -5.058341026306152, -4.583968162536621, -4.109594821929932, -3.6352219581604004, -3.160849094390869, -2.686475992202759, -2.2121028900146484, -1.7377300262451172, -1.2633570432662964, -0.7889840602874756, -0.3146110773086548, 0.15976190567016602, 0.6341347694396973, 1.1085078716278076, 1.582880973815918, 2.057253837585449, 2.5316267013549805, 3.005999803543091, 3.480372905731201, 3.9547457695007324, 4.429118633270264, 4.903491973876953, 5.377864837646484, 5.852237701416016, 6.326610565185547, 6.800983428955078, 7.275356769561768, 7.749729633331299, 8.224102020263672, 8.69847583770752, 9.17284870147705, 9.647221565246582]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 11.0, 8.0, 4.0, 10.0, 17.0, 17.0, 14.0, 31.0, 29.0, 25.0, 39.0, 32.0, 37.0, 39.0, 44.0, 48.0, 37.0, 46.0, 48.0, 50.0, 46.0, 38.0, 39.0, 32.0, 43.0, 36.0, 33.0, 18.0, 20.0, 22.0, 13.0, 12.0, 16.0, 9.0, 8.0, 7.0, 4.0, 1.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.637454509735107, -6.406438827514648, -6.175422668457031, -5.944406986236572, -5.713391304016113, -5.482375144958496, -5.251359462738037, -5.020343780517578, -4.789327621459961, -4.558311939239502, -4.327295780181885, -4.096280097961426, -3.865264415740967, -3.6342484951019287, -3.4032325744628906, -3.1722168922424316, -2.9412012100219727, -2.7101852893829346, -2.4791696071624756, -2.2481536865234375, -2.0171380043029785, -1.7861220836639404, -1.5551061630249023, -1.3240903615951538, -1.0930745601654053, -0.8620587587356567, -0.6310428977012634, -0.4000270366668701, -0.16901123523712158, 0.06200456619262695, 0.29302048683166504, 0.5240362882614136, 0.7550516128540039, 0.9860674142837524, 1.217083215713501, 1.448099136352539, 1.6791149377822876, 1.9101307392120361, 2.141146659851074, 2.372162342071533, 2.6031782627105713, 2.8341941833496094, 3.0652098655700684, 3.2962257862091064, 3.5272417068481445, 3.7582573890686035, 3.9892733097076416, 4.22028923034668, 4.451304912567139, 4.682320594787598, 4.913336753845215, 5.144352436065674, 5.375368118286133, 5.60638427734375, 5.837399959564209, 6.068415641784668, 6.299431800842285, 6.530447483062744, 6.761463642120361, 6.99247932434082, 7.223495006561279, 7.454510688781738, 7.6855268478393555, 7.9165425300598145, 8.147558212280273]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 12.0, 17.0, 22.0, 31.0, 46.0, 84.0, 163.0, 233.0, 327.0, 567.0, 828.0, 1232.0, 2042.0, 3340.0, 5506.0, 9286.0, 16414.0, 29923.0, 54945.0, 100624.0, 167494.0, 216817.0, 183048.0, 113678.0, 63101.0, 33701.0, 18603.0, 10535.0, 5854.0, 3721.0, 2274.0, 1503.0, 909.0, 563.0, 397.0, 240.0, 146.0, 112.0, 61.0, 52.0, 33.0, 23.0, 20.0, 12.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.912109375, -3.799072265625, -3.68603515625, -3.572998046875, -3.4599609375, -3.346923828125, -3.23388671875, -3.120849609375, -3.0078125, -2.894775390625, -2.78173828125, -2.668701171875, -2.5556640625, -2.442626953125, -2.32958984375, -2.216552734375, -2.103515625, -1.990478515625, -1.87744140625, -1.764404296875, -1.6513671875, -1.538330078125, -1.42529296875, -1.312255859375, -1.19921875, -1.086181640625, -0.97314453125, -0.860107421875, -0.7470703125, -0.634033203125, -0.52099609375, -0.407958984375, -0.294921875, -0.181884765625, -0.06884765625, 0.044189453125, 0.1572265625, 0.270263671875, 0.38330078125, 0.496337890625, 0.609375, 0.722412109375, 0.83544921875, 0.948486328125, 1.0615234375, 1.174560546875, 1.28759765625, 1.400634765625, 1.513671875, 1.626708984375, 1.73974609375, 1.852783203125, 1.9658203125, 2.078857421875, 2.19189453125, 2.304931640625, 2.41796875, 2.531005859375, 2.64404296875, 2.757080078125, 2.8701171875, 2.983154296875, 3.09619140625, 3.209228515625, 3.322265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 9.0, 7.0, 5.0, 17.0, 23.0, 30.0, 29.0, 32.0, 33.0, 46.0, 36.0, 42.0, 41.0, 48.0, 48.0, 61.0, 45.0, 61.0, 44.0, 47.0, 41.0, 39.0, 28.0, 33.0, 33.0, 25.0, 18.0, 14.0, 12.0, 7.0, 7.0, 9.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.65899658203125, -7.3922119140625, -7.12542724609375, -6.858642578125, -6.59185791015625, -6.3250732421875, -6.05828857421875, -5.79150390625, -5.52471923828125, -5.2579345703125, -4.99114990234375, -4.724365234375, -4.45758056640625, -4.1907958984375, -3.92401123046875, -3.6572265625, -3.39044189453125, -3.1236572265625, -2.85687255859375, -2.590087890625, -2.32330322265625, -2.0565185546875, -1.78973388671875, -1.52294921875, -1.25616455078125, -0.9893798828125, -0.72259521484375, -0.455810546875, -0.18902587890625, 0.0777587890625, 0.34454345703125, 0.611328125, 0.87811279296875, 1.1448974609375, 1.41168212890625, 1.678466796875, 1.94525146484375, 2.2120361328125, 2.47882080078125, 2.74560546875, 3.01239013671875, 3.2791748046875, 3.54595947265625, 3.812744140625, 4.07952880859375, 4.3463134765625, 4.61309814453125, 4.8798828125, 5.14666748046875, 5.4134521484375, 5.68023681640625, 5.947021484375, 6.21380615234375, 6.4805908203125, 6.74737548828125, 7.01416015625, 7.28094482421875, 7.5477294921875, 7.81451416015625, 8.081298828125, 8.34808349609375, 8.6148681640625, 8.88165283203125, 9.1484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 14.0, 18.0, 24.0, 25.0, 38.0, 59.0, 83.0, 101.0, 150.0, 218.0, 306.0, 452.0, 581.0, 936.0, 1405.0, 2110.0, 3387.0, 5446.0, 9304.0, 16323.0, 29764.0, 56348.0, 104852.0, 179795.0, 228031.0, 177687.0, 103956.0, 55691.0, 29860.0, 16515.0, 9350.0, 5566.0, 3562.0, 2194.0, 1431.0, 937.0, 615.0, 391.0, 278.0, 207.0, 155.0, 98.0, 80.0, 50.0, 38.0, 32.0, 22.0, 18.0, 8.0, 4.0, 5.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0], "bins": [-3.640625, -3.5250244140625, -3.409423828125, -3.2938232421875, -3.17822265625, -3.0626220703125, -2.947021484375, -2.8314208984375, -2.7158203125, -2.6002197265625, -2.484619140625, -2.3690185546875, -2.25341796875, -2.1378173828125, -2.022216796875, -1.9066162109375, -1.791015625, -1.6754150390625, -1.559814453125, -1.4442138671875, -1.32861328125, -1.2130126953125, -1.097412109375, -0.9818115234375, -0.8662109375, -0.7506103515625, -0.635009765625, -0.5194091796875, -0.40380859375, -0.2882080078125, -0.172607421875, -0.0570068359375, 0.05859375, 0.1741943359375, 0.289794921875, 0.4053955078125, 0.52099609375, 0.6365966796875, 0.752197265625, 0.8677978515625, 0.9833984375, 1.0989990234375, 1.214599609375, 1.3302001953125, 1.44580078125, 1.5614013671875, 1.677001953125, 1.7926025390625, 1.908203125, 2.0238037109375, 2.139404296875, 2.2550048828125, 2.37060546875, 2.4862060546875, 2.601806640625, 2.7174072265625, 2.8330078125, 2.9486083984375, 3.064208984375, 3.1798095703125, 3.29541015625, 3.4110107421875, 3.526611328125, 3.6422119140625, 3.7578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 5.0, 10.0, 9.0, 15.0, 17.0, 14.0, 18.0, 30.0, 31.0, 30.0, 39.0, 40.0, 31.0, 38.0, 40.0, 44.0, 50.0, 42.0, 33.0, 37.0, 62.0, 40.0, 44.0, 34.0, 25.0, 27.0, 31.0, 30.0, 28.0, 14.0, 10.0, 17.0, 8.0, 15.0, 4.0, 6.0, 6.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.240814208984375, -4.11053466796875, -3.980255126953125, -3.8499755859375, -3.719696044921875, -3.58941650390625, -3.459136962890625, -3.328857421875, -3.198577880859375, -3.06829833984375, -2.938018798828125, -2.8077392578125, -2.677459716796875, -2.54718017578125, -2.416900634765625, -2.28662109375, -2.156341552734375, -2.02606201171875, -1.895782470703125, -1.7655029296875, -1.635223388671875, -1.50494384765625, -1.374664306640625, -1.244384765625, -1.114105224609375, -0.98382568359375, -0.853546142578125, -0.7232666015625, -0.592987060546875, -0.46270751953125, -0.332427978515625, -0.2021484375, -0.071868896484375, 0.05841064453125, 0.188690185546875, 0.3189697265625, 0.449249267578125, 0.57952880859375, 0.709808349609375, 0.840087890625, 0.970367431640625, 1.10064697265625, 1.230926513671875, 1.3612060546875, 1.491485595703125, 1.62176513671875, 1.752044677734375, 1.88232421875, 2.012603759765625, 2.14288330078125, 2.273162841796875, 2.4034423828125, 2.533721923828125, 2.66400146484375, 2.794281005859375, 2.924560546875, 3.054840087890625, 3.18511962890625, 3.315399169921875, 3.4456787109375, 3.575958251953125, 3.70623779296875, 3.836517333984375, 3.966796875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 11.0, 19.0, 23.0, 29.0, 39.0, 58.0, 74.0, 106.0, 146.0, 223.0, 332.0, 536.0, 747.0, 1253.0, 1998.0, 3246.0, 5677.0, 10285.0, 17707.0, 33165.0, 63175.0, 122049.0, 215060.0, 241949.0, 154615.0, 81061.0, 42210.0, 22490.0, 12363.0, 6887.0, 4122.0, 2517.0, 1577.0, 945.0, 594.0, 420.0, 294.0, 168.0, 121.0, 96.0, 49.0, 38.0, 22.0, 20.0, 7.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5218505859375, -1.471435546875, -1.4210205078125, -1.37060546875, -1.3201904296875, -1.269775390625, -1.2193603515625, -1.1689453125, -1.1185302734375, -1.068115234375, -1.0177001953125, -0.96728515625, -0.9168701171875, -0.866455078125, -0.8160400390625, -0.765625, -0.7152099609375, -0.664794921875, -0.6143798828125, -0.56396484375, -0.5135498046875, -0.463134765625, -0.4127197265625, -0.3623046875, -0.3118896484375, -0.261474609375, -0.2110595703125, -0.16064453125, -0.1102294921875, -0.059814453125, -0.0093994140625, 0.041015625, 0.0914306640625, 0.141845703125, 0.1922607421875, 0.24267578125, 0.2930908203125, 0.343505859375, 0.3939208984375, 0.4443359375, 0.4947509765625, 0.545166015625, 0.5955810546875, 0.64599609375, 0.6964111328125, 0.746826171875, 0.7972412109375, 0.84765625, 0.8980712890625, 0.948486328125, 0.9989013671875, 1.04931640625, 1.0997314453125, 1.150146484375, 1.2005615234375, 1.2509765625, 1.3013916015625, 1.351806640625, 1.4022216796875, 1.45263671875, 1.5030517578125, 1.553466796875, 1.6038818359375, 1.654296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 9.0, 17.0, 17.0, 46.0, 45.0, 61.0, 75.0, 118.0, 126.0, 105.0, 102.0, 73.0, 62.0, 50.0, 19.0, 24.0, 14.0, 11.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010824203491210938, -0.00010389834642410278, -9.955465793609619e-05, -9.52109694480896e-05, -9.086728096008301e-05, -8.652359247207642e-05, -8.217990398406982e-05, -7.783621549606323e-05, -7.349252700805664e-05, -6.914883852005005e-05, -6.480515003204346e-05, -6.0461461544036865e-05, -5.6117773056030273e-05, -5.177408456802368e-05, -4.743039608001709e-05, -4.30867075920105e-05, -3.8743019104003906e-05, -3.4399330615997314e-05, -3.0055642127990723e-05, -2.571195363998413e-05, -2.136826515197754e-05, -1.7024576663970947e-05, -1.2680888175964355e-05, -8.337199687957764e-06, -3.993511199951172e-06, 3.501772880554199e-07, 4.693865776062012e-06, 9.037554264068604e-06, 1.3381242752075195e-05, 1.7724931240081787e-05, 2.206861972808838e-05, 2.641230821609497e-05, 3.075599670410156e-05, 3.5099685192108154e-05, 3.9443373680114746e-05, 4.378706216812134e-05, 4.813075065612793e-05, 5.247443914413452e-05, 5.681812763214111e-05, 6.11618161201477e-05, 6.55055046081543e-05, 6.984919309616089e-05, 7.419288158416748e-05, 7.853657007217407e-05, 8.288025856018066e-05, 8.722394704818726e-05, 9.156763553619385e-05, 9.591132402420044e-05, 0.00010025501251220703, 0.00010459870100021362, 0.00010894238948822021, 0.0001132860779762268, 0.0001176297664642334, 0.00012197345495223999, 0.00012631714344024658, 0.00013066083192825317, 0.00013500452041625977, 0.00013934820890426636, 0.00014369189739227295, 0.00014803558588027954, 0.00015237927436828613, 0.00015672296285629272, 0.00016106665134429932, 0.0001654103398323059, 0.0001697540283203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 15.0, 20.0, 22.0, 25.0, 44.0, 54.0, 102.0, 131.0, 211.0, 310.0, 461.0, 861.0, 1363.0, 2341.0, 4499.0, 9170.0, 20323.0, 48707.0, 118257.0, 245967.0, 294160.0, 171542.0, 72537.0, 30178.0, 13439.0, 6295.0, 3088.0, 1683.0, 1032.0, 586.0, 371.0, 249.0, 144.0, 111.0, 87.0, 50.0, 28.0, 28.0, 13.0, 16.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.37109375, -2.30181884765625, -2.2325439453125, -2.16326904296875, -2.093994140625, -2.02471923828125, -1.9554443359375, -1.88616943359375, -1.81689453125, -1.74761962890625, -1.6783447265625, -1.60906982421875, -1.539794921875, -1.47052001953125, -1.4012451171875, -1.33197021484375, -1.2626953125, -1.19342041015625, -1.1241455078125, -1.05487060546875, -0.985595703125, -0.91632080078125, -0.8470458984375, -0.77777099609375, -0.70849609375, -0.63922119140625, -0.5699462890625, -0.50067138671875, -0.431396484375, -0.36212158203125, -0.2928466796875, -0.22357177734375, -0.154296875, -0.08502197265625, -0.0157470703125, 0.05352783203125, 0.122802734375, 0.19207763671875, 0.2613525390625, 0.33062744140625, 0.39990234375, 0.46917724609375, 0.5384521484375, 0.60772705078125, 0.677001953125, 0.74627685546875, 0.8155517578125, 0.88482666015625, 0.9541015625, 1.02337646484375, 1.0926513671875, 1.16192626953125, 1.231201171875, 1.30047607421875, 1.3697509765625, 1.43902587890625, 1.50830078125, 1.57757568359375, 1.6468505859375, 1.71612548828125, 1.785400390625, 1.85467529296875, 1.9239501953125, 1.99322509765625, 2.0625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 4.0, 11.0, 11.0, 21.0, 18.0, 31.0, 27.0, 35.0, 50.0, 63.0, 86.0, 97.0, 78.0, 100.0, 70.0, 58.0, 48.0, 35.0, 39.0, 25.0, 18.0, 22.0, 11.0, 7.0, 8.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71875, -0.6937713623046875, -0.668792724609375, -0.6438140869140625, -0.61883544921875, -0.5938568115234375, -0.568878173828125, -0.5438995361328125, -0.5189208984375, -0.4939422607421875, -0.468963623046875, -0.4439849853515625, -0.41900634765625, -0.3940277099609375, -0.369049072265625, -0.3440704345703125, -0.319091796875, -0.2941131591796875, -0.269134521484375, -0.2441558837890625, -0.21917724609375, -0.1941986083984375, -0.169219970703125, -0.1442413330078125, -0.1192626953125, -0.0942840576171875, -0.069305419921875, -0.0443267822265625, -0.01934814453125, 0.0056304931640625, 0.030609130859375, 0.0555877685546875, 0.08056640625, 0.1055450439453125, 0.130523681640625, 0.1555023193359375, 0.18048095703125, 0.2054595947265625, 0.230438232421875, 0.2554168701171875, 0.2803955078125, 0.3053741455078125, 0.330352783203125, 0.3553314208984375, 0.38031005859375, 0.4052886962890625, 0.430267333984375, 0.4552459716796875, 0.480224609375, 0.5052032470703125, 0.530181884765625, 0.5551605224609375, 0.58013916015625, 0.6051177978515625, 0.630096435546875, 0.6550750732421875, 0.6800537109375, 0.7050323486328125, 0.730010986328125, 0.7549896240234375, 0.77996826171875, 0.8049468994140625, 0.829925537109375, 0.8549041748046875, 0.8798828125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 16.0, 17.0, 27.0, 22.0, 54.0, 63.0, 66.0, 100.0, 109.0, 117.0, 95.0, 81.0, 53.0, 43.0, 39.0, 22.0, 23.0, 7.0, 9.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 3.0], "bins": [-19.901113510131836, -19.447967529296875, -18.994821548461914, -18.541675567626953, -18.088529586791992, -17.63538360595703, -17.182239532470703, -16.729093551635742, -16.27594757080078, -15.82280158996582, -15.36965560913086, -14.916509628295898, -14.463364601135254, -14.010218620300293, -13.557072639465332, -13.103926658630371, -12.65078067779541, -12.19763469696045, -11.744488716125488, -11.291343688964844, -10.838197708129883, -10.385051727294922, -9.931905746459961, -9.478759765625, -9.025613784790039, -8.572467803955078, -8.119321823120117, -7.6661763191223145, -7.213030815124512, -6.759884834289551, -6.30673885345459, -5.853592872619629, -5.400448799133301, -4.94730281829834, -4.494157314300537, -4.041011333465576, -3.5878655910491943, -3.1347198486328125, -2.6815738677978516, -2.2284281253814697, -1.775282382965088, -1.322136640548706, -0.8689907789230347, -0.4158449172973633, 0.037300825119018555, 0.4904465675354004, 0.9435925483703613, 1.3967382907867432, 1.849884033203125, 2.303029775619507, 2.7561755180358887, 3.2093214988708496, 3.6624672412872314, 4.115612983703613, 4.568758964538574, 5.021904945373535, 5.475050449371338, 5.928196430206299, 6.381341934204102, 6.8344879150390625, 7.287633895874023, 7.740779399871826, 8.193925857543945, 8.64707088470459, 9.10021686553955]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 10.0, 7.0, 6.0, 7.0, 20.0, 19.0, 9.0, 26.0, 36.0, 21.0, 29.0, 47.0, 31.0, 40.0, 36.0, 47.0, 42.0, 51.0, 48.0, 40.0, 45.0, 42.0, 36.0, 41.0, 29.0, 41.0, 32.0, 28.0, 19.0, 23.0, 14.0, 15.0, 13.0, 9.0, 11.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.676895618438721, -6.449435710906982, -6.221975803375244, -5.994515895843506, -5.767055988311768, -5.539596080780029, -5.312136650085449, -5.084676742553711, -4.857216835021973, -4.629756927490234, -4.402297019958496, -4.174837112426758, -3.9473772048950195, -3.7199172973632812, -3.492457628250122, -3.264997720718384, -3.0375375747680664, -2.810077667236328, -2.58261775970459, -2.3551578521728516, -2.1276979446411133, -1.9002381563186646, -1.6727783679962158, -1.4453184604644775, -1.2178585529327393, -0.990398645401001, -0.7629387974739075, -0.535478949546814, -0.3080190420150757, -0.0805591344833374, 0.14690065383911133, 0.3743605613708496, 0.6018204689025879, 0.8292803764343262, 1.0567402839660645, 1.2842000722885132, 1.5116599798202515, 1.7391198873519897, 1.9665796756744385, 2.1940395832061768, 2.421499490737915, 2.6489593982696533, 2.8764193058013916, 3.103878974914551, 3.331338882446289, 3.5587987899780273, 3.7862586975097656, 4.013718605041504, 4.241178512573242, 4.4686384201049805, 4.696098327636719, 4.923558235168457, 5.151018142700195, 5.378478050231934, 5.605937957763672, 5.83339786529541, 6.060857772827148, 6.288317680358887, 6.515777587890625, 6.743237495422363, 6.970697402954102, 7.19815731048584, 7.425617218017578, 7.653077125549316, 7.8805365562438965]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 4.0, 10.0, 13.0, 31.0, 30.0, 48.0, 92.0, 156.0, 256.0, 393.0, 672.0, 1180.0, 2182.0, 4261.0, 9014.0, 20437.0, 50131.0, 131945.0, 287788.0, 299019.0, 144304.0, 55108.0, 21834.0, 9701.0, 4594.0, 2294.0, 1295.0, 667.0, 424.0, 249.0, 148.0, 92.0, 57.0, 38.0, 25.0, 18.0, 18.0, 10.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.7265625, -12.316650390625, -11.90673828125, -11.496826171875, -11.0869140625, -10.677001953125, -10.26708984375, -9.857177734375, -9.447265625, -9.037353515625, -8.62744140625, -8.217529296875, -7.8076171875, -7.397705078125, -6.98779296875, -6.577880859375, -6.16796875, -5.758056640625, -5.34814453125, -4.938232421875, -4.5283203125, -4.118408203125, -3.70849609375, -3.298583984375, -2.888671875, -2.478759765625, -2.06884765625, -1.658935546875, -1.2490234375, -0.839111328125, -0.42919921875, -0.019287109375, 0.390625, 0.800537109375, 1.21044921875, 1.620361328125, 2.0302734375, 2.440185546875, 2.85009765625, 3.260009765625, 3.669921875, 4.079833984375, 4.48974609375, 4.899658203125, 5.3095703125, 5.719482421875, 6.12939453125, 6.539306640625, 6.94921875, 7.359130859375, 7.76904296875, 8.178955078125, 8.5888671875, 8.998779296875, 9.40869140625, 9.818603515625, 10.228515625, 10.638427734375, 11.04833984375, 11.458251953125, 11.8681640625, 12.278076171875, 12.68798828125, 13.097900390625, 13.5078125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 1.0, 6.0, 8.0, 9.0, 14.0, 10.0, 15.0, 13.0, 20.0, 21.0, 28.0, 48.0, 39.0, 40.0, 40.0, 39.0, 45.0, 40.0, 50.0, 50.0, 57.0, 38.0, 43.0, 41.0, 36.0, 35.0, 33.0, 24.0, 21.0, 29.0, 24.0, 16.0, 14.0, 10.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.35546875, -7.11383056640625, -6.8721923828125, -6.63055419921875, -6.388916015625, -6.14727783203125, -5.9056396484375, -5.66400146484375, -5.42236328125, -5.18072509765625, -4.9390869140625, -4.69744873046875, -4.455810546875, -4.21417236328125, -3.9725341796875, -3.73089599609375, -3.4892578125, -3.24761962890625, -3.0059814453125, -2.76434326171875, -2.522705078125, -2.28106689453125, -2.0394287109375, -1.79779052734375, -1.55615234375, -1.31451416015625, -1.0728759765625, -0.83123779296875, -0.589599609375, -0.34796142578125, -0.1063232421875, 0.13531494140625, 0.376953125, 0.61859130859375, 0.8602294921875, 1.10186767578125, 1.343505859375, 1.58514404296875, 1.8267822265625, 2.06842041015625, 2.31005859375, 2.55169677734375, 2.7933349609375, 3.03497314453125, 3.276611328125, 3.51824951171875, 3.7598876953125, 4.00152587890625, 4.2431640625, 4.48480224609375, 4.7264404296875, 4.96807861328125, 5.209716796875, 5.45135498046875, 5.6929931640625, 5.93463134765625, 6.17626953125, 6.41790771484375, 6.6595458984375, 6.90118408203125, 7.142822265625, 7.38446044921875, 7.6260986328125, 7.86773681640625, 8.109375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 11.0, 15.0, 14.0, 37.0, 60.0, 80.0, 108.0, 151.0, 217.0, 360.0, 512.0, 752.0, 1306.0, 1896.0, 3006.0, 4771.0, 7884.0, 13098.0, 21438.0, 36839.0, 62660.0, 104407.0, 158559.0, 189645.0, 164865.0, 111193.0, 66692.0, 38705.0, 22845.0, 13740.0, 8414.0, 5192.0, 3311.0, 2002.0, 1272.0, 837.0, 553.0, 365.0, 253.0, 151.0, 101.0, 68.0, 51.0, 32.0, 20.0, 18.0, 12.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-7.00390625, -6.77471923828125, -6.5455322265625, -6.31634521484375, -6.087158203125, -5.85797119140625, -5.6287841796875, -5.39959716796875, -5.17041015625, -4.94122314453125, -4.7120361328125, -4.48284912109375, -4.253662109375, -4.02447509765625, -3.7952880859375, -3.56610107421875, -3.3369140625, -3.10772705078125, -2.8785400390625, -2.64935302734375, -2.420166015625, -2.19097900390625, -1.9617919921875, -1.73260498046875, -1.50341796875, -1.27423095703125, -1.0450439453125, -0.81585693359375, -0.586669921875, -0.35748291015625, -0.1282958984375, 0.10089111328125, 0.330078125, 0.55926513671875, 0.7884521484375, 1.01763916015625, 1.246826171875, 1.47601318359375, 1.7052001953125, 1.93438720703125, 2.16357421875, 2.39276123046875, 2.6219482421875, 2.85113525390625, 3.080322265625, 3.30950927734375, 3.5386962890625, 3.76788330078125, 3.9970703125, 4.22625732421875, 4.4554443359375, 4.68463134765625, 4.913818359375, 5.14300537109375, 5.3721923828125, 5.60137939453125, 5.83056640625, 6.05975341796875, 6.2889404296875, 6.51812744140625, 6.747314453125, 6.97650146484375, 7.2056884765625, 7.43487548828125, 7.6640625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 12.0, 13.0, 13.0, 12.0, 14.0, 27.0, 40.0, 44.0, 41.0, 57.0, 39.0, 55.0, 52.0, 50.0, 54.0, 63.0, 48.0, 47.0, 65.0, 47.0, 38.0, 40.0, 26.0, 30.0, 13.0, 22.0, 17.0, 8.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3497314453125, -6.156494140625, -5.9632568359375, -5.77001953125, -5.5767822265625, -5.383544921875, -5.1903076171875, -4.9970703125, -4.8038330078125, -4.610595703125, -4.4173583984375, -4.22412109375, -4.0308837890625, -3.837646484375, -3.6444091796875, -3.451171875, -3.2579345703125, -3.064697265625, -2.8714599609375, -2.67822265625, -2.4849853515625, -2.291748046875, -2.0985107421875, -1.9052734375, -1.7120361328125, -1.518798828125, -1.3255615234375, -1.13232421875, -0.9390869140625, -0.745849609375, -0.5526123046875, -0.359375, -0.1661376953125, 0.027099609375, 0.2203369140625, 0.41357421875, 0.6068115234375, 0.800048828125, 0.9932861328125, 1.1865234375, 1.3797607421875, 1.572998046875, 1.7662353515625, 1.95947265625, 2.1527099609375, 2.345947265625, 2.5391845703125, 2.732421875, 2.9256591796875, 3.118896484375, 3.3121337890625, 3.50537109375, 3.6986083984375, 3.891845703125, 4.0850830078125, 4.2783203125, 4.4715576171875, 4.664794921875, 4.8580322265625, 5.05126953125, 5.2445068359375, 5.437744140625, 5.6309814453125, 5.82421875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 11.0, 16.0, 17.0, 22.0, 39.0, 38.0, 82.0, 92.0, 159.0, 301.0, 447.0, 711.0, 1063.0, 1789.0, 2896.0, 4912.0, 8747.0, 15956.0, 31083.0, 63219.0, 130513.0, 236922.0, 252239.0, 148285.0, 72247.0, 35144.0, 17922.0, 9874.0, 5464.0, 3164.0, 1929.0, 1188.0, 738.0, 486.0, 306.0, 173.0, 133.0, 80.0, 60.0, 26.0, 25.0, 20.0, 9.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6796875, -5.49700927734375, -5.3143310546875, -5.13165283203125, -4.948974609375, -4.76629638671875, -4.5836181640625, -4.40093994140625, -4.21826171875, -4.03558349609375, -3.8529052734375, -3.67022705078125, -3.487548828125, -3.30487060546875, -3.1221923828125, -2.93951416015625, -2.7568359375, -2.57415771484375, -2.3914794921875, -2.20880126953125, -2.026123046875, -1.84344482421875, -1.6607666015625, -1.47808837890625, -1.29541015625, -1.11273193359375, -0.9300537109375, -0.74737548828125, -0.564697265625, -0.38201904296875, -0.1993408203125, -0.01666259765625, 0.166015625, 0.34869384765625, 0.5313720703125, 0.71405029296875, 0.896728515625, 1.07940673828125, 1.2620849609375, 1.44476318359375, 1.62744140625, 1.81011962890625, 1.9927978515625, 2.17547607421875, 2.358154296875, 2.54083251953125, 2.7235107421875, 2.90618896484375, 3.0888671875, 3.27154541015625, 3.4542236328125, 3.63690185546875, 3.819580078125, 4.00225830078125, 4.1849365234375, 4.36761474609375, 4.55029296875, 4.73297119140625, 4.9156494140625, 5.09832763671875, 5.281005859375, 5.46368408203125, 5.6463623046875, 5.82904052734375, 6.01171875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 7.0, 9.0, 9.0, 28.0, 23.0, 31.0, 30.0, 41.0, 49.0, 63.0, 81.0, 85.0, 75.0, 77.0, 70.0, 54.0, 63.0, 44.0, 32.0, 20.0, 25.0, 12.0, 10.0, 10.0, 10.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003352165222167969, -0.0003203153610229492, -0.00030541419982910156, -0.0002905130386352539, -0.00027561187744140625, -0.0002607107162475586, -0.00024580955505371094, -0.00023090839385986328, -0.00021600723266601562, -0.00020110607147216797, -0.0001862049102783203, -0.00017130374908447266, -0.000156402587890625, -0.00014150142669677734, -0.0001266002655029297, -0.00011169910430908203, -9.679794311523438e-05, -8.189678192138672e-05, -6.699562072753906e-05, -5.2094459533691406e-05, -3.719329833984375e-05, -2.2292137145996094e-05, -7.3909759521484375e-06, 7.510185241699219e-06, 2.2411346435546875e-05, 3.731250762939453e-05, 5.221366882324219e-05, 6.711483001708984e-05, 8.20159912109375e-05, 9.691715240478516e-05, 0.00011181831359863281, 0.00012671947479248047, 0.00014162063598632812, 0.00015652179718017578, 0.00017142295837402344, 0.0001863241195678711, 0.00020122528076171875, 0.0002161264419555664, 0.00023102760314941406, 0.0002459287643432617, 0.0002608299255371094, 0.00027573108673095703, 0.0002906322479248047, 0.00030553340911865234, 0.0003204345703125, 0.00033533573150634766, 0.0003502368927001953, 0.00036513805389404297, 0.0003800392150878906, 0.0003949403762817383, 0.00040984153747558594, 0.0004247426986694336, 0.00043964385986328125, 0.0004545450210571289, 0.00046944618225097656, 0.0004843473434448242, 0.0004992485046386719, 0.0005141496658325195, 0.0005290508270263672, 0.0005439519882202148, 0.0005588531494140625, 0.0005737543106079102, 0.0005886554718017578, 0.0006035566329956055, 0.0006184577941894531]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 11.0, 10.0, 15.0, 33.0, 43.0, 56.0, 79.0, 103.0, 139.0, 245.0, 379.0, 561.0, 953.0, 1560.0, 2764.0, 5090.0, 9860.0, 20535.0, 44515.0, 99783.0, 208832.0, 285699.0, 195431.0, 91809.0, 40651.0, 18820.0, 9254.0, 4703.0, 2588.0, 1521.0, 888.0, 549.0, 300.0, 233.0, 169.0, 103.0, 72.0, 49.0, 43.0, 26.0, 15.0, 13.0, 14.0, 5.0, 9.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0], "bins": [-6.0546875, -5.8736572265625, -5.692626953125, -5.5115966796875, -5.33056640625, -5.1495361328125, -4.968505859375, -4.7874755859375, -4.6064453125, -4.4254150390625, -4.244384765625, -4.0633544921875, -3.88232421875, -3.7012939453125, -3.520263671875, -3.3392333984375, -3.158203125, -2.9771728515625, -2.796142578125, -2.6151123046875, -2.43408203125, -2.2530517578125, -2.072021484375, -1.8909912109375, -1.7099609375, -1.5289306640625, -1.347900390625, -1.1668701171875, -0.98583984375, -0.8048095703125, -0.623779296875, -0.4427490234375, -0.26171875, -0.0806884765625, 0.100341796875, 0.2813720703125, 0.46240234375, 0.6434326171875, 0.824462890625, 1.0054931640625, 1.1865234375, 1.3675537109375, 1.548583984375, 1.7296142578125, 1.91064453125, 2.0916748046875, 2.272705078125, 2.4537353515625, 2.634765625, 2.8157958984375, 2.996826171875, 3.1778564453125, 3.35888671875, 3.5399169921875, 3.720947265625, 3.9019775390625, 4.0830078125, 4.2640380859375, 4.445068359375, 4.6260986328125, 4.80712890625, 4.9881591796875, 5.169189453125, 5.3502197265625, 5.53125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 9.0, 16.0, 16.0, 35.0, 43.0, 62.0, 63.0, 88.0, 98.0, 97.0, 106.0, 71.0, 64.0, 47.0, 43.0, 24.0, 22.0, 12.0, 12.0, 15.0, 6.0, 6.0, 6.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.224609375, -2.149261474609375, -2.07391357421875, -1.998565673828125, -1.9232177734375, -1.847869873046875, -1.77252197265625, -1.697174072265625, -1.621826171875, -1.546478271484375, -1.47113037109375, -1.395782470703125, -1.3204345703125, -1.245086669921875, -1.16973876953125, -1.094390869140625, -1.01904296875, -0.943695068359375, -0.86834716796875, -0.792999267578125, -0.7176513671875, -0.642303466796875, -0.56695556640625, -0.491607666015625, -0.416259765625, -0.340911865234375, -0.26556396484375, -0.190216064453125, -0.1148681640625, -0.039520263671875, 0.03582763671875, 0.111175537109375, 0.1865234375, 0.261871337890625, 0.33721923828125, 0.412567138671875, 0.4879150390625, 0.563262939453125, 0.63861083984375, 0.713958740234375, 0.789306640625, 0.864654541015625, 0.94000244140625, 1.015350341796875, 1.0906982421875, 1.166046142578125, 1.24139404296875, 1.316741943359375, 1.39208984375, 1.467437744140625, 1.54278564453125, 1.618133544921875, 1.6934814453125, 1.768829345703125, 1.84417724609375, 1.919525146484375, 1.994873046875, 2.070220947265625, 2.14556884765625, 2.220916748046875, 2.2962646484375, 2.371612548828125, 2.44696044921875, 2.522308349609375, 2.59765625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 5.0, 10.0, 17.0, 19.0, 33.0, 66.0, 72.0, 83.0, 109.0, 126.0, 116.0, 76.0, 74.0, 55.0, 37.0, 27.0, 21.0, 18.0, 9.0, 3.0, 8.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0], "bins": [-22.312911987304688, -21.832881927490234, -21.352853775024414, -20.87282371520996, -20.392793655395508, -19.912765502929688, -19.432735443115234, -18.95270538330078, -18.47267723083496, -17.992647171020508, -17.512619018554688, -17.032588958740234, -16.55255889892578, -16.07253074645996, -15.592500686645508, -15.112471580505371, -14.632441520690918, -14.152412414550781, -13.672382354736328, -13.192353248596191, -12.712324142456055, -12.232294082641602, -11.752264976501465, -11.272235870361328, -10.792205810546875, -10.312176704406738, -9.832146644592285, -9.352117538452148, -8.872088432312012, -8.392059326171875, -7.912029266357422, -7.432000160217285, -6.951970100402832, -6.471940517425537, -5.9919114112854, -5.5118818283081055, -5.031852722167969, -4.551823139190674, -4.071793556213379, -3.591764211654663, -3.1117348670959473, -2.6317055225372314, -2.1516761779785156, -1.6716465950012207, -1.1916172504425049, -0.7115879058837891, -0.23155832290649414, 0.24847102165222168, 0.7285003662109375, 1.2085297107696533, 1.6885591745376587, 2.168588638305664, 2.64861798286438, 3.1286473274230957, 3.6086769104003906, 4.088706016540527, 4.568735599517822, 5.048765182495117, 5.528794288635254, 6.008823871612549, 6.488853454589844, 6.9688825607299805, 7.448912143707275, 7.92894172668457, 8.408970832824707]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 8.0, 3.0, 6.0, 11.0, 10.0, 12.0, 11.0, 12.0, 11.0, 22.0, 19.0, 14.0, 34.0, 40.0, 34.0, 26.0, 47.0, 29.0, 29.0, 51.0, 43.0, 45.0, 42.0, 39.0, 42.0, 37.0, 41.0, 40.0, 41.0, 34.0, 21.0, 22.0, 20.0, 16.0, 20.0, 13.0, 10.0, 9.0, 8.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-6.974536895751953, -6.759966850280762, -6.545396327972412, -6.3308258056640625, -6.116255760192871, -5.90168571472168, -5.68711519241333, -5.4725446701049805, -5.257974624633789, -5.043404579162598, -4.828834056854248, -4.614263534545898, -4.399693489074707, -4.185123443603516, -3.970552921295166, -3.7559826374053955, -3.541412353515625, -3.3268420696258545, -3.112271785736084, -2.8977015018463135, -2.683131217956543, -2.4685609340667725, -2.253990650177002, -2.0394203662872314, -1.824850082397461, -1.6102797985076904, -1.39570951461792, -1.1811392307281494, -0.9665689468383789, -0.7519986629486084, -0.5374283790588379, -0.3228580951690674, -0.10828733444213867, 0.10628294944763184, 0.32085323333740234, 0.5354235172271729, 0.7499938011169434, 0.9645640850067139, 1.1791343688964844, 1.3937046527862549, 1.6082749366760254, 1.822845220565796, 2.0374155044555664, 2.251985788345337, 2.4665560722351074, 2.681126356124878, 2.8956966400146484, 3.110266923904419, 3.3248372077941895, 3.53940749168396, 3.7539777755737305, 3.968548059463501, 4.1831183433532715, 4.397688865661621, 4.6122589111328125, 4.826828956604004, 5.0413994789123535, 5.255970001220703, 5.4705400466918945, 5.685110092163086, 5.8996806144714355, 6.114251136779785, 6.328821182250977, 6.543391227722168, 6.757961750030518]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 13.0, 7.0, 22.0, 30.0, 43.0, 66.0, 75.0, 128.0, 201.0, 245.0, 401.0, 553.0, 878.0, 1197.0, 1810.0, 2629.0, 4247.0, 6712.0, 11056.0, 20109.0, 40163.0, 96840.0, 280401.0, 849752.0, 1492744.0, 895756.0, 296332.0, 100727.0, 41135.0, 19846.0, 10991.0, 6558.0, 4083.0, 2785.0, 1741.0, 1220.0, 858.0, 547.0, 396.0, 301.0, 224.0, 138.0, 103.0, 76.0, 39.0, 34.0, 29.0, 12.0, 21.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0], "bins": [-11.7421875, -11.3919677734375, -11.041748046875, -10.6915283203125, -10.34130859375, -9.9910888671875, -9.640869140625, -9.2906494140625, -8.9404296875, -8.5902099609375, -8.239990234375, -7.8897705078125, -7.53955078125, -7.1893310546875, -6.839111328125, -6.4888916015625, -6.138671875, -5.7884521484375, -5.438232421875, -5.0880126953125, -4.73779296875, -4.3875732421875, -4.037353515625, -3.6871337890625, -3.3369140625, -2.9866943359375, -2.636474609375, -2.2862548828125, -1.93603515625, -1.5858154296875, -1.235595703125, -0.8853759765625, -0.53515625, -0.1849365234375, 0.165283203125, 0.5155029296875, 0.86572265625, 1.2159423828125, 1.566162109375, 1.9163818359375, 2.2666015625, 2.6168212890625, 2.967041015625, 3.3172607421875, 3.66748046875, 4.0177001953125, 4.367919921875, 4.7181396484375, 5.068359375, 5.4185791015625, 5.768798828125, 6.1190185546875, 6.46923828125, 6.8194580078125, 7.169677734375, 7.5198974609375, 7.8701171875, 8.2203369140625, 8.570556640625, 8.9207763671875, 9.27099609375, 9.6212158203125, 9.971435546875, 10.3216552734375, 10.671875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 6.0, 8.0, 3.0, 8.0, 10.0, 17.0, 14.0, 19.0, 22.0, 23.0, 24.0, 48.0, 31.0, 35.0, 41.0, 38.0, 47.0, 36.0, 53.0, 38.0, 43.0, 35.0, 46.0, 42.0, 42.0, 36.0, 29.0, 35.0, 29.0, 29.0, 18.0, 19.0, 14.0, 12.0, 12.0, 4.0, 6.0, 2.0, 9.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-4.78515625, -4.6336669921875, -4.482177734375, -4.3306884765625, -4.17919921875, -4.0277099609375, -3.876220703125, -3.7247314453125, -3.5732421875, -3.4217529296875, -3.270263671875, -3.1187744140625, -2.96728515625, -2.8157958984375, -2.664306640625, -2.5128173828125, -2.361328125, -2.2098388671875, -2.058349609375, -1.9068603515625, -1.75537109375, -1.6038818359375, -1.452392578125, -1.3009033203125, -1.1494140625, -0.9979248046875, -0.846435546875, -0.6949462890625, -0.54345703125, -0.3919677734375, -0.240478515625, -0.0889892578125, 0.0625, 0.2139892578125, 0.365478515625, 0.5169677734375, 0.66845703125, 0.8199462890625, 0.971435546875, 1.1229248046875, 1.2744140625, 1.4259033203125, 1.577392578125, 1.7288818359375, 1.88037109375, 2.0318603515625, 2.183349609375, 2.3348388671875, 2.486328125, 2.6378173828125, 2.789306640625, 2.9407958984375, 3.09228515625, 3.2437744140625, 3.395263671875, 3.5467529296875, 3.6982421875, 3.8497314453125, 4.001220703125, 4.1527099609375, 4.30419921875, 4.4556884765625, 4.607177734375, 4.7586669921875, 4.91015625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 6.0, 16.0, 14.0, 20.0, 27.0, 55.0, 76.0, 93.0, 148.0, 238.0, 349.0, 584.0, 875.0, 1403.0, 2361.0, 3903.0, 6657.0, 11571.0, 21220.0, 42003.0, 93784.0, 245867.0, 697837.0, 1389951.0, 1027406.0, 385821.0, 139917.0, 57928.0, 28268.0, 14889.0, 8483.0, 4723.0, 2933.0, 1814.0, 1118.0, 672.0, 435.0, 293.0, 186.0, 128.0, 73.0, 46.0, 36.0, 27.0, 14.0, 11.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.93310546875, -10.5771484375, -10.22119140625, -9.865234375, -9.50927734375, -9.1533203125, -8.79736328125, -8.44140625, -8.08544921875, -7.7294921875, -7.37353515625, -7.017578125, -6.66162109375, -6.3056640625, -5.94970703125, -5.59375, -5.23779296875, -4.8818359375, -4.52587890625, -4.169921875, -3.81396484375, -3.4580078125, -3.10205078125, -2.74609375, -2.39013671875, -2.0341796875, -1.67822265625, -1.322265625, -0.96630859375, -0.6103515625, -0.25439453125, 0.1015625, 0.45751953125, 0.8134765625, 1.16943359375, 1.525390625, 1.88134765625, 2.2373046875, 2.59326171875, 2.94921875, 3.30517578125, 3.6611328125, 4.01708984375, 4.373046875, 4.72900390625, 5.0849609375, 5.44091796875, 5.796875, 6.15283203125, 6.5087890625, 6.86474609375, 7.220703125, 7.57666015625, 7.9326171875, 8.28857421875, 8.64453125, 9.00048828125, 9.3564453125, 9.71240234375, 10.068359375, 10.42431640625, 10.7802734375, 11.13623046875, 11.4921875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 7.0, 11.0, 17.0, 17.0, 19.0, 17.0, 26.0, 37.0, 51.0, 48.0, 73.0, 121.0, 138.0, 175.0, 218.0, 249.0, 324.0, 318.0, 351.0, 335.0, 289.0, 287.0, 215.0, 178.0, 126.0, 93.0, 87.0, 60.0, 34.0, 35.0, 22.0, 21.0, 25.0, 11.0, 12.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-3.646484375, -3.546051025390625, -3.44561767578125, -3.345184326171875, -3.2447509765625, -3.144317626953125, -3.04388427734375, -2.943450927734375, -2.843017578125, -2.742584228515625, -2.64215087890625, -2.541717529296875, -2.4412841796875, -2.340850830078125, -2.24041748046875, -2.139984130859375, -2.03955078125, -1.939117431640625, -1.83868408203125, -1.738250732421875, -1.6378173828125, -1.537384033203125, -1.43695068359375, -1.336517333984375, -1.236083984375, -1.135650634765625, -1.03521728515625, -0.934783935546875, -0.8343505859375, -0.733917236328125, -0.63348388671875, -0.533050537109375, -0.4326171875, -0.332183837890625, -0.23175048828125, -0.131317138671875, -0.0308837890625, 0.069549560546875, 0.16998291015625, 0.270416259765625, 0.370849609375, 0.471282958984375, 0.57171630859375, 0.672149658203125, 0.7725830078125, 0.873016357421875, 0.97344970703125, 1.073883056640625, 1.17431640625, 1.274749755859375, 1.37518310546875, 1.475616455078125, 1.5760498046875, 1.676483154296875, 1.77691650390625, 1.877349853515625, 1.977783203125, 2.078216552734375, 2.17864990234375, 2.279083251953125, 2.3795166015625, 2.479949951171875, 2.58038330078125, 2.680816650390625, 2.78125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 12.0, 10.0, 11.0, 8.0, 25.0, 26.0, 48.0, 62.0, 83.0, 103.0, 104.0, 107.0, 113.0, 84.0, 62.0, 41.0, 32.0, 14.0, 11.0, 9.0, 8.0, 7.0, 6.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.898653030395508, -16.463951110839844, -16.029247283935547, -15.594545364379883, -15.159843444824219, -14.725141525268555, -14.290438652038574, -13.855735778808594, -13.42103385925293, -12.986331939697266, -12.551629066467285, -12.116926193237305, -11.68222427368164, -11.247522354125977, -10.812819480895996, -10.378116607666016, -9.943414688110352, -9.508712768554688, -9.074009895324707, -8.639307022094727, -8.204605102539062, -7.76990270614624, -7.335200309753418, -6.900497913360596, -6.465795516967773, -6.031093120574951, -5.596390724182129, -5.161688327789307, -4.726985931396484, -4.292283535003662, -3.85758113861084, -3.4228787422180176, -2.9881763458251953, -2.553473949432373, -2.118771553039551, -1.6840691566467285, -1.2493667602539062, -0.814664363861084, -0.3799619674682617, 0.05474042892456055, 0.4894428253173828, 0.9241452217102051, 1.3588476181030273, 1.7935500144958496, 2.228252410888672, 2.662954807281494, 3.0976572036743164, 3.5323596000671387, 3.967061996459961, 4.401764392852783, 4.8364667892456055, 5.271169185638428, 5.70587158203125, 6.140573978424072, 6.5752763748168945, 7.009978771209717, 7.444681167602539, 7.879383563995361, 8.314085960388184, 8.748788833618164, 9.183490753173828, 9.618192672729492, 10.052895545959473, 10.487598419189453, 10.922300338745117]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 6.0, 10.0, 8.0, 16.0, 12.0, 12.0, 24.0, 35.0, 27.0, 25.0, 38.0, 23.0, 30.0, 39.0, 49.0, 46.0, 46.0, 42.0, 45.0, 48.0, 46.0, 35.0, 45.0, 33.0, 34.0, 30.0, 26.0, 23.0, 24.0, 20.0, 17.0, 10.0, 14.0, 13.0, 5.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.5228424072265625, -6.318317413330078, -6.113792896270752, -5.909267902374268, -5.704742908477783, -5.500218391418457, -5.295693397521973, -5.091168403625488, -4.886643409729004, -4.6821184158325195, -4.477593898773193, -4.273068904876709, -4.068543910980225, -3.8640191555023193, -3.659494400024414, -3.4549694061279297, -3.2504448890686035, -3.0459201335906982, -2.841395139694214, -2.6368703842163086, -2.432345390319824, -2.227820634841919, -2.0232958793640137, -1.8187710046768188, -1.614246129989624, -1.4097212553024292, -1.2051963806152344, -1.000671625137329, -0.7961467504501343, -0.5916218757629395, -0.3870971202850342, -0.18257224559783936, 0.02195262908935547, 0.2264774739742279, 0.43100231885910034, 0.6355271339416504, 0.8400520086288452, 1.04457688331604, 1.2491016387939453, 1.4536265134811401, 1.658151388168335, 1.8626762628555298, 2.0672011375427246, 2.27172589302063, 2.476250648498535, 2.6807756423950195, 2.885300397872925, 3.08982515335083, 3.2943501472473145, 3.4988749027252197, 3.703399896621704, 3.9079246520996094, 4.112449645996094, 4.316974639892578, 4.521499156951904, 4.726024150848389, 4.930548667907715, 5.135073661804199, 5.339598178863525, 5.54412317276001, 5.748648166656494, 5.95317268371582, 6.157697677612305, 6.362222671508789, 6.566747665405273]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 8.0, 16.0, 6.0, 19.0, 34.0, 47.0, 66.0, 107.0, 158.0, 194.0, 319.0, 517.0, 715.0, 1138.0, 1837.0, 2895.0, 4740.0, 7895.0, 13871.0, 25092.0, 46797.0, 88202.0, 157128.0, 220225.0, 200159.0, 125540.0, 67672.0, 35798.0, 19567.0, 10995.0, 6361.0, 3771.0, 2322.0, 1498.0, 947.0, 605.0, 428.0, 275.0, 189.0, 122.0, 86.0, 82.0, 40.0, 23.0, 21.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-3.76171875, -3.653594970703125, -3.54547119140625, -3.437347412109375, -3.3292236328125, -3.221099853515625, -3.11297607421875, -3.004852294921875, -2.896728515625, -2.788604736328125, -2.68048095703125, -2.572357177734375, -2.4642333984375, -2.356109619140625, -2.24798583984375, -2.139862060546875, -2.03173828125, -1.923614501953125, -1.81549072265625, -1.707366943359375, -1.5992431640625, -1.491119384765625, -1.38299560546875, -1.274871826171875, -1.166748046875, -1.058624267578125, -0.95050048828125, -0.842376708984375, -0.7342529296875, -0.626129150390625, -0.51800537109375, -0.409881591796875, -0.3017578125, -0.193634033203125, -0.08551025390625, 0.022613525390625, 0.1307373046875, 0.238861083984375, 0.34698486328125, 0.455108642578125, 0.563232421875, 0.671356201171875, 0.77947998046875, 0.887603759765625, 0.9957275390625, 1.103851318359375, 1.21197509765625, 1.320098876953125, 1.42822265625, 1.536346435546875, 1.64447021484375, 1.752593994140625, 1.8607177734375, 1.968841552734375, 2.07696533203125, 2.185089111328125, 2.293212890625, 2.401336669921875, 2.50946044921875, 2.617584228515625, 2.7257080078125, 2.833831787109375, 2.94195556640625, 3.050079345703125, 3.158203125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 5.0, 5.0, 7.0, 9.0, 8.0, 13.0, 17.0, 32.0, 26.0, 14.0, 30.0, 28.0, 35.0, 42.0, 37.0, 33.0, 56.0, 51.0, 61.0, 43.0, 48.0, 42.0, 46.0, 35.0, 32.0, 39.0, 27.0, 29.0, 19.0, 23.0, 15.0, 21.0, 9.0, 16.0, 3.0, 8.0, 6.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.0625, -6.8323974609375, -6.602294921875, -6.3721923828125, -6.14208984375, -5.9119873046875, -5.681884765625, -5.4517822265625, -5.2216796875, -4.9915771484375, -4.761474609375, -4.5313720703125, -4.30126953125, -4.0711669921875, -3.841064453125, -3.6109619140625, -3.380859375, -3.1507568359375, -2.920654296875, -2.6905517578125, -2.46044921875, -2.2303466796875, -2.000244140625, -1.7701416015625, -1.5400390625, -1.3099365234375, -1.079833984375, -0.8497314453125, -0.61962890625, -0.3895263671875, -0.159423828125, 0.0706787109375, 0.30078125, 0.5308837890625, 0.760986328125, 0.9910888671875, 1.22119140625, 1.4512939453125, 1.681396484375, 1.9114990234375, 2.1416015625, 2.3717041015625, 2.601806640625, 2.8319091796875, 3.06201171875, 3.2921142578125, 3.522216796875, 3.7523193359375, 3.982421875, 4.2125244140625, 4.442626953125, 4.6727294921875, 4.90283203125, 5.1329345703125, 5.363037109375, 5.5931396484375, 5.8232421875, 6.0533447265625, 6.283447265625, 6.5135498046875, 6.74365234375, 6.9737548828125, 7.203857421875, 7.4339599609375, 7.6640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 11.0, 14.0, 20.0, 20.0, 31.0, 45.0, 62.0, 80.0, 114.0, 157.0, 244.0, 293.0, 476.0, 717.0, 1120.0, 1643.0, 2708.0, 4233.0, 6996.0, 12577.0, 22852.0, 41910.0, 79970.0, 146193.0, 224220.0, 213420.0, 131520.0, 70487.0, 37572.0, 20098.0, 11202.0, 6510.0, 4031.0, 2336.0, 1486.0, 966.0, 675.0, 473.0, 313.0, 237.0, 152.0, 106.0, 80.0, 45.0, 44.0, 30.0, 28.0, 13.0, 9.0, 8.0, 1.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.339508056640625, -3.22784423828125, -3.116180419921875, -3.0045166015625, -2.892852783203125, -2.78118896484375, -2.669525146484375, -2.557861328125, -2.446197509765625, -2.33453369140625, -2.222869873046875, -2.1112060546875, -1.999542236328125, -1.88787841796875, -1.776214599609375, -1.66455078125, -1.552886962890625, -1.44122314453125, -1.329559326171875, -1.2178955078125, -1.106231689453125, -0.99456787109375, -0.882904052734375, -0.771240234375, -0.659576416015625, -0.54791259765625, -0.436248779296875, -0.3245849609375, -0.212921142578125, -0.10125732421875, 0.010406494140625, 0.1220703125, 0.233734130859375, 0.34539794921875, 0.457061767578125, 0.5687255859375, 0.680389404296875, 0.79205322265625, 0.903717041015625, 1.015380859375, 1.127044677734375, 1.23870849609375, 1.350372314453125, 1.4620361328125, 1.573699951171875, 1.68536376953125, 1.797027587890625, 1.90869140625, 2.020355224609375, 2.13201904296875, 2.243682861328125, 2.3553466796875, 2.467010498046875, 2.57867431640625, 2.690338134765625, 2.802001953125, 2.913665771484375, 3.02532958984375, 3.136993408203125, 3.2486572265625, 3.360321044921875, 3.47198486328125, 3.583648681640625, 3.6953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 11.0, 16.0, 21.0, 12.0, 13.0, 22.0, 24.0, 23.0, 27.0, 24.0, 37.0, 29.0, 44.0, 31.0, 47.0, 25.0, 45.0, 30.0, 35.0, 38.0, 29.0, 39.0, 34.0, 35.0, 33.0, 28.0, 27.0, 27.0, 26.0, 24.0, 21.0, 19.0, 16.0, 12.0, 13.0, 7.0, 11.0, 9.0, 5.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.41015625, -3.30206298828125, -3.1939697265625, -3.08587646484375, -2.977783203125, -2.86968994140625, -2.7615966796875, -2.65350341796875, -2.54541015625, -2.43731689453125, -2.3292236328125, -2.22113037109375, -2.113037109375, -2.00494384765625, -1.8968505859375, -1.78875732421875, -1.6806640625, -1.57257080078125, -1.4644775390625, -1.35638427734375, -1.248291015625, -1.14019775390625, -1.0321044921875, -0.92401123046875, -0.81591796875, -0.70782470703125, -0.5997314453125, -0.49163818359375, -0.383544921875, -0.27545166015625, -0.1673583984375, -0.05926513671875, 0.048828125, 0.15692138671875, 0.2650146484375, 0.37310791015625, 0.481201171875, 0.58929443359375, 0.6973876953125, 0.80548095703125, 0.91357421875, 1.02166748046875, 1.1297607421875, 1.23785400390625, 1.345947265625, 1.45404052734375, 1.5621337890625, 1.67022705078125, 1.7783203125, 1.88641357421875, 1.9945068359375, 2.10260009765625, 2.210693359375, 2.31878662109375, 2.4268798828125, 2.53497314453125, 2.64306640625, 2.75115966796875, 2.8592529296875, 2.96734619140625, 3.075439453125, 3.18353271484375, 3.2916259765625, 3.39971923828125, 3.5078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 5.0, 11.0, 12.0, 17.0, 22.0, 22.0, 49.0, 47.0, 80.0, 89.0, 154.0, 211.0, 362.0, 642.0, 969.0, 1709.0, 3057.0, 5482.0, 10704.0, 21590.0, 47945.0, 116188.0, 274946.0, 312961.0, 140950.0, 57719.0, 25392.0, 12483.0, 6377.0, 3356.0, 1977.0, 1110.0, 683.0, 418.0, 278.0, 160.0, 110.0, 77.0, 46.0, 48.0, 23.0, 19.0, 17.0, 8.0, 14.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-2.330078125, -2.25750732421875, -2.1849365234375, -2.11236572265625, -2.039794921875, -1.96722412109375, -1.8946533203125, -1.82208251953125, -1.74951171875, -1.67694091796875, -1.6043701171875, -1.53179931640625, -1.459228515625, -1.38665771484375, -1.3140869140625, -1.24151611328125, -1.1689453125, -1.09637451171875, -1.0238037109375, -0.95123291015625, -0.878662109375, -0.80609130859375, -0.7335205078125, -0.66094970703125, -0.58837890625, -0.51580810546875, -0.4432373046875, -0.37066650390625, -0.298095703125, -0.22552490234375, -0.1529541015625, -0.08038330078125, -0.0078125, 0.06475830078125, 0.1373291015625, 0.20989990234375, 0.282470703125, 0.35504150390625, 0.4276123046875, 0.50018310546875, 0.57275390625, 0.64532470703125, 0.7178955078125, 0.79046630859375, 0.863037109375, 0.93560791015625, 1.0081787109375, 1.08074951171875, 1.1533203125, 1.22589111328125, 1.2984619140625, 1.37103271484375, 1.443603515625, 1.51617431640625, 1.5887451171875, 1.66131591796875, 1.73388671875, 1.80645751953125, 1.8790283203125, 1.95159912109375, 2.024169921875, 2.09674072265625, 2.1693115234375, 2.24188232421875, 2.314453125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 8.0, 3.0, 12.0, 15.0, 24.0, 29.0, 45.0, 58.0, 71.0, 93.0, 97.0, 109.0, 104.0, 74.0, 70.0, 52.0, 48.0, 29.0, 25.0, 15.0, 6.0, 7.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011557340621948242, -0.00011135917156934738, -0.00010714493691921234, -0.0001029307022690773, -9.871646761894226e-05, -9.450223296880722e-05, -9.028799831867218e-05, -8.607376366853714e-05, -8.18595290184021e-05, -7.764529436826706e-05, -7.343105971813202e-05, -6.921682506799698e-05, -6.500259041786194e-05, -6.07883557677269e-05, -5.657412111759186e-05, -5.235988646745682e-05, -4.814565181732178e-05, -4.393141716718674e-05, -3.97171825170517e-05, -3.5502947866916656e-05, -3.1288713216781616e-05, -2.7074478566646576e-05, -2.2860243916511536e-05, -1.8646009266376495e-05, -1.4431774616241455e-05, -1.0217539966106415e-05, -6.0033053159713745e-06, -1.7890706658363342e-06, 2.425163984298706e-06, 6.639398634433746e-06, 1.0853633284568787e-05, 1.5067867934703827e-05, 1.9282102584838867e-05, 2.3496337234973907e-05, 2.7710571885108948e-05, 3.192480653524399e-05, 3.613904118537903e-05, 4.035327583551407e-05, 4.456751048564911e-05, 4.878174513578415e-05, 5.299597978591919e-05, 5.721021443605423e-05, 6.142444908618927e-05, 6.563868373632431e-05, 6.985291838645935e-05, 7.406715303659439e-05, 7.828138768672943e-05, 8.249562233686447e-05, 8.670985698699951e-05, 9.092409163713455e-05, 9.513832628726959e-05, 9.935256093740463e-05, 0.00010356679558753967, 0.00010778103023767471, 0.00011199526488780975, 0.0001162094995379448, 0.00012042373418807983, 0.00012463796883821487, 0.00012885220348834991, 0.00013306643813848495, 0.00013728067278862, 0.00014149490743875504, 0.00014570914208889008, 0.00014992337673902512, 0.00015413761138916016]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 8.0, 10.0, 18.0, 19.0, 25.0, 56.0, 78.0, 129.0, 191.0, 296.0, 458.0, 735.0, 1299.0, 2162.0, 3820.0, 6881.0, 13817.0, 30205.0, 71794.0, 175588.0, 314336.0, 239409.0, 104900.0, 42722.0, 18876.0, 9224.0, 4697.0, 2697.0, 1568.0, 924.0, 607.0, 354.0, 206.0, 147.0, 101.0, 66.0, 40.0, 30.0, 20.0, 15.0, 6.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0], "bins": [-2.70703125, -2.6352386474609375, -2.563446044921875, -2.4916534423828125, -2.41986083984375, -2.3480682373046875, -2.276275634765625, -2.2044830322265625, -2.1326904296875, -2.0608978271484375, -1.989105224609375, -1.9173126220703125, -1.84552001953125, -1.7737274169921875, -1.701934814453125, -1.6301422119140625, -1.558349609375, -1.4865570068359375, -1.414764404296875, -1.3429718017578125, -1.27117919921875, -1.1993865966796875, -1.127593994140625, -1.0558013916015625, -0.9840087890625, -0.9122161865234375, -0.840423583984375, -0.7686309814453125, -0.69683837890625, -0.6250457763671875, -0.553253173828125, -0.4814605712890625, -0.40966796875, -0.3378753662109375, -0.266082763671875, -0.1942901611328125, -0.12249755859375, -0.0507049560546875, 0.021087646484375, 0.0928802490234375, 0.1646728515625, 0.2364654541015625, 0.308258056640625, 0.3800506591796875, 0.45184326171875, 0.5236358642578125, 0.595428466796875, 0.6672210693359375, 0.739013671875, 0.8108062744140625, 0.882598876953125, 0.9543914794921875, 1.02618408203125, 1.0979766845703125, 1.169769287109375, 1.2415618896484375, 1.3133544921875, 1.3851470947265625, 1.456939697265625, 1.5287322998046875, 1.60052490234375, 1.6723175048828125, 1.744110107421875, 1.8159027099609375, 1.8876953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 8.0, 11.0, 8.0, 22.0, 19.0, 37.0, 28.0, 40.0, 49.0, 50.0, 54.0, 67.0, 58.0, 79.0, 62.0, 55.0, 63.0, 45.0, 50.0, 24.0, 36.0, 37.0, 22.0, 15.0, 14.0, 5.0, 10.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.5704879760742188, -0.5516204833984375, -0.5327529907226562, -0.513885498046875, -0.49501800537109375, -0.4761505126953125, -0.45728302001953125, -0.43841552734375, -0.41954803466796875, -0.4006805419921875, -0.38181304931640625, -0.362945556640625, -0.34407806396484375, -0.3252105712890625, -0.30634307861328125, -0.2874755859375, -0.26860809326171875, -0.2497406005859375, -0.23087310791015625, -0.212005615234375, -0.19313812255859375, -0.1742706298828125, -0.15540313720703125, -0.13653564453125, -0.11766815185546875, -0.0988006591796875, -0.07993316650390625, -0.061065673828125, -0.04219818115234375, -0.0233306884765625, -0.00446319580078125, 0.014404296875, 0.03327178955078125, 0.0521392822265625, 0.07100677490234375, 0.089874267578125, 0.10874176025390625, 0.1276092529296875, 0.14647674560546875, 0.16534423828125, 0.18421173095703125, 0.2030792236328125, 0.22194671630859375, 0.240814208984375, 0.25968170166015625, 0.2785491943359375, 0.29741668701171875, 0.3162841796875, 0.33515167236328125, 0.3540191650390625, 0.37288665771484375, 0.391754150390625, 0.41062164306640625, 0.4294891357421875, 0.44835662841796875, 0.46722412109375, 0.48609161376953125, 0.5049591064453125, 0.5238265991210938, 0.542694091796875, 0.5615615844726562, 0.5804290771484375, 0.5992965698242188, 0.6181640625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 9.0, 10.0, 9.0, 15.0, 16.0, 31.0, 51.0, 65.0, 75.0, 108.0, 99.0, 125.0, 108.0, 81.0, 50.0, 49.0, 23.0, 20.0, 9.0, 11.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.352155685424805, -16.916059494018555, -16.479961395263672, -16.043865203857422, -15.607767105102539, -15.171670913696289, -14.735572814941406, -14.299476623535156, -13.86337947845459, -13.427282333374023, -12.991185188293457, -12.55508804321289, -12.118990898132324, -11.682893753051758, -11.246797561645508, -10.810700416564941, -10.374603271484375, -9.938506126403809, -9.502408981323242, -9.066311836242676, -8.63021469116211, -8.19411849975586, -7.758020877838135, -7.321924209594727, -6.885826110839844, -6.449728965759277, -6.013631820678711, -5.5775346755981445, -5.141438007354736, -4.70534086227417, -4.2692437171936035, -3.833146810531616, -3.397049903869629, -2.9609527587890625, -2.524855852127075, -2.088758707046509, -1.652661681175232, -1.216564655303955, -0.7804675102233887, -0.34437060356140137, 0.09172654151916504, 0.5278235673904419, 0.9639206528663635, 1.4000177383422852, 1.836114764213562, 2.272211790084839, 2.7083089351654053, 3.1444058418273926, 3.580502986907959, 4.016600131988525, 4.452697277069092, 4.8887939453125, 5.324891090393066, 5.760988235473633, 6.197085380554199, 6.633182525634766, 7.069279670715332, 7.505376815795898, 7.941473960876465, 8.377571105957031, 8.813668251037598, 9.249765396118164, 9.685861587524414, 10.12195873260498, 10.558055877685547]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 11.0, 9.0, 7.0, 8.0, 17.0, 13.0, 17.0, 24.0, 36.0, 25.0, 30.0, 31.0, 25.0, 40.0, 44.0, 45.0, 43.0, 56.0, 41.0, 45.0, 45.0, 46.0, 34.0, 36.0, 36.0, 35.0, 35.0, 19.0, 21.0, 25.0, 17.0, 12.0, 13.0, 13.0, 9.0, 6.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.585238933563232, -6.3816914558410645, -6.1781439781188965, -5.9745965003967285, -5.771048545837402, -5.567501068115234, -5.363953590393066, -5.160406112670898, -4.9568586349487305, -4.7533111572265625, -4.5497636795043945, -4.346216201782227, -4.142668724060059, -3.9391210079193115, -3.7355732917785645, -3.5320258140563965, -3.3284783363342285, -3.1249308586120605, -2.9213833808898926, -2.7178356647491455, -2.5142881870269775, -2.3107407093048096, -2.1071929931640625, -1.9036455154418945, -1.7000980377197266, -1.4965505599975586, -1.293002963066101, -1.0894553661346436, -0.8859078884124756, -0.6823604106903076, -0.4788128137588501, -0.2752652168273926, -0.07171773910522461, 0.13182979822158813, 0.3353773355484009, 0.5389248728752136, 0.7424724102020264, 0.9460198879241943, 1.1495674848556519, 1.3531150817871094, 1.5566625595092773, 1.7602100372314453, 1.9637576341629028, 2.1673052310943604, 2.3708527088165283, 2.5744001865386963, 2.7779479026794434, 2.9814953804016113, 3.1850428581237793, 3.3885903358459473, 3.5921378135681152, 3.7956855297088623, 3.9992330074310303, 4.202780723571777, 4.406328201293945, 4.609875679016113, 4.813423156738281, 5.016970634460449, 5.220518112182617, 5.424065589904785, 5.627613067626953, 5.831160545349121, 6.034708499908447, 6.238255977630615, 6.441803455352783]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 12.0, 15.0, 32.0, 40.0, 61.0, 59.0, 135.0, 181.0, 251.0, 371.0, 547.0, 878.0, 1307.0, 2067.0, 3256.0, 5411.0, 9334.0, 15767.0, 28727.0, 52994.0, 95855.0, 156487.0, 200991.0, 184104.0, 125888.0, 72467.0, 38995.0, 21476.0, 11873.0, 7084.0, 4377.0, 2616.0, 1651.0, 1045.0, 691.0, 486.0, 310.0, 223.0, 154.0, 83.0, 71.0, 56.0, 35.0, 31.0, 11.0, 17.0, 8.0, 8.0, 7.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.6015625, -6.4000244140625, -6.198486328125, -5.9969482421875, -5.79541015625, -5.5938720703125, -5.392333984375, -5.1907958984375, -4.9892578125, -4.7877197265625, -4.586181640625, -4.3846435546875, -4.18310546875, -3.9815673828125, -3.780029296875, -3.5784912109375, -3.376953125, -3.1754150390625, -2.973876953125, -2.7723388671875, -2.57080078125, -2.3692626953125, -2.167724609375, -1.9661865234375, -1.7646484375, -1.5631103515625, -1.361572265625, -1.1600341796875, -0.95849609375, -0.7569580078125, -0.555419921875, -0.3538818359375, -0.15234375, 0.0491943359375, 0.250732421875, 0.4522705078125, 0.65380859375, 0.8553466796875, 1.056884765625, 1.2584228515625, 1.4599609375, 1.6614990234375, 1.863037109375, 2.0645751953125, 2.26611328125, 2.4676513671875, 2.669189453125, 2.8707275390625, 3.072265625, 3.2738037109375, 3.475341796875, 3.6768798828125, 3.87841796875, 4.0799560546875, 4.281494140625, 4.4830322265625, 4.6845703125, 4.8861083984375, 5.087646484375, 5.2891845703125, 5.49072265625, 5.6922607421875, 5.893798828125, 6.0953369140625, 6.296875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 6.0, 6.0, 15.0, 17.0, 18.0, 26.0, 39.0, 23.0, 25.0, 37.0, 44.0, 38.0, 41.0, 44.0, 57.0, 57.0, 36.0, 52.0, 59.0, 46.0, 29.0, 38.0, 38.0, 36.0, 32.0, 16.0, 18.0, 15.0, 15.0, 13.0, 11.0, 8.0, 5.0, 4.0, 4.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.74609375, -6.51226806640625, -6.2784423828125, -6.04461669921875, -5.810791015625, -5.57696533203125, -5.3431396484375, -5.10931396484375, -4.87548828125, -4.64166259765625, -4.4078369140625, -4.17401123046875, -3.940185546875, -3.70635986328125, -3.4725341796875, -3.23870849609375, -3.0048828125, -2.77105712890625, -2.5372314453125, -2.30340576171875, -2.069580078125, -1.83575439453125, -1.6019287109375, -1.36810302734375, -1.13427734375, -0.90045166015625, -0.6666259765625, -0.43280029296875, -0.198974609375, 0.03485107421875, 0.2686767578125, 0.50250244140625, 0.736328125, 0.97015380859375, 1.2039794921875, 1.43780517578125, 1.671630859375, 1.90545654296875, 2.1392822265625, 2.37310791015625, 2.60693359375, 2.84075927734375, 3.0745849609375, 3.30841064453125, 3.542236328125, 3.77606201171875, 4.0098876953125, 4.24371337890625, 4.4775390625, 4.71136474609375, 4.9451904296875, 5.17901611328125, 5.412841796875, 5.64666748046875, 5.8804931640625, 6.11431884765625, 6.34814453125, 6.58197021484375, 6.8157958984375, 7.04962158203125, 7.283447265625, 7.51727294921875, 7.7510986328125, 7.98492431640625, 8.21875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 5.0, 16.0, 10.0, 23.0, 36.0, 54.0, 63.0, 104.0, 175.0, 210.0, 357.0, 482.0, 711.0, 1123.0, 1710.0, 2720.0, 4101.0, 6663.0, 10718.0, 17180.0, 27830.0, 45874.0, 73337.0, 111592.0, 148560.0, 164165.0, 143737.0, 105837.0, 68861.0, 42825.0, 26254.0, 15879.0, 9838.0, 6241.0, 3889.0, 2557.0, 1590.0, 1060.0, 707.0, 451.0, 327.0, 229.0, 130.0, 104.0, 74.0, 39.0, 33.0, 23.0, 13.0, 12.0, 13.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.32421875, -5.1600341796875, -4.995849609375, -4.8316650390625, -4.66748046875, -4.5032958984375, -4.339111328125, -4.1749267578125, -4.0107421875, -3.8465576171875, -3.682373046875, -3.5181884765625, -3.35400390625, -3.1898193359375, -3.025634765625, -2.8614501953125, -2.697265625, -2.5330810546875, -2.368896484375, -2.2047119140625, -2.04052734375, -1.8763427734375, -1.712158203125, -1.5479736328125, -1.3837890625, -1.2196044921875, -1.055419921875, -0.8912353515625, -0.72705078125, -0.5628662109375, -0.398681640625, -0.2344970703125, -0.0703125, 0.0938720703125, 0.258056640625, 0.4222412109375, 0.58642578125, 0.7506103515625, 0.914794921875, 1.0789794921875, 1.2431640625, 1.4073486328125, 1.571533203125, 1.7357177734375, 1.89990234375, 2.0640869140625, 2.228271484375, 2.3924560546875, 2.556640625, 2.7208251953125, 2.885009765625, 3.0491943359375, 3.21337890625, 3.3775634765625, 3.541748046875, 3.7059326171875, 3.8701171875, 4.0343017578125, 4.198486328125, 4.3626708984375, 4.52685546875, 4.6910400390625, 4.855224609375, 5.0194091796875, 5.18359375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 1.0, 2.0, 5.0, 8.0, 9.0, 8.0, 14.0, 16.0, 21.0, 17.0, 13.0, 22.0, 20.0, 23.0, 29.0, 28.0, 33.0, 33.0, 30.0, 42.0, 50.0, 34.0, 47.0, 55.0, 36.0, 37.0, 47.0, 43.0, 23.0, 25.0, 28.0, 34.0, 19.0, 19.0, 17.0, 17.0, 16.0, 11.0, 12.0, 14.0, 8.0, 12.0, 3.0, 6.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.8359375, -3.720062255859375, -3.60418701171875, -3.488311767578125, -3.3724365234375, -3.256561279296875, -3.14068603515625, -3.024810791015625, -2.908935546875, -2.793060302734375, -2.67718505859375, -2.561309814453125, -2.4454345703125, -2.329559326171875, -2.21368408203125, -2.097808837890625, -1.98193359375, -1.866058349609375, -1.75018310546875, -1.634307861328125, -1.5184326171875, -1.402557373046875, -1.28668212890625, -1.170806884765625, -1.054931640625, -0.939056396484375, -0.82318115234375, -0.707305908203125, -0.5914306640625, -0.475555419921875, -0.35968017578125, -0.243804931640625, -0.1279296875, -0.012054443359375, 0.10382080078125, 0.219696044921875, 0.3355712890625, 0.451446533203125, 0.56732177734375, 0.683197021484375, 0.799072265625, 0.914947509765625, 1.03082275390625, 1.146697998046875, 1.2625732421875, 1.378448486328125, 1.49432373046875, 1.610198974609375, 1.72607421875, 1.841949462890625, 1.95782470703125, 2.073699951171875, 2.1895751953125, 2.305450439453125, 2.42132568359375, 2.537200927734375, 2.653076171875, 2.768951416015625, 2.88482666015625, 3.000701904296875, 3.1165771484375, 3.232452392578125, 3.34832763671875, 3.464202880859375, 3.580078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 14.0, 20.0, 27.0, 42.0, 68.0, 107.0, 148.0, 243.0, 327.0, 505.0, 749.0, 1171.0, 1956.0, 3274.0, 5429.0, 9239.0, 16854.0, 30431.0, 56266.0, 101486.0, 165711.0, 209393.0, 181772.0, 115838.0, 65605.0, 35515.0, 19333.0, 11054.0, 6229.0, 3621.0, 2205.0, 1365.0, 818.0, 570.0, 381.0, 271.0, 172.0, 130.0, 67.0, 44.0, 35.0, 23.0, 17.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.712890625, -3.608673095703125, -3.50445556640625, -3.400238037109375, -3.2960205078125, -3.191802978515625, -3.08758544921875, -2.983367919921875, -2.879150390625, -2.774932861328125, -2.67071533203125, -2.566497802734375, -2.4622802734375, -2.358062744140625, -2.25384521484375, -2.149627685546875, -2.04541015625, -1.941192626953125, -1.83697509765625, -1.732757568359375, -1.6285400390625, -1.524322509765625, -1.42010498046875, -1.315887451171875, -1.211669921875, -1.107452392578125, -1.00323486328125, -0.899017333984375, -0.7947998046875, -0.690582275390625, -0.58636474609375, -0.482147216796875, -0.3779296875, -0.273712158203125, -0.16949462890625, -0.065277099609375, 0.0389404296875, 0.143157958984375, 0.24737548828125, 0.351593017578125, 0.455810546875, 0.560028076171875, 0.66424560546875, 0.768463134765625, 0.8726806640625, 0.976898193359375, 1.08111572265625, 1.185333251953125, 1.28955078125, 1.393768310546875, 1.49798583984375, 1.602203369140625, 1.7064208984375, 1.810638427734375, 1.91485595703125, 2.019073486328125, 2.123291015625, 2.227508544921875, 2.33172607421875, 2.435943603515625, 2.5401611328125, 2.644378662109375, 2.74859619140625, 2.852813720703125, 2.95703125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 10.0, 8.0, 13.0, 17.0, 17.0, 29.0, 46.0, 47.0, 64.0, 63.0, 64.0, 81.0, 78.0, 83.0, 69.0, 60.0, 56.0, 44.0, 26.0, 19.0, 25.0, 18.0, 10.0, 13.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002994537353515625, -0.00028853118419647217, -0.00027760863304138184, -0.0002666860818862915, -0.00025576353073120117, -0.00024484097957611084, -0.0002339184284210205, -0.00022299587726593018, -0.00021207332611083984, -0.0002011507749557495, -0.00019022822380065918, -0.00017930567264556885, -0.00016838312149047852, -0.00015746057033538818, -0.00014653801918029785, -0.00013561546802520752, -0.0001246929168701172, -0.00011377036571502686, -0.00010284781455993652, -9.192526340484619e-05, -8.100271224975586e-05, -7.008016109466553e-05, -5.9157609939575195e-05, -4.823505878448486e-05, -3.731250762939453e-05, -2.63899564743042e-05, -1.5467405319213867e-05, -4.544854164123535e-06, 6.377696990966797e-06, 1.730024814605713e-05, 2.822279930114746e-05, 3.914535045623779e-05, 5.0067901611328125e-05, 6.099045276641846e-05, 7.191300392150879e-05, 8.283555507659912e-05, 9.375810623168945e-05, 0.00010468065738677979, 0.00011560320854187012, 0.00012652575969696045, 0.00013744831085205078, 0.0001483708620071411, 0.00015929341316223145, 0.00017021596431732178, 0.0001811385154724121, 0.00019206106662750244, 0.00020298361778259277, 0.0002139061689376831, 0.00022482872009277344, 0.00023575127124786377, 0.0002466738224029541, 0.00025759637355804443, 0.00026851892471313477, 0.0002794414758682251, 0.00029036402702331543, 0.00030128657817840576, 0.0003122091293334961, 0.0003231316804885864, 0.00033405423164367676, 0.0003449767827987671, 0.0003558993339538574, 0.00036682188510894775, 0.0003777444362640381, 0.0003886669874191284, 0.00039958953857421875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 15.0, 25.0, 17.0, 25.0, 56.0, 100.0, 130.0, 239.0, 359.0, 597.0, 978.0, 1797.0, 3267.0, 6138.0, 11531.0, 22807.0, 45645.0, 90281.0, 161897.0, 226078.0, 206504.0, 130399.0, 68414.0, 34340.0, 17136.0, 8821.0, 4689.0, 2690.0, 1429.0, 808.0, 498.0, 302.0, 209.0, 123.0, 58.0, 42.0, 36.0, 21.0, 11.0, 12.0, 6.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0], "bins": [-4.1875, -4.073699951171875, -3.95989990234375, -3.846099853515625, -3.7322998046875, -3.618499755859375, -3.50469970703125, -3.390899658203125, -3.277099609375, -3.163299560546875, -3.04949951171875, -2.935699462890625, -2.8218994140625, -2.708099365234375, -2.59429931640625, -2.480499267578125, -2.36669921875, -2.252899169921875, -2.13909912109375, -2.025299072265625, -1.9114990234375, -1.797698974609375, -1.68389892578125, -1.570098876953125, -1.456298828125, -1.342498779296875, -1.22869873046875, -1.114898681640625, -1.0010986328125, -0.887298583984375, -0.77349853515625, -0.659698486328125, -0.5458984375, -0.432098388671875, -0.31829833984375, -0.204498291015625, -0.0906982421875, 0.023101806640625, 0.13690185546875, 0.250701904296875, 0.364501953125, 0.478302001953125, 0.59210205078125, 0.705902099609375, 0.8197021484375, 0.933502197265625, 1.04730224609375, 1.161102294921875, 1.27490234375, 1.388702392578125, 1.50250244140625, 1.616302490234375, 1.7301025390625, 1.843902587890625, 1.95770263671875, 2.071502685546875, 2.185302734375, 2.299102783203125, 2.41290283203125, 2.526702880859375, 2.6405029296875, 2.754302978515625, 2.86810302734375, 2.981903076171875, 3.095703125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 13.0, 14.0, 16.0, 18.0, 24.0, 42.0, 40.0, 59.0, 62.0, 78.0, 80.0, 79.0, 81.0, 65.0, 73.0, 49.0, 60.0, 38.0, 13.0, 20.0, 21.0, 8.0, 5.0, 12.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.6259765625, -1.582733154296875, -1.53948974609375, -1.496246337890625, -1.4530029296875, -1.409759521484375, -1.36651611328125, -1.323272705078125, -1.280029296875, -1.236785888671875, -1.19354248046875, -1.150299072265625, -1.1070556640625, -1.063812255859375, -1.02056884765625, -0.977325439453125, -0.93408203125, -0.890838623046875, -0.84759521484375, -0.804351806640625, -0.7611083984375, -0.717864990234375, -0.67462158203125, -0.631378173828125, -0.588134765625, -0.544891357421875, -0.50164794921875, -0.458404541015625, -0.4151611328125, -0.371917724609375, -0.32867431640625, -0.285430908203125, -0.2421875, -0.198944091796875, -0.15570068359375, -0.112457275390625, -0.0692138671875, -0.025970458984375, 0.01727294921875, 0.060516357421875, 0.103759765625, 0.147003173828125, 0.19024658203125, 0.233489990234375, 0.2767333984375, 0.319976806640625, 0.36322021484375, 0.406463623046875, 0.44970703125, 0.492950439453125, 0.53619384765625, 0.579437255859375, 0.6226806640625, 0.665924072265625, 0.70916748046875, 0.752410888671875, 0.795654296875, 0.838897705078125, 0.88214111328125, 0.925384521484375, 0.9686279296875, 1.011871337890625, 1.05511474609375, 1.098358154296875, 1.1416015625]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 11.0, 6.0, 8.0, 9.0, 7.0, 16.0, 17.0, 30.0, 34.0, 62.0, 85.0, 82.0, 111.0, 102.0, 96.0, 70.0, 73.0, 54.0, 36.0, 34.0, 10.0, 12.0, 10.0, 7.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.316097259521484, -14.924983024597168, -14.533867835998535, -14.142753601074219, -13.751639366149902, -13.36052417755127, -12.969409942626953, -12.57829475402832, -12.187180519104004, -11.796066284179688, -11.404951095581055, -11.013836860656738, -10.622722625732422, -10.231607437133789, -9.840493202209473, -9.449378967285156, -9.058263778686523, -8.667149543762207, -8.276034355163574, -7.884920120239258, -7.493805408477783, -7.102690696716309, -6.711576461791992, -6.320461750030518, -5.929347991943359, -5.538233280181885, -5.147119045257568, -4.756004333496094, -4.364889621734619, -3.9737751483917236, -3.582660675048828, -3.1915459632873535, -2.800431251525879, -2.4093167781829834, -2.018202066421509, -1.6270875930786133, -1.2359730005264282, -0.8448584079742432, -0.45374393463134766, -0.06262922286987305, 0.32848525047302246, 0.7195998430252075, 1.1107144355773926, 1.501828908920288, 1.8929435014724731, 2.284058094024658, 2.6751725673675537, 3.0662872791290283, 3.457401752471924, 3.8485162258148193, 4.239630699157715, 4.6307454109191895, 5.021860122680664, 5.4129743576049805, 5.804089069366455, 6.19520378112793, 6.586318016052246, 6.977432727813721, 7.368546962738037, 7.759661674499512, 8.150775909423828, 8.541891098022461, 8.933005332946777, 9.324119567871094, 9.715234756469727]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 7.0, 5.0, 9.0, 14.0, 12.0, 19.0, 9.0, 15.0, 23.0, 25.0, 28.0, 27.0, 39.0, 44.0, 39.0, 43.0, 51.0, 49.0, 52.0, 42.0, 32.0, 52.0, 39.0, 48.0, 30.0, 32.0, 24.0, 30.0, 24.0, 22.0, 18.0, 9.0, 11.0, 14.0, 9.0, 12.0, 12.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.461526393890381, -6.257798194885254, -6.054069519042969, -5.850341320037842, -5.646613121032715, -5.442884922027588, -5.239156723022461, -5.035428047180176, -4.831699848175049, -4.627971649169922, -4.424242973327637, -4.22051477432251, -4.016786575317383, -3.813058376312256, -3.60932993888855, -3.4056015014648438, -3.201873302459717, -2.99814510345459, -2.794416666030884, -2.5906882286071777, -2.386960029602051, -2.183231830596924, -1.9795033931732178, -1.7757750749588013, -1.5720467567443848, -1.3683184385299683, -1.1645901203155518, -0.9608618021011353, -0.7571334838867188, -0.5534051656723022, -0.34967684745788574, -0.14594852924346924, 0.05777931213378906, 0.26150763034820557, 0.46523594856262207, 0.6689642667770386, 0.8726925849914551, 1.0764209032058716, 1.280149221420288, 1.4838775396347046, 1.687605857849121, 1.8913341760635376, 2.095062494277954, 2.29879093170166, 2.502519130706787, 2.706247329711914, 2.90997576713562, 3.113704204559326, 3.317432403564453, 3.52116060256958, 3.724889039993286, 3.928617477416992, 4.132345676422119, 4.336073875427246, 4.539802551269531, 4.743530750274658, 4.947258949279785, 5.150987148284912, 5.354715347290039, 5.558444023132324, 5.762172222137451, 5.965900421142578, 6.169629096984863, 6.37335729598999, 6.577085494995117]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 10.0, 16.0, 31.0, 34.0, 60.0, 87.0, 123.0, 154.0, 236.0, 295.0, 474.0, 687.0, 1037.0, 1576.0, 2345.0, 3522.0, 5888.0, 9360.0, 17051.0, 33053.0, 76030.0, 210161.0, 663047.0, 1474848.0, 1097783.0, 372793.0, 120593.0, 47379.0, 22198.0, 12034.0, 7291.0, 4536.0, 2899.0, 2006.0, 1342.0, 967.0, 653.0, 473.0, 331.0, 245.0, 174.0, 131.0, 82.0, 59.0, 60.0, 35.0, 22.0, 21.0, 18.0, 11.0, 10.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 2.0], "bins": [-9.8046875, -9.47509765625, -9.1455078125, -8.81591796875, -8.486328125, -8.15673828125, -7.8271484375, -7.49755859375, -7.16796875, -6.83837890625, -6.5087890625, -6.17919921875, -5.849609375, -5.52001953125, -5.1904296875, -4.86083984375, -4.53125, -4.20166015625, -3.8720703125, -3.54248046875, -3.212890625, -2.88330078125, -2.5537109375, -2.22412109375, -1.89453125, -1.56494140625, -1.2353515625, -0.90576171875, -0.576171875, -0.24658203125, 0.0830078125, 0.41259765625, 0.7421875, 1.07177734375, 1.4013671875, 1.73095703125, 2.060546875, 2.39013671875, 2.7197265625, 3.04931640625, 3.37890625, 3.70849609375, 4.0380859375, 4.36767578125, 4.697265625, 5.02685546875, 5.3564453125, 5.68603515625, 6.015625, 6.34521484375, 6.6748046875, 7.00439453125, 7.333984375, 7.66357421875, 7.9931640625, 8.32275390625, 8.65234375, 8.98193359375, 9.3115234375, 9.64111328125, 9.970703125, 10.30029296875, 10.6298828125, 10.95947265625, 11.2890625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 4.0, 9.0, 9.0, 2.0, 15.0, 12.0, 15.0, 17.0, 23.0, 25.0, 29.0, 34.0, 28.0, 42.0, 49.0, 40.0, 45.0, 46.0, 51.0, 48.0, 52.0, 38.0, 56.0, 41.0, 36.0, 36.0, 33.0, 24.0, 21.0, 18.0, 13.0, 15.0, 17.0, 7.0, 13.0, 11.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.65625, -4.50616455078125, -4.3560791015625, -4.20599365234375, -4.055908203125, -3.90582275390625, -3.7557373046875, -3.60565185546875, -3.45556640625, -3.30548095703125, -3.1553955078125, -3.00531005859375, -2.855224609375, -2.70513916015625, -2.5550537109375, -2.40496826171875, -2.2548828125, -2.10479736328125, -1.9547119140625, -1.80462646484375, -1.654541015625, -1.50445556640625, -1.3543701171875, -1.20428466796875, -1.05419921875, -0.90411376953125, -0.7540283203125, -0.60394287109375, -0.453857421875, -0.30377197265625, -0.1536865234375, -0.00360107421875, 0.146484375, 0.29656982421875, 0.4466552734375, 0.59674072265625, 0.746826171875, 0.89691162109375, 1.0469970703125, 1.19708251953125, 1.34716796875, 1.49725341796875, 1.6473388671875, 1.79742431640625, 1.947509765625, 2.09759521484375, 2.2476806640625, 2.39776611328125, 2.5478515625, 2.69793701171875, 2.8480224609375, 2.99810791015625, 3.148193359375, 3.29827880859375, 3.4483642578125, 3.59844970703125, 3.74853515625, 3.89862060546875, 4.0487060546875, 4.19879150390625, 4.348876953125, 4.49896240234375, 4.6490478515625, 4.79913330078125, 4.94921875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 7.0, 3.0, 9.0, 14.0, 16.0, 36.0, 31.0, 57.0, 100.0, 127.0, 247.0, 388.0, 639.0, 1125.0, 2056.0, 3502.0, 6591.0, 12933.0, 26734.0, 62844.0, 178864.0, 615104.0, 1594887.0, 1152115.0, 346036.0, 108639.0, 41538.0, 18800.0, 9426.0, 4859.0, 2772.0, 1566.0, 893.0, 515.0, 320.0, 196.0, 105.0, 66.0, 51.0, 27.0, 19.0, 17.0, 10.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.6171875, -13.2139892578125, -12.810791015625, -12.4075927734375, -12.00439453125, -11.6011962890625, -11.197998046875, -10.7947998046875, -10.3916015625, -9.9884033203125, -9.585205078125, -9.1820068359375, -8.77880859375, -8.3756103515625, -7.972412109375, -7.5692138671875, -7.166015625, -6.7628173828125, -6.359619140625, -5.9564208984375, -5.55322265625, -5.1500244140625, -4.746826171875, -4.3436279296875, -3.9404296875, -3.5372314453125, -3.134033203125, -2.7308349609375, -2.32763671875, -1.9244384765625, -1.521240234375, -1.1180419921875, -0.71484375, -0.3116455078125, 0.091552734375, 0.4947509765625, 0.89794921875, 1.3011474609375, 1.704345703125, 2.1075439453125, 2.5107421875, 2.9139404296875, 3.317138671875, 3.7203369140625, 4.12353515625, 4.5267333984375, 4.929931640625, 5.3331298828125, 5.736328125, 6.1395263671875, 6.542724609375, 6.9459228515625, 7.34912109375, 7.7523193359375, 8.155517578125, 8.5587158203125, 8.9619140625, 9.3651123046875, 9.768310546875, 10.1715087890625, 10.57470703125, 10.9779052734375, 11.381103515625, 11.7843017578125, 12.1875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 6.0, 5.0, 12.0, 12.0, 18.0, 20.0, 21.0, 23.0, 41.0, 41.0, 60.0, 64.0, 76.0, 118.0, 143.0, 189.0, 233.0, 249.0, 309.0, 306.0, 299.0, 305.0, 293.0, 262.0, 213.0, 166.0, 113.0, 115.0, 65.0, 65.0, 48.0, 41.0, 26.0, 24.0, 21.0, 17.0, 8.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.169921875, -3.082427978515625, -2.99493408203125, -2.907440185546875, -2.8199462890625, -2.732452392578125, -2.64495849609375, -2.557464599609375, -2.469970703125, -2.382476806640625, -2.29498291015625, -2.207489013671875, -2.1199951171875, -2.032501220703125, -1.94500732421875, -1.857513427734375, -1.77001953125, -1.682525634765625, -1.59503173828125, -1.507537841796875, -1.4200439453125, -1.332550048828125, -1.24505615234375, -1.157562255859375, -1.070068359375, -0.982574462890625, -0.89508056640625, -0.807586669921875, -0.7200927734375, -0.632598876953125, -0.54510498046875, -0.457611083984375, -0.3701171875, -0.282623291015625, -0.19512939453125, -0.107635498046875, -0.0201416015625, 0.067352294921875, 0.15484619140625, 0.242340087890625, 0.329833984375, 0.417327880859375, 0.50482177734375, 0.592315673828125, 0.6798095703125, 0.767303466796875, 0.85479736328125, 0.942291259765625, 1.02978515625, 1.117279052734375, 1.20477294921875, 1.292266845703125, 1.3797607421875, 1.467254638671875, 1.55474853515625, 1.642242431640625, 1.729736328125, 1.817230224609375, 1.90472412109375, 1.992218017578125, 2.0797119140625, 2.167205810546875, 2.25469970703125, 2.342193603515625, 2.4296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 12.0, 15.0, 19.0, 37.0, 65.0, 69.0, 111.0, 160.0, 166.0, 107.0, 76.0, 54.0, 34.0, 20.0, 16.0, 14.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-25.68865966796875, -25.15268898010254, -24.61672019958496, -24.08074951171875, -23.544780731201172, -23.00881004333496, -22.472841262817383, -21.936870574951172, -21.400901794433594, -20.864931106567383, -20.328962326049805, -19.792991638183594, -19.257022857666016, -18.721052169799805, -18.185083389282227, -17.649112701416016, -17.113142013549805, -16.577171325683594, -16.041202545166016, -15.505232810974121, -14.969263076782227, -14.433292388916016, -13.897322654724121, -13.361352920532227, -12.825383186340332, -12.289413452148438, -11.753443717956543, -11.217473983764648, -10.681503295898438, -10.14553451538086, -9.609563827514648, -9.073594093322754, -8.537625312805176, -8.001655578613281, -7.465685844421387, -6.929715633392334, -6.3937458992004395, -5.857776165008545, -5.321805953979492, -4.785836219787598, -4.249866485595703, -3.7138967514038086, -3.177926778793335, -2.6419568061828613, -2.105987071990967, -1.5700173377990723, -1.0340473651885986, -0.498077392578125, 0.03789234161376953, 0.5738621950149536, 1.1098320484161377, 1.6458019018173218, 2.181771755218506, 2.7177414894104004, 3.253711462020874, 3.7896814346313477, 4.325651168823242, 4.861620903015137, 5.397590637207031, 5.933560848236084, 6.4695305824279785, 7.005500316619873, 7.541470527648926, 8.07744026184082, 8.613409996032715]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 8.0, 5.0, 13.0, 8.0, 8.0, 20.0, 18.0, 16.0, 21.0, 33.0, 36.0, 36.0, 33.0, 32.0, 39.0, 48.0, 40.0, 51.0, 39.0, 43.0, 46.0, 31.0, 44.0, 42.0, 40.0, 41.0, 30.0, 32.0, 22.0, 15.0, 15.0, 15.0, 14.0, 15.0, 10.0, 4.0, 5.0, 7.0, 4.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.42673921585083, -5.243031978607178, -5.059325218200684, -4.875617980957031, -4.691911220550537, -4.508203983306885, -4.324497222900391, -4.140789985656738, -3.957082986831665, -3.773375988006592, -3.5896689891815186, -3.4059619903564453, -3.222254753112793, -3.038547992706299, -2.8548407554626465, -2.6711337566375732, -2.4874267578125, -2.3037197589874268, -2.1200127601623535, -1.9363056421279907, -1.7525986433029175, -1.5688916444778442, -1.3851845264434814, -1.2014775276184082, -1.017770528793335, -0.8340635299682617, -0.6503564715385437, -0.4666494131088257, -0.28294241428375244, -0.0992354154586792, 0.0844717025756836, 0.26817870140075684, 0.4518852233886719, 0.6355922222137451, 0.8192992806434631, 1.0030063390731812, 1.1867133378982544, 1.3704203367233276, 1.5541274547576904, 1.7378344535827637, 1.921541452407837, 2.10524845123291, 2.2889554500579834, 2.4726624488830566, 2.656369686126709, 2.840076446533203, 3.0237836837768555, 3.2074906826019287, 3.391197681427002, 3.574904680252075, 3.7586116790771484, 3.942318916320801, 4.126025676727295, 4.309732913970947, 4.493439674377441, 4.677146911621094, 4.860854148864746, 5.044561386108398, 5.228268146514893, 5.411975383758545, 5.595682144165039, 5.779389381408691, 5.963096618652344, 6.146803379058838, 6.330510139465332]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 10.0, 21.0, 14.0, 22.0, 35.0, 43.0, 63.0, 116.0, 152.0, 206.0, 346.0, 506.0, 920.0, 1475.0, 2599.0, 4551.0, 8722.0, 16875.0, 34882.0, 74953.0, 155643.0, 258979.0, 237157.0, 130094.0, 60664.0, 28759.0, 14133.0, 7106.0, 3898.0, 2165.0, 1247.0, 755.0, 486.0, 333.0, 203.0, 128.0, 87.0, 59.0, 47.0, 31.0, 20.0, 18.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-4.09375, -3.972869873046875, -3.85198974609375, -3.731109619140625, -3.6102294921875, -3.489349365234375, -3.36846923828125, -3.247589111328125, -3.126708984375, -3.005828857421875, -2.88494873046875, -2.764068603515625, -2.6431884765625, -2.522308349609375, -2.40142822265625, -2.280548095703125, -2.15966796875, -2.038787841796875, -1.91790771484375, -1.797027587890625, -1.6761474609375, -1.555267333984375, -1.43438720703125, -1.313507080078125, -1.192626953125, -1.071746826171875, -0.95086669921875, -0.829986572265625, -0.7091064453125, -0.588226318359375, -0.46734619140625, -0.346466064453125, -0.2255859375, -0.104705810546875, 0.01617431640625, 0.137054443359375, 0.2579345703125, 0.378814697265625, 0.49969482421875, 0.620574951171875, 0.741455078125, 0.862335205078125, 0.98321533203125, 1.104095458984375, 1.2249755859375, 1.345855712890625, 1.46673583984375, 1.587615966796875, 1.70849609375, 1.829376220703125, 1.95025634765625, 2.071136474609375, 2.1920166015625, 2.312896728515625, 2.43377685546875, 2.554656982421875, 2.675537109375, 2.796417236328125, 2.91729736328125, 3.038177490234375, 3.1590576171875, 3.279937744140625, 3.40081787109375, 3.521697998046875, 3.642578125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 11.0, 15.0, 17.0, 11.0, 13.0, 33.0, 17.0, 19.0, 38.0, 36.0, 25.0, 42.0, 43.0, 49.0, 53.0, 46.0, 46.0, 53.0, 47.0, 43.0, 36.0, 46.0, 31.0, 28.0, 36.0, 27.0, 16.0, 22.0, 22.0, 12.0, 17.0, 9.0, 3.0, 3.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.953125, -5.7430419921875, -5.532958984375, -5.3228759765625, -5.11279296875, -4.9027099609375, -4.692626953125, -4.4825439453125, -4.2724609375, -4.0623779296875, -3.852294921875, -3.6422119140625, -3.43212890625, -3.2220458984375, -3.011962890625, -2.8018798828125, -2.591796875, -2.3817138671875, -2.171630859375, -1.9615478515625, -1.75146484375, -1.5413818359375, -1.331298828125, -1.1212158203125, -0.9111328125, -0.7010498046875, -0.490966796875, -0.2808837890625, -0.07080078125, 0.1392822265625, 0.349365234375, 0.5594482421875, 0.76953125, 0.9796142578125, 1.189697265625, 1.3997802734375, 1.60986328125, 1.8199462890625, 2.030029296875, 2.2401123046875, 2.4501953125, 2.6602783203125, 2.870361328125, 3.0804443359375, 3.29052734375, 3.5006103515625, 3.710693359375, 3.9207763671875, 4.130859375, 4.3409423828125, 4.551025390625, 4.7611083984375, 4.97119140625, 5.1812744140625, 5.391357421875, 5.6014404296875, 5.8115234375, 6.0216064453125, 6.231689453125, 6.4417724609375, 6.65185546875, 6.8619384765625, 7.072021484375, 7.2821044921875, 7.4921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 4.0, 6.0, 7.0, 12.0, 9.0, 18.0, 20.0, 28.0, 45.0, 69.0, 83.0, 141.0, 215.0, 344.0, 540.0, 992.0, 1828.0, 3648.0, 7641.0, 17346.0, 43661.0, 122207.0, 312116.0, 325180.0, 130735.0, 47263.0, 18169.0, 7933.0, 3796.0, 1949.0, 1013.0, 570.0, 327.0, 196.0, 126.0, 94.0, 66.0, 55.0, 32.0, 11.0, 18.0, 12.0, 10.0, 2.0, 7.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.88671875, -5.7137451171875, -5.540771484375, -5.3677978515625, -5.19482421875, -5.0218505859375, -4.848876953125, -4.6759033203125, -4.5029296875, -4.3299560546875, -4.156982421875, -3.9840087890625, -3.81103515625, -3.6380615234375, -3.465087890625, -3.2921142578125, -3.119140625, -2.9461669921875, -2.773193359375, -2.6002197265625, -2.42724609375, -2.2542724609375, -2.081298828125, -1.9083251953125, -1.7353515625, -1.5623779296875, -1.389404296875, -1.2164306640625, -1.04345703125, -0.8704833984375, -0.697509765625, -0.5245361328125, -0.3515625, -0.1785888671875, -0.005615234375, 0.1673583984375, 0.34033203125, 0.5133056640625, 0.686279296875, 0.8592529296875, 1.0322265625, 1.2052001953125, 1.378173828125, 1.5511474609375, 1.72412109375, 1.8970947265625, 2.070068359375, 2.2430419921875, 2.416015625, 2.5889892578125, 2.761962890625, 2.9349365234375, 3.10791015625, 3.2808837890625, 3.453857421875, 3.6268310546875, 3.7998046875, 3.9727783203125, 4.145751953125, 4.3187255859375, 4.49169921875, 4.6646728515625, 4.837646484375, 5.0106201171875, 5.18359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 5.0, 5.0, 7.0, 7.0, 5.0, 10.0, 14.0, 12.0, 10.0, 23.0, 20.0, 20.0, 14.0, 23.0, 37.0, 32.0, 38.0, 46.0, 38.0, 42.0, 33.0, 42.0, 34.0, 33.0, 34.0, 50.0, 32.0, 42.0, 29.0, 25.0, 27.0, 33.0, 24.0, 23.0, 18.0, 23.0, 16.0, 15.0, 9.0, 7.0, 7.0, 2.0, 8.0, 6.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.169921875, -3.068115234375, -2.96630859375, -2.864501953125, -2.7626953125, -2.660888671875, -2.55908203125, -2.457275390625, -2.35546875, -2.253662109375, -2.15185546875, -2.050048828125, -1.9482421875, -1.846435546875, -1.74462890625, -1.642822265625, -1.541015625, -1.439208984375, -1.33740234375, -1.235595703125, -1.1337890625, -1.031982421875, -0.93017578125, -0.828369140625, -0.7265625, -0.624755859375, -0.52294921875, -0.421142578125, -0.3193359375, -0.217529296875, -0.11572265625, -0.013916015625, 0.087890625, 0.189697265625, 0.29150390625, 0.393310546875, 0.4951171875, 0.596923828125, 0.69873046875, 0.800537109375, 0.90234375, 1.004150390625, 1.10595703125, 1.207763671875, 1.3095703125, 1.411376953125, 1.51318359375, 1.614990234375, 1.716796875, 1.818603515625, 1.92041015625, 2.022216796875, 2.1240234375, 2.225830078125, 2.32763671875, 2.429443359375, 2.53125, 2.633056640625, 2.73486328125, 2.836669921875, 2.9384765625, 3.040283203125, 3.14208984375, 3.243896484375, 3.345703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 11.0, 13.0, 7.0, 17.0, 33.0, 36.0, 69.0, 83.0, 113.0, 170.0, 305.0, 399.0, 672.0, 1079.0, 1695.0, 3049.0, 5597.0, 10990.0, 24776.0, 65665.0, 206028.0, 418578.0, 197147.0, 63849.0, 24085.0, 10809.0, 5526.0, 2997.0, 1699.0, 1008.0, 659.0, 462.0, 282.0, 212.0, 138.0, 94.0, 59.0, 49.0, 21.0, 21.0, 18.0, 12.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.494140625, -2.4173583984375, -2.340576171875, -2.2637939453125, -2.18701171875, -2.1102294921875, -2.033447265625, -1.9566650390625, -1.8798828125, -1.8031005859375, -1.726318359375, -1.6495361328125, -1.57275390625, -1.4959716796875, -1.419189453125, -1.3424072265625, -1.265625, -1.1888427734375, -1.112060546875, -1.0352783203125, -0.95849609375, -0.8817138671875, -0.804931640625, -0.7281494140625, -0.6513671875, -0.5745849609375, -0.497802734375, -0.4210205078125, -0.34423828125, -0.2674560546875, -0.190673828125, -0.1138916015625, -0.037109375, 0.0396728515625, 0.116455078125, 0.1932373046875, 0.27001953125, 0.3468017578125, 0.423583984375, 0.5003662109375, 0.5771484375, 0.6539306640625, 0.730712890625, 0.8074951171875, 0.88427734375, 0.9610595703125, 1.037841796875, 1.1146240234375, 1.19140625, 1.2681884765625, 1.344970703125, 1.4217529296875, 1.49853515625, 1.5753173828125, 1.652099609375, 1.7288818359375, 1.8056640625, 1.8824462890625, 1.959228515625, 2.0360107421875, 2.11279296875, 2.1895751953125, 2.266357421875, 2.3431396484375, 2.419921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 4.0, 8.0, 9.0, 6.0, 13.0, 25.0, 21.0, 36.0, 54.0, 63.0, 104.0, 106.0, 101.0, 103.0, 70.0, 63.0, 49.0, 42.0, 29.0, 20.0, 9.0, 6.0, 11.0, 11.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.016824722290039e-05, -7.675494998693466e-05, -7.334165275096893e-05, -6.99283555150032e-05, -6.651505827903748e-05, -6.310176104307175e-05, -5.968846380710602e-05, -5.627516657114029e-05, -5.286186933517456e-05, -4.944857209920883e-05, -4.60352748632431e-05, -4.2621977627277374e-05, -3.9208680391311646e-05, -3.579538315534592e-05, -3.238208591938019e-05, -2.896878868341446e-05, -2.555549144744873e-05, -2.2142194211483002e-05, -1.8728896975517273e-05, -1.5315599739551544e-05, -1.1902302503585815e-05, -8.489005267620087e-06, -5.075708031654358e-06, -1.6624107956886292e-06, 1.7508864402770996e-06, 5.164183676242828e-06, 8.577480912208557e-06, 1.1990778148174286e-05, 1.5404075384140015e-05, 1.8817372620105743e-05, 2.2230669856071472e-05, 2.56439670920372e-05, 2.905726432800293e-05, 3.247056156396866e-05, 3.588385879993439e-05, 3.9297156035900116e-05, 4.2710453271865845e-05, 4.6123750507831573e-05, 4.95370477437973e-05, 5.295034497976303e-05, 5.636364221572876e-05, 5.977693945169449e-05, 6.319023668766022e-05, 6.660353392362595e-05, 7.001683115959167e-05, 7.34301283955574e-05, 7.684342563152313e-05, 8.025672286748886e-05, 8.367002010345459e-05, 8.708331733942032e-05, 9.049661457538605e-05, 9.390991181135178e-05, 9.73232090473175e-05, 0.00010073650628328323, 0.00010414980351924896, 0.00010756310075521469, 0.00011097639799118042, 0.00011438969522714615, 0.00011780299246311188, 0.0001212162896990776, 0.00012462958693504333, 0.00012804288417100906, 0.0001314561814069748, 0.00013486947864294052, 0.00013828277587890625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 9.0, 7.0, 11.0, 23.0, 24.0, 38.0, 56.0, 66.0, 108.0, 147.0, 229.0, 355.0, 558.0, 867.0, 1292.0, 2210.0, 3837.0, 7004.0, 13744.0, 29994.0, 74610.0, 204991.0, 363198.0, 207947.0, 75783.0, 30688.0, 13810.0, 7156.0, 3758.0, 2214.0, 1311.0, 816.0, 544.0, 358.0, 261.0, 180.0, 114.0, 67.0, 56.0, 25.0, 29.0, 10.0, 12.0, 10.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.55078125, -2.47894287109375, -2.4071044921875, -2.33526611328125, -2.263427734375, -2.19158935546875, -2.1197509765625, -2.04791259765625, -1.97607421875, -1.90423583984375, -1.8323974609375, -1.76055908203125, -1.688720703125, -1.61688232421875, -1.5450439453125, -1.47320556640625, -1.4013671875, -1.32952880859375, -1.2576904296875, -1.18585205078125, -1.114013671875, -1.04217529296875, -0.9703369140625, -0.89849853515625, -0.82666015625, -0.75482177734375, -0.6829833984375, -0.61114501953125, -0.539306640625, -0.46746826171875, -0.3956298828125, -0.32379150390625, -0.251953125, -0.18011474609375, -0.1082763671875, -0.03643798828125, 0.035400390625, 0.10723876953125, 0.1790771484375, 0.25091552734375, 0.32275390625, 0.39459228515625, 0.4664306640625, 0.53826904296875, 0.610107421875, 0.68194580078125, 0.7537841796875, 0.82562255859375, 0.8974609375, 0.96929931640625, 1.0411376953125, 1.11297607421875, 1.184814453125, 1.25665283203125, 1.3284912109375, 1.40032958984375, 1.47216796875, 1.54400634765625, 1.6158447265625, 1.68768310546875, 1.759521484375, 1.83135986328125, 1.9031982421875, 1.97503662109375, 2.046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 8.0, 7.0, 8.0, 15.0, 11.0, 13.0, 16.0, 28.0, 36.0, 43.0, 60.0, 68.0, 75.0, 79.0, 97.0, 80.0, 68.0, 44.0, 42.0, 41.0, 25.0, 19.0, 16.0, 9.0, 12.0, 5.0, 12.0, 6.0, 5.0, 7.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.57421875, -0.5567398071289062, -0.5392608642578125, -0.5217819213867188, -0.504302978515625, -0.48682403564453125, -0.4693450927734375, -0.45186614990234375, -0.43438720703125, -0.41690826416015625, -0.3994293212890625, -0.38195037841796875, -0.364471435546875, -0.34699249267578125, -0.3295135498046875, -0.31203460693359375, -0.2945556640625, -0.27707672119140625, -0.2595977783203125, -0.24211883544921875, -0.224639892578125, -0.20716094970703125, -0.1896820068359375, -0.17220306396484375, -0.15472412109375, -0.13724517822265625, -0.1197662353515625, -0.10228729248046875, -0.084808349609375, -0.06732940673828125, -0.0498504638671875, -0.03237152099609375, -0.014892578125, 0.00258636474609375, 0.0200653076171875, 0.03754425048828125, 0.055023193359375, 0.07250213623046875, 0.0899810791015625, 0.10746002197265625, 0.12493896484375, 0.14241790771484375, 0.1598968505859375, 0.17737579345703125, 0.194854736328125, 0.21233367919921875, 0.2298126220703125, 0.24729156494140625, 0.2647705078125, 0.28224945068359375, 0.2997283935546875, 0.31720733642578125, 0.334686279296875, 0.35216522216796875, 0.3696441650390625, 0.38712310791015625, 0.40460205078125, 0.42208099365234375, 0.4395599365234375, 0.45703887939453125, 0.474517822265625, 0.49199676513671875, 0.5094757080078125, 0.5269546508789062, 0.54443359375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 3.0, 7.0, 14.0, 12.0, 19.0, 40.0, 67.0, 73.0, 118.0, 156.0, 168.0, 109.0, 74.0, 44.0, 36.0, 22.0, 13.0, 14.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-26.084308624267578, -25.53853416442871, -24.992759704589844, -24.446983337402344, -23.901208877563477, -23.35543441772461, -22.809659957885742, -22.263885498046875, -21.718111038208008, -21.17233657836914, -20.626562118530273, -20.080787658691406, -19.535011291503906, -18.98923683166504, -18.443462371826172, -17.897687911987305, -17.351913452148438, -16.80613899230957, -16.260364532470703, -15.71458911895752, -15.168814659118652, -14.623039245605469, -14.077264785766602, -13.531490325927734, -12.985713958740234, -12.439939498901367, -11.894164085388184, -11.348389625549316, -10.80261516571045, -10.256839752197266, -9.711065292358398, -9.165290832519531, -8.619516372680664, -8.073741912841797, -7.5279669761657715, -6.982192039489746, -6.436417579650879, -5.8906426429748535, -5.344867706298828, -4.799093246459961, -4.2533183097839355, -3.7075436115264893, -3.161768913269043, -2.6159939765930176, -2.0702192783355713, -1.524444580078125, -0.9786696434020996, -0.4328949451446533, 0.11287975311279297, 0.658654510974884, 1.204429268836975, 1.750204086303711, 2.2959787845611572, 2.8417534828186035, 3.387528419494629, 3.933303117752075, 4.4790778160095215, 5.024852752685547, 5.570627212524414, 6.1164021492004395, 6.662177085876465, 7.207951545715332, 7.753726482391357, 8.299501419067383, 8.84527587890625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 5.0, 10.0, 9.0, 7.0, 14.0, 21.0, 16.0, 16.0, 24.0, 30.0, 36.0, 40.0, 35.0, 28.0, 43.0, 46.0, 40.0, 45.0, 49.0, 45.0, 35.0, 46.0, 41.0, 39.0, 43.0, 37.0, 29.0, 33.0, 14.0, 19.0, 14.0, 16.0, 15.0, 12.0, 8.0, 5.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.448026180267334, -5.263195514678955, -5.078364849090576, -4.893533706665039, -4.70870304107666, -4.523872375488281, -4.339041709899902, -4.154211044311523, -3.9693801403045654, -3.7845494747161865, -3.5997185707092285, -3.4148879051208496, -3.2300572395324707, -3.0452263355255127, -2.860395669937134, -2.675564765930176, -2.490734100341797, -2.305903434753418, -2.12107253074646, -1.936241865158081, -1.7514110803604126, -1.5665802955627441, -1.3817496299743652, -1.1969188451766968, -1.0120880603790283, -0.8272572755813599, -0.6424265503883362, -0.4575958251953125, -0.27276504039764404, -0.08793425559997559, 0.09689640998840332, 0.2817271947860718, 0.46655845642089844, 0.6513892412185669, 0.8362199664115906, 1.0210506916046143, 1.2058814764022827, 1.3907122611999512, 1.57554292678833, 1.7603737115859985, 1.945204496383667, 2.130035161972046, 2.314866065979004, 2.499696731567383, 2.6845273971557617, 2.8693583011627197, 3.0541889667510986, 3.2390198707580566, 3.4238505363464355, 3.6086812019348145, 3.7935121059417725, 3.9783427715301514, 4.163173675537109, 4.348004341125488, 4.532835006713867, 4.717665672302246, 4.902496337890625, 5.087327003479004, 5.272157669067383, 5.456988334655762, 5.641819477081299, 5.826650142669678, 6.011480808258057, 6.1963114738464355, 6.381142616271973]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 12.0, 11.0, 15.0, 28.0, 41.0, 35.0, 67.0, 98.0, 159.0, 249.0, 367.0, 612.0, 1066.0, 1777.0, 3430.0, 6396.0, 13542.0, 30277.0, 70867.0, 154646.0, 254420.0, 248014.0, 143420.0, 64999.0, 27962.0, 12239.0, 6061.0, 3242.0, 1745.0, 1056.0, 605.0, 376.0, 224.0, 153.0, 119.0, 77.0, 43.0, 37.0, 14.0, 18.0, 9.0, 8.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-8.640625, -8.3861083984375, -8.131591796875, -7.8770751953125, -7.62255859375, -7.3680419921875, -7.113525390625, -6.8590087890625, -6.6044921875, -6.3499755859375, -6.095458984375, -5.8409423828125, -5.58642578125, -5.3319091796875, -5.077392578125, -4.8228759765625, -4.568359375, -4.3138427734375, -4.059326171875, -3.8048095703125, -3.55029296875, -3.2957763671875, -3.041259765625, -2.7867431640625, -2.5322265625, -2.2777099609375, -2.023193359375, -1.7686767578125, -1.51416015625, -1.2596435546875, -1.005126953125, -0.7506103515625, -0.49609375, -0.2415771484375, 0.012939453125, 0.2674560546875, 0.52197265625, 0.7764892578125, 1.031005859375, 1.2855224609375, 1.5400390625, 1.7945556640625, 2.049072265625, 2.3035888671875, 2.55810546875, 2.8126220703125, 3.067138671875, 3.3216552734375, 3.576171875, 3.8306884765625, 4.085205078125, 4.3397216796875, 4.59423828125, 4.8487548828125, 5.103271484375, 5.3577880859375, 5.6123046875, 5.8668212890625, 6.121337890625, 6.3758544921875, 6.63037109375, 6.8848876953125, 7.139404296875, 7.3939208984375, 7.6484375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 10.0, 8.0, 5.0, 8.0, 7.0, 16.0, 13.0, 14.0, 23.0, 22.0, 24.0, 34.0, 37.0, 35.0, 45.0, 34.0, 37.0, 34.0, 42.0, 39.0, 48.0, 43.0, 46.0, 35.0, 53.0, 40.0, 43.0, 27.0, 33.0, 19.0, 21.0, 21.0, 12.0, 15.0, 9.0, 12.0, 5.0, 3.0, 8.0, 4.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.78125, -5.58740234375, -5.3935546875, -5.19970703125, -5.005859375, -4.81201171875, -4.6181640625, -4.42431640625, -4.23046875, -4.03662109375, -3.8427734375, -3.64892578125, -3.455078125, -3.26123046875, -3.0673828125, -2.87353515625, -2.6796875, -2.48583984375, -2.2919921875, -2.09814453125, -1.904296875, -1.71044921875, -1.5166015625, -1.32275390625, -1.12890625, -0.93505859375, -0.7412109375, -0.54736328125, -0.353515625, -0.15966796875, 0.0341796875, 0.22802734375, 0.421875, 0.61572265625, 0.8095703125, 1.00341796875, 1.197265625, 1.39111328125, 1.5849609375, 1.77880859375, 1.97265625, 2.16650390625, 2.3603515625, 2.55419921875, 2.748046875, 2.94189453125, 3.1357421875, 3.32958984375, 3.5234375, 3.71728515625, 3.9111328125, 4.10498046875, 4.298828125, 4.49267578125, 4.6865234375, 4.88037109375, 5.07421875, 5.26806640625, 5.4619140625, 5.65576171875, 5.849609375, 6.04345703125, 6.2373046875, 6.43115234375, 6.625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 15.0, 14.0, 19.0, 25.0, 38.0, 48.0, 92.0, 140.0, 180.0, 267.0, 442.0, 748.0, 1207.0, 2059.0, 3652.0, 6653.0, 12578.0, 24152.0, 47157.0, 88375.0, 152226.0, 207081.0, 199171.0, 137222.0, 78292.0, 40679.0, 21114.0, 10928.0, 5982.0, 3244.0, 1867.0, 1032.0, 699.0, 377.0, 232.0, 171.0, 120.0, 76.0, 62.0, 30.0, 26.0, 16.0, 7.0, 10.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.53515625, -6.33648681640625, -6.1378173828125, -5.93914794921875, -5.740478515625, -5.54180908203125, -5.3431396484375, -5.14447021484375, -4.94580078125, -4.74713134765625, -4.5484619140625, -4.34979248046875, -4.151123046875, -3.95245361328125, -3.7537841796875, -3.55511474609375, -3.3564453125, -3.15777587890625, -2.9591064453125, -2.76043701171875, -2.561767578125, -2.36309814453125, -2.1644287109375, -1.96575927734375, -1.76708984375, -1.56842041015625, -1.3697509765625, -1.17108154296875, -0.972412109375, -0.77374267578125, -0.5750732421875, -0.37640380859375, -0.177734375, 0.02093505859375, 0.2196044921875, 0.41827392578125, 0.616943359375, 0.81561279296875, 1.0142822265625, 1.21295166015625, 1.41162109375, 1.61029052734375, 1.8089599609375, 2.00762939453125, 2.206298828125, 2.40496826171875, 2.6036376953125, 2.80230712890625, 3.0009765625, 3.19964599609375, 3.3983154296875, 3.59698486328125, 3.795654296875, 3.99432373046875, 4.1929931640625, 4.39166259765625, 4.59033203125, 4.78900146484375, 4.9876708984375, 5.18634033203125, 5.385009765625, 5.58367919921875, 5.7823486328125, 5.98101806640625, 6.1796875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 12.0, 14.0, 19.0, 22.0, 19.0, 20.0, 36.0, 27.0, 22.0, 31.0, 35.0, 35.0, 29.0, 44.0, 49.0, 44.0, 40.0, 39.0, 29.0, 40.0, 42.0, 36.0, 33.0, 27.0, 37.0, 21.0, 25.0, 29.0, 17.0, 13.0, 19.0, 14.0, 12.0, 15.0, 7.0, 7.0, 12.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.84503173828125, -2.7408447265625, -2.63665771484375, -2.532470703125, -2.42828369140625, -2.3240966796875, -2.21990966796875, -2.11572265625, -2.01153564453125, -1.9073486328125, -1.80316162109375, -1.698974609375, -1.59478759765625, -1.4906005859375, -1.38641357421875, -1.2822265625, -1.17803955078125, -1.0738525390625, -0.96966552734375, -0.865478515625, -0.76129150390625, -0.6571044921875, -0.55291748046875, -0.44873046875, -0.34454345703125, -0.2403564453125, -0.13616943359375, -0.031982421875, 0.07220458984375, 0.1763916015625, 0.28057861328125, 0.384765625, 0.48895263671875, 0.5931396484375, 0.69732666015625, 0.801513671875, 0.90570068359375, 1.0098876953125, 1.11407470703125, 1.21826171875, 1.32244873046875, 1.4266357421875, 1.53082275390625, 1.635009765625, 1.73919677734375, 1.8433837890625, 1.94757080078125, 2.0517578125, 2.15594482421875, 2.2601318359375, 2.36431884765625, 2.468505859375, 2.57269287109375, 2.6768798828125, 2.78106689453125, 2.88525390625, 2.98944091796875, 3.0936279296875, 3.19781494140625, 3.302001953125, 3.40618896484375, 3.5103759765625, 3.61456298828125, 3.71875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 18.0, 21.0, 23.0, 24.0, 45.0, 59.0, 83.0, 120.0, 167.0, 268.0, 419.0, 713.0, 1127.0, 1960.0, 3407.0, 6098.0, 11195.0, 21851.0, 44670.0, 95016.0, 185230.0, 258946.0, 203304.0, 108820.0, 51697.0, 24551.0, 12575.0, 6785.0, 3837.0, 2153.0, 1229.0, 733.0, 474.0, 322.0, 190.0, 111.0, 74.0, 57.0, 47.0, 24.0, 25.0, 17.0, 17.0, 5.0, 11.0, 2.0, 3.0, 7.0, 1.0, 5.0, 5.0, 2.0], "bins": [-4.0, -3.88092041015625, -3.7618408203125, -3.64276123046875, -3.523681640625, -3.40460205078125, -3.2855224609375, -3.16644287109375, -3.04736328125, -2.92828369140625, -2.8092041015625, -2.69012451171875, -2.571044921875, -2.45196533203125, -2.3328857421875, -2.21380615234375, -2.0947265625, -1.97564697265625, -1.8565673828125, -1.73748779296875, -1.618408203125, -1.49932861328125, -1.3802490234375, -1.26116943359375, -1.14208984375, -1.02301025390625, -0.9039306640625, -0.78485107421875, -0.665771484375, -0.54669189453125, -0.4276123046875, -0.30853271484375, -0.189453125, -0.07037353515625, 0.0487060546875, 0.16778564453125, 0.286865234375, 0.40594482421875, 0.5250244140625, 0.64410400390625, 0.76318359375, 0.88226318359375, 1.0013427734375, 1.12042236328125, 1.239501953125, 1.35858154296875, 1.4776611328125, 1.59674072265625, 1.7158203125, 1.83489990234375, 1.9539794921875, 2.07305908203125, 2.192138671875, 2.31121826171875, 2.4302978515625, 2.54937744140625, 2.66845703125, 2.78753662109375, 2.9066162109375, 3.02569580078125, 3.144775390625, 3.26385498046875, 3.3829345703125, 3.50201416015625, 3.62109375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 16.0, 27.0, 31.0, 23.0, 42.0, 48.0, 52.0, 81.0, 69.0, 63.0, 74.0, 75.0, 69.0, 56.0, 63.0, 46.0, 35.0, 23.0, 19.0, 15.0, 14.0, 12.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00032806396484375, -0.00031822919845581055, -0.0003083944320678711, -0.00029855966567993164, -0.0002887248992919922, -0.00027889013290405273, -0.0002690553665161133, -0.00025922060012817383, -0.0002493858337402344, -0.00023955106735229492, -0.00022971630096435547, -0.00021988153457641602, -0.00021004676818847656, -0.0002002120018005371, -0.00019037723541259766, -0.0001805424690246582, -0.00017070770263671875, -0.0001608729362487793, -0.00015103816986083984, -0.0001412034034729004, -0.00013136863708496094, -0.00012153387069702148, -0.00011169910430908203, -0.00010186433792114258, -9.202957153320312e-05, -8.219480514526367e-05, -7.236003875732422e-05, -6.252527236938477e-05, -5.269050598144531e-05, -4.285573959350586e-05, -3.3020973205566406e-05, -2.3186206817626953e-05, -1.33514404296875e-05, -3.516674041748047e-06, 6.318092346191406e-06, 1.615285873413086e-05, 2.5987625122070312e-05, 3.5822391510009766e-05, 4.565715789794922e-05, 5.549192428588867e-05, 6.532669067382812e-05, 7.516145706176758e-05, 8.499622344970703e-05, 9.483098983764648e-05, 0.00010466575622558594, 0.00011450052261352539, 0.00012433528900146484, 0.0001341700553894043, 0.00014400482177734375, 0.0001538395881652832, 0.00016367435455322266, 0.0001735091209411621, 0.00018334388732910156, 0.00019317865371704102, 0.00020301342010498047, 0.00021284818649291992, 0.00022268295288085938, 0.00023251771926879883, 0.00024235248565673828, 0.00025218725204467773, 0.0002620220184326172, 0.00027185678482055664, 0.0002816915512084961, 0.00029152631759643555, 0.000301361083984375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 9.0, 11.0, 12.0, 27.0, 31.0, 50.0, 62.0, 94.0, 194.0, 294.0, 474.0, 796.0, 1322.0, 2304.0, 4126.0, 7518.0, 14704.0, 29987.0, 63092.0, 131120.0, 229817.0, 250037.0, 158447.0, 78204.0, 37086.0, 18101.0, 9400.0, 4727.0, 2605.0, 1534.0, 935.0, 574.0, 299.0, 205.0, 113.0, 92.0, 55.0, 34.0, 22.0, 17.0, 10.0, 8.0, 8.0, 5.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69921875, -3.584136962890625, -3.46905517578125, -3.353973388671875, -3.2388916015625, -3.123809814453125, -3.00872802734375, -2.893646240234375, -2.778564453125, -2.663482666015625, -2.54840087890625, -2.433319091796875, -2.3182373046875, -2.203155517578125, -2.08807373046875, -1.972991943359375, -1.85791015625, -1.742828369140625, -1.62774658203125, -1.512664794921875, -1.3975830078125, -1.282501220703125, -1.16741943359375, -1.052337646484375, -0.937255859375, -0.822174072265625, -0.70709228515625, -0.592010498046875, -0.4769287109375, -0.361846923828125, -0.24676513671875, -0.131683349609375, -0.0166015625, 0.098480224609375, 0.21356201171875, 0.328643798828125, 0.4437255859375, 0.558807373046875, 0.67388916015625, 0.788970947265625, 0.904052734375, 1.019134521484375, 1.13421630859375, 1.249298095703125, 1.3643798828125, 1.479461669921875, 1.59454345703125, 1.709625244140625, 1.82470703125, 1.939788818359375, 2.05487060546875, 2.169952392578125, 2.2850341796875, 2.400115966796875, 2.51519775390625, 2.630279541015625, 2.745361328125, 2.860443115234375, 2.97552490234375, 3.090606689453125, 3.2056884765625, 3.320770263671875, 3.43585205078125, 3.550933837890625, 3.666015625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 8.0, 6.0, 4.0, 8.0, 9.0, 8.0, 12.0, 13.0, 9.0, 12.0, 26.0, 25.0, 26.0, 38.0, 37.0, 42.0, 40.0, 53.0, 51.0, 56.0, 44.0, 59.0, 49.0, 49.0, 40.0, 45.0, 42.0, 36.0, 29.0, 23.0, 24.0, 15.0, 11.0, 10.0, 14.0, 9.0, 6.0, 3.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6657943725585938, -0.6396942138671875, -0.6135940551757812, -0.587493896484375, -0.5613937377929688, -0.5352935791015625, -0.5091934204101562, -0.48309326171875, -0.45699310302734375, -0.4308929443359375, -0.40479278564453125, -0.378692626953125, -0.35259246826171875, -0.3264923095703125, -0.30039215087890625, -0.2742919921875, -0.24819183349609375, -0.2220916748046875, -0.19599151611328125, -0.169891357421875, -0.14379119873046875, -0.1176910400390625, -0.09159088134765625, -0.06549072265625, -0.03939056396484375, -0.0132904052734375, 0.01280975341796875, 0.038909912109375, 0.06501007080078125, 0.0911102294921875, 0.11721038818359375, 0.143310546875, 0.16941070556640625, 0.1955108642578125, 0.22161102294921875, 0.247711181640625, 0.27381134033203125, 0.2999114990234375, 0.32601165771484375, 0.35211181640625, 0.37821197509765625, 0.4043121337890625, 0.43041229248046875, 0.456512451171875, 0.48261260986328125, 0.5087127685546875, 0.5348129272460938, 0.5609130859375, 0.5870132446289062, 0.6131134033203125, 0.6392135620117188, 0.665313720703125, 0.6914138793945312, 0.7175140380859375, 0.7436141967773438, 0.76971435546875, 0.7958145141601562, 0.8219146728515625, 0.8480148315429688, 0.874114990234375, 0.9002151489257812, 0.9263153076171875, 0.9524154663085938, 0.978515625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 12.0, 15.0, 20.0, 48.0, 69.0, 112.0, 142.0, 165.0, 137.0, 95.0, 54.0, 53.0, 23.0, 18.0, 11.0, 11.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.881580352783203, -26.314258575439453, -25.746936798095703, -25.179616928100586, -24.612295150756836, -24.044973373413086, -23.477651596069336, -22.910329818725586, -22.34300994873047, -21.77568817138672, -21.20836639404297, -20.64104652404785, -20.0737247467041, -19.50640296936035, -18.9390811920166, -18.37175941467285, -17.8044376373291, -17.23711585998535, -16.6697940826416, -16.102474212646484, -15.535152435302734, -14.967830657958984, -14.400508880615234, -13.833187103271484, -13.26586627960205, -12.6985445022583, -12.131223678588867, -11.563901901245117, -10.996580123901367, -10.429259300231934, -9.861937522888184, -9.29461669921875, -8.727293014526367, -8.159971237182617, -7.592650413513184, -7.025328636169434, -6.458007335662842, -5.89068603515625, -5.3233642578125, -4.756042957305908, -4.188721656799316, -3.6214003562927246, -3.0540788173675537, -2.486757278442383, -1.919435977935791, -1.3521146774291992, -0.7847931385040283, -0.21747159957885742, 0.3498497009277344, 0.9171711206436157, 1.484492540359497, 2.051814079284668, 2.6191353797912598, 3.1864566802978516, 3.7537782192230225, 4.321099758148193, 4.888421058654785, 5.455742359161377, 6.023063659667969, 6.590385437011719, 7.1577067375183105, 7.725028038024902, 8.292349815368652, 8.859670639038086, 9.426992416381836]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 1.0, 3.0, 8.0, 11.0, 11.0, 9.0, 11.0, 13.0, 19.0, 28.0, 29.0, 33.0, 37.0, 40.0, 35.0, 42.0, 45.0, 48.0, 50.0, 45.0, 38.0, 41.0, 51.0, 36.0, 36.0, 53.0, 32.0, 26.0, 25.0, 21.0, 22.0, 18.0, 17.0, 13.0, 14.0, 9.0, 4.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.047612190246582, -5.851572513580322, -5.6555328369140625, -5.459493160247803, -5.263453483581543, -5.067413806915283, -4.871374130249023, -4.675334930419922, -4.479294776916504, -4.283255100250244, -4.087215423583984, -3.8911757469177246, -3.695136070251465, -3.499096393585205, -3.3030569553375244, -3.1070172786712646, -2.910977840423584, -2.714938163757324, -2.5188984870910645, -2.3228588104248047, -2.126819133758545, -1.9307795763015747, -1.7347400188446045, -1.5387003421783447, -1.342660665512085, -1.1466209888458252, -0.9505813717842102, -0.7545417547225952, -0.5585020780563354, -0.3624624013900757, -0.16642284393310547, 0.029616832733154297, 0.22565650939941406, 0.42169615626335144, 0.6177358031272888, 0.8137754201889038, 1.0098150968551636, 1.2058547735214233, 1.4018943309783936, 1.5979340076446533, 1.793973684310913, 1.9900133609771729, 2.1860530376434326, 2.3820924758911133, 2.578132152557373, 2.774171829223633, 2.9702115058898926, 3.1662511825561523, 3.362290859222412, 3.558330535888672, 3.7543702125549316, 3.9504098892211914, 4.146449565887451, 4.342489242553711, 4.5385284423828125, 4.7345685958862305, 4.930607795715332, 5.126647472381592, 5.322687149047852, 5.518726825714111, 5.714766502380371, 5.910806179046631, 6.106845855712891, 6.302885055541992, 6.49892520904541]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 8.0, 4.0, 9.0, 13.0, 18.0, 36.0, 42.0, 74.0, 97.0, 144.0, 227.0, 358.0, 499.0, 802.0, 1181.0, 1863.0, 3022.0, 4978.0, 8409.0, 15414.0, 30658.0, 72428.0, 208449.0, 672589.0, 1518427.0, 1098244.0, 354119.0, 110107.0, 42115.0, 20063.0, 10761.0, 6481.0, 4144.0, 2695.0, 1708.0, 1167.0, 845.0, 564.0, 412.0, 313.0, 230.0, 152.0, 108.0, 68.0, 79.0, 42.0, 29.0, 24.0, 20.0, 14.0, 10.0, 13.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-10.1328125, -9.7919921875, -9.451171875, -9.1103515625, -8.76953125, -8.4287109375, -8.087890625, -7.7470703125, -7.40625, -7.0654296875, -6.724609375, -6.3837890625, -6.04296875, -5.7021484375, -5.361328125, -5.0205078125, -4.6796875, -4.3388671875, -3.998046875, -3.6572265625, -3.31640625, -2.9755859375, -2.634765625, -2.2939453125, -1.953125, -1.6123046875, -1.271484375, -0.9306640625, -0.58984375, -0.2490234375, 0.091796875, 0.4326171875, 0.7734375, 1.1142578125, 1.455078125, 1.7958984375, 2.13671875, 2.4775390625, 2.818359375, 3.1591796875, 3.5, 3.8408203125, 4.181640625, 4.5224609375, 4.86328125, 5.2041015625, 5.544921875, 5.8857421875, 6.2265625, 6.5673828125, 6.908203125, 7.2490234375, 7.58984375, 7.9306640625, 8.271484375, 8.6123046875, 8.953125, 9.2939453125, 9.634765625, 9.9755859375, 10.31640625, 10.6572265625, 10.998046875, 11.3388671875, 11.6796875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 6.0, 9.0, 8.0, 12.0, 18.0, 21.0, 21.0, 25.0, 32.0, 38.0, 40.0, 45.0, 36.0, 46.0, 40.0, 45.0, 50.0, 44.0, 38.0, 52.0, 47.0, 40.0, 39.0, 35.0, 29.0, 25.0, 24.0, 27.0, 15.0, 15.0, 13.0, 10.0, 13.0, 6.0, 8.0, 9.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.09765625, -3.95611572265625, -3.8145751953125, -3.67303466796875, -3.531494140625, -3.38995361328125, -3.2484130859375, -3.10687255859375, -2.96533203125, -2.82379150390625, -2.6822509765625, -2.54071044921875, -2.399169921875, -2.25762939453125, -2.1160888671875, -1.97454833984375, -1.8330078125, -1.69146728515625, -1.5499267578125, -1.40838623046875, -1.266845703125, -1.12530517578125, -0.9837646484375, -0.84222412109375, -0.70068359375, -0.55914306640625, -0.4176025390625, -0.27606201171875, -0.134521484375, 0.00701904296875, 0.1485595703125, 0.29010009765625, 0.431640625, 0.57318115234375, 0.7147216796875, 0.85626220703125, 0.997802734375, 1.13934326171875, 1.2808837890625, 1.42242431640625, 1.56396484375, 1.70550537109375, 1.8470458984375, 1.98858642578125, 2.130126953125, 2.27166748046875, 2.4132080078125, 2.55474853515625, 2.6962890625, 2.83782958984375, 2.9793701171875, 3.12091064453125, 3.262451171875, 3.40399169921875, 3.5455322265625, 3.68707275390625, 3.82861328125, 3.97015380859375, 4.1116943359375, 4.25323486328125, 4.394775390625, 4.53631591796875, 4.6778564453125, 4.81939697265625, 4.9609375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 15.0, 32.0, 35.0, 40.0, 76.0, 127.0, 171.0, 293.0, 462.0, 719.0, 1174.0, 1925.0, 3166.0, 5461.0, 9947.0, 18527.0, 38631.0, 92651.0, 276086.0, 906867.0, 1616696.0, 814525.0, 246723.0, 84189.0, 35899.0, 17325.0, 9430.0, 5185.0, 3104.0, 1850.0, 1086.0, 664.0, 433.0, 255.0, 161.0, 98.0, 61.0, 54.0, 41.0, 29.0, 19.0, 11.0, 7.0, 7.0, 1.0, 4.0, 1.0], "bins": [-14.25, -13.8695068359375, -13.489013671875, -13.1085205078125, -12.72802734375, -12.3475341796875, -11.967041015625, -11.5865478515625, -11.2060546875, -10.8255615234375, -10.445068359375, -10.0645751953125, -9.68408203125, -9.3035888671875, -8.923095703125, -8.5426025390625, -8.162109375, -7.7816162109375, -7.401123046875, -7.0206298828125, -6.64013671875, -6.2596435546875, -5.879150390625, -5.4986572265625, -5.1181640625, -4.7376708984375, -4.357177734375, -3.9766845703125, -3.59619140625, -3.2156982421875, -2.835205078125, -2.4547119140625, -2.07421875, -1.6937255859375, -1.313232421875, -0.9327392578125, -0.55224609375, -0.1717529296875, 0.208740234375, 0.5892333984375, 0.9697265625, 1.3502197265625, 1.730712890625, 2.1112060546875, 2.49169921875, 2.8721923828125, 3.252685546875, 3.6331787109375, 4.013671875, 4.3941650390625, 4.774658203125, 5.1551513671875, 5.53564453125, 5.9161376953125, 6.296630859375, 6.6771240234375, 7.0576171875, 7.4381103515625, 7.818603515625, 8.1990966796875, 8.57958984375, 8.9600830078125, 9.340576171875, 9.7210693359375, 10.1015625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 4.0, 5.0, 11.0, 11.0, 13.0, 22.0, 14.0, 17.0, 21.0, 33.0, 42.0, 55.0, 67.0, 93.0, 103.0, 154.0, 196.0, 219.0, 256.0, 328.0, 305.0, 336.0, 314.0, 290.0, 236.0, 202.0, 162.0, 129.0, 93.0, 92.0, 54.0, 54.0, 27.0, 27.0, 17.0, 12.0, 15.0, 14.0, 5.0, 6.0, 4.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -3.0235595703125, -2.937744140625, -2.8519287109375, -2.76611328125, -2.6802978515625, -2.594482421875, -2.5086669921875, -2.4228515625, -2.3370361328125, -2.251220703125, -2.1654052734375, -2.07958984375, -1.9937744140625, -1.907958984375, -1.8221435546875, -1.736328125, -1.6505126953125, -1.564697265625, -1.4788818359375, -1.39306640625, -1.3072509765625, -1.221435546875, -1.1356201171875, -1.0498046875, -0.9639892578125, -0.878173828125, -0.7923583984375, -0.70654296875, -0.6207275390625, -0.534912109375, -0.4490966796875, -0.36328125, -0.2774658203125, -0.191650390625, -0.1058349609375, -0.02001953125, 0.0657958984375, 0.151611328125, 0.2374267578125, 0.3232421875, 0.4090576171875, 0.494873046875, 0.5806884765625, 0.66650390625, 0.7523193359375, 0.838134765625, 0.9239501953125, 1.009765625, 1.0955810546875, 1.181396484375, 1.2672119140625, 1.35302734375, 1.4388427734375, 1.524658203125, 1.6104736328125, 1.6962890625, 1.7821044921875, 1.867919921875, 1.9537353515625, 2.03955078125, 2.1253662109375, 2.211181640625, 2.2969970703125, 2.3828125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 13.0, 3.0, 12.0, 16.0, 39.0, 51.0, 98.0, 133.0, 150.0, 141.0, 141.0, 71.0, 45.0, 31.0, 23.0, 4.0, 8.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.53737449645996, -23.95140266418457, -23.365428924560547, -22.779457092285156, -22.193485260009766, -21.607511520385742, -21.02153968811035, -20.435565948486328, -19.849594116210938, -19.263622283935547, -18.677648544311523, -18.091676712036133, -17.50570297241211, -16.91973114013672, -16.333759307861328, -15.747786521911621, -15.161813735961914, -14.575840950012207, -13.9898681640625, -13.40389633178711, -12.817923545837402, -12.231950759887695, -11.645978927612305, -11.060006141662598, -10.47403335571289, -9.888060569763184, -9.302087783813477, -8.716115951538086, -8.130143165588379, -7.544170379638672, -6.958198070526123, -6.372225761413574, -5.786252021789551, -5.200279235839844, -4.614306926727295, -4.028334617614746, -3.442361831665039, -2.856389284133911, -2.270416736602783, -1.6844444274902344, -1.0984716415405273, -0.5124990940093994, 0.07347345352172852, 0.6594460010528564, 1.2454185485839844, 1.8313910961151123, 2.4173636436462402, 3.003335952758789, 3.589308738708496, 4.175281524658203, 4.761253833770752, 5.347226142883301, 5.933198928833008, 6.519171714782715, 7.105144023895264, 7.6911163330078125, 8.27708911895752, 8.863061904907227, 9.449033737182617, 10.035006523132324, 10.620979309082031, 11.206952095031738, 11.792924880981445, 12.378896713256836, 12.964869499206543]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 9.0, 8.0, 9.0, 5.0, 12.0, 16.0, 20.0, 29.0, 35.0, 23.0, 21.0, 39.0, 42.0, 44.0, 43.0, 48.0, 52.0, 47.0, 36.0, 51.0, 45.0, 47.0, 38.0, 31.0, 32.0, 24.0, 36.0, 25.0, 21.0, 20.0, 12.0, 19.0, 13.0, 4.0, 2.0, 10.0, 7.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.803647994995117, -5.616357803344727, -5.429068088531494, -5.2417778968811035, -5.054487705230713, -4.867197513580322, -4.67990779876709, -4.492617607116699, -4.305327415466309, -4.118037223815918, -3.9307472705841064, -3.743457317352295, -3.5561671257019043, -3.3688771724700928, -3.1815872192382812, -2.9942970275878906, -2.807007074356079, -2.6197171211242676, -2.432426929473877, -2.2451369762420654, -2.057846784591675, -1.8705568313598633, -1.6832667589187622, -1.4959766864776611, -1.30868661403656, -1.121396541595459, -0.9341064691543579, -0.7468164563179016, -0.5595263838768005, -0.37223631143569946, -0.18494629859924316, 0.00234377384185791, 0.18963384628295898, 0.37692391872406006, 0.5642139911651611, 0.7515040040016174, 0.9387940764427185, 1.1260840892791748, 1.3133741617202759, 1.500664234161377, 1.687954306602478, 1.875244379043579, 2.0625343322753906, 2.2498245239257812, 2.4371144771575928, 2.6244046688079834, 2.811694622039795, 2.9989848136901855, 3.186274766921997, 3.3735647201538086, 3.560854911804199, 3.7481448650360107, 3.9354350566864014, 4.122725009918213, 4.3100152015686035, 4.497304916381836, 4.684595108032227, 4.871885299682617, 5.05917501449585, 5.24646520614624, 5.433755397796631, 5.6210455894470215, 5.808335304260254, 5.9956254959106445, 6.182915687561035]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 11.0, 18.0, 17.0, 33.0, 59.0, 77.0, 133.0, 181.0, 242.0, 375.0, 560.0, 926.0, 1414.0, 2326.0, 3680.0, 6196.0, 10307.0, 18784.0, 34191.0, 63978.0, 118464.0, 191582.0, 220152.0, 164259.0, 95255.0, 50967.0, 27224.0, 14852.0, 8628.0, 5240.0, 3028.0, 1915.0, 1224.0, 808.0, 474.0, 320.0, 196.0, 151.0, 88.0, 66.0, 48.0, 29.0, 23.0, 16.0, 11.0, 3.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.428863525390625, -2.34600830078125, -2.263153076171875, -2.1802978515625, -2.097442626953125, -2.01458740234375, -1.931732177734375, -1.848876953125, -1.766021728515625, -1.68316650390625, -1.600311279296875, -1.5174560546875, -1.434600830078125, -1.35174560546875, -1.268890380859375, -1.18603515625, -1.103179931640625, -1.02032470703125, -0.937469482421875, -0.8546142578125, -0.771759033203125, -0.68890380859375, -0.606048583984375, -0.523193359375, -0.440338134765625, -0.35748291015625, -0.274627685546875, -0.1917724609375, -0.108917236328125, -0.02606201171875, 0.056793212890625, 0.1396484375, 0.222503662109375, 0.30535888671875, 0.388214111328125, 0.4710693359375, 0.553924560546875, 0.63677978515625, 0.719635009765625, 0.802490234375, 0.885345458984375, 0.96820068359375, 1.051055908203125, 1.1339111328125, 1.216766357421875, 1.29962158203125, 1.382476806640625, 1.46533203125, 1.548187255859375, 1.63104248046875, 1.713897705078125, 1.7967529296875, 1.879608154296875, 1.96246337890625, 2.045318603515625, 2.128173828125, 2.211029052734375, 2.29388427734375, 2.376739501953125, 2.4595947265625, 2.542449951171875, 2.62530517578125, 2.708160400390625, 2.791015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 7.0, 3.0, 6.0, 10.0, 13.0, 19.0, 19.0, 24.0, 22.0, 27.0, 30.0, 25.0, 42.0, 36.0, 49.0, 36.0, 53.0, 46.0, 48.0, 40.0, 55.0, 52.0, 32.0, 36.0, 39.0, 30.0, 26.0, 21.0, 19.0, 22.0, 18.0, 18.0, 14.0, 13.0, 8.0, 7.0, 4.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2109375, -6.0069580078125, -5.802978515625, -5.5989990234375, -5.39501953125, -5.1910400390625, -4.987060546875, -4.7830810546875, -4.5791015625, -4.3751220703125, -4.171142578125, -3.9671630859375, -3.76318359375, -3.5592041015625, -3.355224609375, -3.1512451171875, -2.947265625, -2.7432861328125, -2.539306640625, -2.3353271484375, -2.13134765625, -1.9273681640625, -1.723388671875, -1.5194091796875, -1.3154296875, -1.1114501953125, -0.907470703125, -0.7034912109375, -0.49951171875, -0.2955322265625, -0.091552734375, 0.1124267578125, 0.31640625, 0.5203857421875, 0.724365234375, 0.9283447265625, 1.13232421875, 1.3363037109375, 1.540283203125, 1.7442626953125, 1.9482421875, 2.1522216796875, 2.356201171875, 2.5601806640625, 2.76416015625, 2.9681396484375, 3.172119140625, 3.3760986328125, 3.580078125, 3.7840576171875, 3.988037109375, 4.1920166015625, 4.39599609375, 4.5999755859375, 4.803955078125, 5.0079345703125, 5.2119140625, 5.4158935546875, 5.619873046875, 5.8238525390625, 6.02783203125, 6.2318115234375, 6.435791015625, 6.6397705078125, 6.84375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 16.0, 16.0, 21.0, 37.0, 61.0, 73.0, 122.0, 153.0, 205.0, 339.0, 546.0, 759.0, 1118.0, 1788.0, 2709.0, 4175.0, 6882.0, 11190.0, 19480.0, 34496.0, 63712.0, 115253.0, 187886.0, 220225.0, 161505.0, 94139.0, 51392.0, 28438.0, 16294.0, 9262.0, 5745.0, 3616.0, 2284.0, 1470.0, 1023.0, 683.0, 426.0, 310.0, 217.0, 171.0, 89.0, 59.0, 71.0, 42.0, 24.0, 8.0, 7.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.73046875, -2.643310546875, -2.55615234375, -2.468994140625, -2.3818359375, -2.294677734375, -2.20751953125, -2.120361328125, -2.033203125, -1.946044921875, -1.85888671875, -1.771728515625, -1.6845703125, -1.597412109375, -1.51025390625, -1.423095703125, -1.3359375, -1.248779296875, -1.16162109375, -1.074462890625, -0.9873046875, -0.900146484375, -0.81298828125, -0.725830078125, -0.638671875, -0.551513671875, -0.46435546875, -0.377197265625, -0.2900390625, -0.202880859375, -0.11572265625, -0.028564453125, 0.05859375, 0.145751953125, 0.23291015625, 0.320068359375, 0.4072265625, 0.494384765625, 0.58154296875, 0.668701171875, 0.755859375, 0.843017578125, 0.93017578125, 1.017333984375, 1.1044921875, 1.191650390625, 1.27880859375, 1.365966796875, 1.453125, 1.540283203125, 1.62744140625, 1.714599609375, 1.8017578125, 1.888916015625, 1.97607421875, 2.063232421875, 2.150390625, 2.237548828125, 2.32470703125, 2.411865234375, 2.4990234375, 2.586181640625, 2.67333984375, 2.760498046875, 2.84765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 6.0, 6.0, 3.0, 7.0, 8.0, 10.0, 16.0, 13.0, 12.0, 28.0, 21.0, 28.0, 29.0, 33.0, 41.0, 31.0, 40.0, 26.0, 37.0, 45.0, 33.0, 46.0, 34.0, 39.0, 46.0, 40.0, 30.0, 30.0, 25.0, 27.0, 31.0, 27.0, 17.0, 19.0, 16.0, 22.0, 10.0, 18.0, 10.0, 9.0, 11.0, 13.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.31988525390625, -3.2159423828125, -3.11199951171875, -3.008056640625, -2.90411376953125, -2.8001708984375, -2.69622802734375, -2.59228515625, -2.48834228515625, -2.3843994140625, -2.28045654296875, -2.176513671875, -2.07257080078125, -1.9686279296875, -1.86468505859375, -1.7607421875, -1.65679931640625, -1.5528564453125, -1.44891357421875, -1.344970703125, -1.24102783203125, -1.1370849609375, -1.03314208984375, -0.92919921875, -0.82525634765625, -0.7213134765625, -0.61737060546875, -0.513427734375, -0.40948486328125, -0.3055419921875, -0.20159912109375, -0.09765625, 0.00628662109375, 0.1102294921875, 0.21417236328125, 0.318115234375, 0.42205810546875, 0.5260009765625, 0.62994384765625, 0.73388671875, 0.83782958984375, 0.9417724609375, 1.04571533203125, 1.149658203125, 1.25360107421875, 1.3575439453125, 1.46148681640625, 1.5654296875, 1.66937255859375, 1.7733154296875, 1.87725830078125, 1.981201171875, 2.08514404296875, 2.1890869140625, 2.29302978515625, 2.39697265625, 2.50091552734375, 2.6048583984375, 2.70880126953125, 2.812744140625, 2.91668701171875, 3.0206298828125, 3.12457275390625, 3.228515625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 3.0, 10.0, 10.0, 16.0, 12.0, 32.0, 41.0, 63.0, 100.0, 137.0, 214.0, 381.0, 606.0, 967.0, 1764.0, 3272.0, 6472.0, 14159.0, 32317.0, 85225.0, 241519.0, 377921.0, 174343.0, 61837.0, 24872.0, 10950.0, 5233.0, 2717.0, 1304.0, 783.0, 462.0, 298.0, 171.0, 118.0, 70.0, 47.0, 41.0, 31.0, 12.0, 10.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.060546875, -1.996826171875, -1.93310546875, -1.869384765625, -1.8056640625, -1.741943359375, -1.67822265625, -1.614501953125, -1.55078125, -1.487060546875, -1.42333984375, -1.359619140625, -1.2958984375, -1.232177734375, -1.16845703125, -1.104736328125, -1.041015625, -0.977294921875, -0.91357421875, -0.849853515625, -0.7861328125, -0.722412109375, -0.65869140625, -0.594970703125, -0.53125, -0.467529296875, -0.40380859375, -0.340087890625, -0.2763671875, -0.212646484375, -0.14892578125, -0.085205078125, -0.021484375, 0.042236328125, 0.10595703125, 0.169677734375, 0.2333984375, 0.297119140625, 0.36083984375, 0.424560546875, 0.48828125, 0.552001953125, 0.61572265625, 0.679443359375, 0.7431640625, 0.806884765625, 0.87060546875, 0.934326171875, 0.998046875, 1.061767578125, 1.12548828125, 1.189208984375, 1.2529296875, 1.316650390625, 1.38037109375, 1.444091796875, 1.5078125, 1.571533203125, 1.63525390625, 1.698974609375, 1.7626953125, 1.826416015625, 1.89013671875, 1.953857421875, 2.017578125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 6.0, 9.0, 7.0, 4.0, 13.0, 9.0, 16.0, 17.0, 25.0, 44.0, 41.0, 50.0, 56.0, 68.0, 96.0, 79.0, 73.0, 78.0, 68.0, 53.0, 43.0, 37.0, 28.0, 20.0, 12.0, 11.0, 8.0, 6.0, 4.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.784366607666016e-05, -7.53793865442276e-05, -7.291510701179504e-05, -7.045082747936249e-05, -6.798654794692993e-05, -6.552226841449738e-05, -6.305798888206482e-05, -6.059370934963226e-05, -5.812942981719971e-05, -5.566515028476715e-05, -5.3200870752334595e-05, -5.073659121990204e-05, -4.827231168746948e-05, -4.5808032155036926e-05, -4.334375262260437e-05, -4.0879473090171814e-05, -3.841519355773926e-05, -3.59509140253067e-05, -3.3486634492874146e-05, -3.102235496044159e-05, -2.8558075428009033e-05, -2.6093795895576477e-05, -2.362951636314392e-05, -2.1165236830711365e-05, -1.870095729827881e-05, -1.6236677765846252e-05, -1.3772398233413696e-05, -1.130811870098114e-05, -8.843839168548584e-06, -6.379559636116028e-06, -3.915280103683472e-06, -1.4510005712509155e-06, 1.0132789611816406e-06, 3.4775584936141968e-06, 5.941838026046753e-06, 8.406117558479309e-06, 1.0870397090911865e-05, 1.3334676623344421e-05, 1.5798956155776978e-05, 1.8263235688209534e-05, 2.072751522064209e-05, 2.3191794753074646e-05, 2.5656074285507202e-05, 2.8120353817939758e-05, 3.0584633350372314e-05, 3.304891288280487e-05, 3.551319241523743e-05, 3.797747194766998e-05, 4.044175148010254e-05, 4.2906031012535095e-05, 4.537031054496765e-05, 4.783459007740021e-05, 5.0298869609832764e-05, 5.276314914226532e-05, 5.5227428674697876e-05, 5.769170820713043e-05, 6.015598773956299e-05, 6.262026727199554e-05, 6.50845468044281e-05, 6.754882633686066e-05, 7.001310586929321e-05, 7.247738540172577e-05, 7.494166493415833e-05, 7.740594446659088e-05, 7.987022399902344e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 6.0, 13.0, 15.0, 32.0, 50.0, 79.0, 112.0, 184.0, 255.0, 383.0, 564.0, 975.0, 1763.0, 3135.0, 5807.0, 11872.0, 25440.0, 59941.0, 146921.0, 290096.0, 272251.0, 130115.0, 52715.0, 22710.0, 10691.0, 5418.0, 2874.0, 1560.0, 898.0, 596.0, 359.0, 243.0, 155.0, 90.0, 73.0, 57.0, 34.0, 18.0, 10.0, 11.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5458984375, -1.492462158203125, -1.43902587890625, -1.385589599609375, -1.3321533203125, -1.278717041015625, -1.22528076171875, -1.171844482421875, -1.118408203125, -1.064971923828125, -1.01153564453125, -0.958099365234375, -0.9046630859375, -0.851226806640625, -0.79779052734375, -0.744354248046875, -0.69091796875, -0.637481689453125, -0.58404541015625, -0.530609130859375, -0.4771728515625, -0.423736572265625, -0.37030029296875, -0.316864013671875, -0.263427734375, -0.209991455078125, -0.15655517578125, -0.103118896484375, -0.0496826171875, 0.003753662109375, 0.05718994140625, 0.110626220703125, 0.1640625, 0.217498779296875, 0.27093505859375, 0.324371337890625, 0.3778076171875, 0.431243896484375, 0.48468017578125, 0.538116455078125, 0.591552734375, 0.644989013671875, 0.69842529296875, 0.751861572265625, 0.8052978515625, 0.858734130859375, 0.91217041015625, 0.965606689453125, 1.01904296875, 1.072479248046875, 1.12591552734375, 1.179351806640625, 1.2327880859375, 1.286224365234375, 1.33966064453125, 1.393096923828125, 1.446533203125, 1.499969482421875, 1.55340576171875, 1.606842041015625, 1.6602783203125, 1.713714599609375, 1.76715087890625, 1.820587158203125, 1.8740234375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 8.0, 3.0, 7.0, 12.0, 6.0, 13.0, 8.0, 15.0, 15.0, 23.0, 21.0, 17.0, 28.0, 32.0, 31.0, 43.0, 58.0, 62.0, 60.0, 79.0, 54.0, 61.0, 51.0, 52.0, 44.0, 31.0, 24.0, 22.0, 21.0, 18.0, 13.0, 11.0, 8.0, 10.0, 5.0, 13.0, 8.0, 6.0, 5.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.377197265625, -0.36551666259765625, -0.3538360595703125, -0.34215545654296875, -0.330474853515625, -0.31879425048828125, -0.3071136474609375, -0.29543304443359375, -0.28375244140625, -0.27207183837890625, -0.2603912353515625, -0.24871063232421875, -0.237030029296875, -0.22534942626953125, -0.2136688232421875, -0.20198822021484375, -0.1903076171875, -0.17862701416015625, -0.1669464111328125, -0.15526580810546875, -0.143585205078125, -0.13190460205078125, -0.1202239990234375, -0.10854339599609375, -0.09686279296875, -0.08518218994140625, -0.0735015869140625, -0.06182098388671875, -0.050140380859375, -0.03845977783203125, -0.0267791748046875, -0.01509857177734375, -0.00341796875, 0.00826263427734375, 0.0199432373046875, 0.03162384033203125, 0.043304443359375, 0.05498504638671875, 0.0666656494140625, 0.07834625244140625, 0.09002685546875, 0.10170745849609375, 0.1133880615234375, 0.12506866455078125, 0.136749267578125, 0.14842987060546875, 0.1601104736328125, 0.17179107666015625, 0.1834716796875, 0.19515228271484375, 0.2068328857421875, 0.21851348876953125, 0.230194091796875, 0.24187469482421875, 0.2535552978515625, 0.26523590087890625, 0.27691650390625, 0.28859710693359375, 0.3002777099609375, 0.31195831298828125, 0.323638916015625, 0.33531951904296875, 0.3470001220703125, 0.35868072509765625, 0.370361328125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 8.0, 11.0, 5.0, 14.0, 18.0, 38.0, 60.0, 99.0, 136.0, 160.0, 135.0, 127.0, 67.0, 48.0, 30.0, 16.0, 8.0, 10.0, 7.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.418651580810547, -23.833621978759766, -23.248592376708984, -22.66356086730957, -22.07853126525879, -21.493501663208008, -20.908470153808594, -20.323440551757812, -19.73841094970703, -19.15338134765625, -18.56835174560547, -17.983320236206055, -17.398290634155273, -16.813261032104492, -16.228229522705078, -15.643199920654297, -15.058170318603516, -14.473140716552734, -13.888110160827637, -13.303079605102539, -12.718050003051758, -12.133020401000977, -11.547989845275879, -10.962959289550781, -10.3779296875, -9.792900085449219, -9.207869529724121, -8.622838973999023, -8.037809371948242, -7.452779293060303, -6.867749214172363, -6.282719135284424, -5.697690010070801, -5.112659931182861, -4.527629852294922, -3.9425997734069824, -3.357569694519043, -2.7725396156311035, -2.187509536743164, -1.6024794578552246, -1.0174493789672852, -0.4324193000793457, 0.15261077880859375, 0.7376408576965332, 1.3226709365844727, 1.907701015472412, 2.4927310943603516, 3.077761173248291, 3.6627912521362305, 4.24782133102417, 4.832851409912109, 5.417881488800049, 6.002911567687988, 6.587941646575928, 7.172971725463867, 7.758001804351807, 8.343031883239746, 8.928062438964844, 9.513092041015625, 10.098121643066406, 10.683152198791504, 11.268182754516602, 11.853212356567383, 12.438241958618164, 13.023272514343262]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 1.0, 10.0, 10.0, 8.0, 6.0, 14.0, 15.0, 29.0, 22.0, 29.0, 26.0, 31.0, 36.0, 42.0, 44.0, 34.0, 51.0, 53.0, 53.0, 37.0, 49.0, 45.0, 43.0, 44.0, 25.0, 29.0, 29.0, 33.0, 26.0, 17.0, 20.0, 15.0, 18.0, 11.0, 5.0, 4.0, 5.0, 10.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.686367511749268, -5.500733375549316, -5.315099239349365, -5.129465103149414, -4.943830966949463, -4.758196830749512, -4.5725626945495605, -4.386928558349609, -4.201294422149658, -4.015660285949707, -3.830026149749756, -3.6443920135498047, -3.4587578773498535, -3.2731237411499023, -3.087489604949951, -2.90185546875, -2.7162210941314697, -2.5305869579315186, -2.3449528217315674, -2.159318685531616, -1.973684549331665, -1.7880504131317139, -1.6024161577224731, -1.416782021522522, -1.2311478853225708, -1.0455137491226196, -0.8598796129226685, -0.6742454171180725, -0.48861128091812134, -0.30297714471817017, -0.11734294891357422, 0.06829118728637695, 0.2539253234863281, 0.4395594596862793, 0.6251935958862305, 0.8108277916908264, 0.9964619278907776, 1.182096004486084, 1.3677302598953247, 1.5533643960952759, 1.738998532295227, 1.9246326684951782, 2.110266923904419, 2.29590106010437, 2.4815351963043213, 2.6671693325042725, 2.8528034687042236, 3.038437604904175, 3.224071741104126, 3.409705877304077, 3.5953400135040283, 3.7809741497039795, 3.9666082859039307, 4.152242660522461, 4.337876796722412, 4.523510932922363, 4.7091450691223145, 4.894779205322266, 5.080413341522217, 5.266047477722168, 5.451681613922119, 5.63731575012207, 5.8229498863220215, 6.008584022521973, 6.194218158721924]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 11.0, 11.0, 18.0, 23.0, 51.0, 73.0, 98.0, 155.0, 197.0, 327.0, 507.0, 860.0, 1400.0, 2339.0, 3844.0, 6710.0, 11952.0, 21587.0, 41710.0, 78042.0, 136078.0, 195617.0, 204053.0, 150009.0, 88622.0, 47182.0, 25226.0, 13357.0, 7570.0, 4322.0, 2523.0, 1510.0, 975.0, 554.0, 357.0, 248.0, 146.0, 93.0, 58.0, 38.0, 34.0, 26.0, 17.0, 6.0, 6.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.42681884765625, -5.2403564453125, -5.05389404296875, -4.867431640625, -4.68096923828125, -4.4945068359375, -4.30804443359375, -4.12158203125, -3.93511962890625, -3.7486572265625, -3.56219482421875, -3.375732421875, -3.18927001953125, -3.0028076171875, -2.81634521484375, -2.6298828125, -2.44342041015625, -2.2569580078125, -2.07049560546875, -1.884033203125, -1.69757080078125, -1.5111083984375, -1.32464599609375, -1.13818359375, -0.95172119140625, -0.7652587890625, -0.57879638671875, -0.392333984375, -0.20587158203125, -0.0194091796875, 0.16705322265625, 0.353515625, 0.53997802734375, 0.7264404296875, 0.91290283203125, 1.099365234375, 1.28582763671875, 1.4722900390625, 1.65875244140625, 1.84521484375, 2.03167724609375, 2.2181396484375, 2.40460205078125, 2.591064453125, 2.77752685546875, 2.9639892578125, 3.15045166015625, 3.3369140625, 3.52337646484375, 3.7098388671875, 3.89630126953125, 4.082763671875, 4.26922607421875, 4.4556884765625, 4.64215087890625, 4.82861328125, 5.01507568359375, 5.2015380859375, 5.38800048828125, 5.574462890625, 5.76092529296875, 5.9473876953125, 6.13385009765625, 6.3203125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 15.0, 8.0, 14.0, 20.0, 23.0, 29.0, 29.0, 33.0, 33.0, 44.0, 45.0, 50.0, 49.0, 59.0, 63.0, 50.0, 46.0, 48.0, 46.0, 38.0, 37.0, 31.0, 34.0, 32.0, 17.0, 16.0, 14.0, 7.0, 16.0, 9.0, 7.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.33203125, -6.11053466796875, -5.8890380859375, -5.66754150390625, -5.446044921875, -5.22454833984375, -5.0030517578125, -4.78155517578125, -4.56005859375, -4.33856201171875, -4.1170654296875, -3.89556884765625, -3.674072265625, -3.45257568359375, -3.2310791015625, -3.00958251953125, -2.7880859375, -2.56658935546875, -2.3450927734375, -2.12359619140625, -1.902099609375, -1.68060302734375, -1.4591064453125, -1.23760986328125, -1.01611328125, -0.79461669921875, -0.5731201171875, -0.35162353515625, -0.130126953125, 0.09136962890625, 0.3128662109375, 0.53436279296875, 0.755859375, 0.97735595703125, 1.1988525390625, 1.42034912109375, 1.641845703125, 1.86334228515625, 2.0848388671875, 2.30633544921875, 2.52783203125, 2.74932861328125, 2.9708251953125, 3.19232177734375, 3.413818359375, 3.63531494140625, 3.8568115234375, 4.07830810546875, 4.2998046875, 4.52130126953125, 4.7427978515625, 4.96429443359375, 5.185791015625, 5.40728759765625, 5.6287841796875, 5.85028076171875, 6.07177734375, 6.29327392578125, 6.5147705078125, 6.73626708984375, 6.957763671875, 7.17926025390625, 7.4007568359375, 7.62225341796875, 7.84375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 9.0, 11.0, 12.0, 21.0, 22.0, 49.0, 78.0, 143.0, 190.0, 339.0, 610.0, 1103.0, 2084.0, 3696.0, 7526.0, 14794.0, 29994.0, 59645.0, 112618.0, 185530.0, 222434.0, 181205.0, 109720.0, 58138.0, 29036.0, 14226.0, 7143.0, 3789.0, 1877.0, 1102.0, 592.0, 321.0, 204.0, 105.0, 78.0, 45.0, 30.0, 16.0, 12.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.037353515625, -5.83251953125, -5.627685546875, -5.4228515625, -5.218017578125, -5.01318359375, -4.808349609375, -4.603515625, -4.398681640625, -4.19384765625, -3.989013671875, -3.7841796875, -3.579345703125, -3.37451171875, -3.169677734375, -2.96484375, -2.760009765625, -2.55517578125, -2.350341796875, -2.1455078125, -1.940673828125, -1.73583984375, -1.531005859375, -1.326171875, -1.121337890625, -0.91650390625, -0.711669921875, -0.5068359375, -0.302001953125, -0.09716796875, 0.107666015625, 0.3125, 0.517333984375, 0.72216796875, 0.927001953125, 1.1318359375, 1.336669921875, 1.54150390625, 1.746337890625, 1.951171875, 2.156005859375, 2.36083984375, 2.565673828125, 2.7705078125, 2.975341796875, 3.18017578125, 3.385009765625, 3.58984375, 3.794677734375, 3.99951171875, 4.204345703125, 4.4091796875, 4.614013671875, 4.81884765625, 5.023681640625, 5.228515625, 5.433349609375, 5.63818359375, 5.843017578125, 6.0478515625, 6.252685546875, 6.45751953125, 6.662353515625, 6.8671875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 9.0, 7.0, 10.0, 13.0, 16.0, 27.0, 21.0, 22.0, 27.0, 29.0, 29.0, 35.0, 45.0, 40.0, 52.0, 40.0, 40.0, 42.0, 53.0, 50.0, 44.0, 42.0, 29.0, 33.0, 25.0, 35.0, 27.0, 19.0, 29.0, 16.0, 12.0, 13.0, 13.0, 8.0, 14.0, 6.0, 1.0, 7.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.208984375, -3.095550537109375, -2.98211669921875, -2.868682861328125, -2.7552490234375, -2.641815185546875, -2.52838134765625, -2.414947509765625, -2.301513671875, -2.188079833984375, -2.07464599609375, -1.961212158203125, -1.8477783203125, -1.734344482421875, -1.62091064453125, -1.507476806640625, -1.39404296875, -1.280609130859375, -1.16717529296875, -1.053741455078125, -0.9403076171875, -0.826873779296875, -0.71343994140625, -0.600006103515625, -0.486572265625, -0.373138427734375, -0.25970458984375, -0.146270751953125, -0.0328369140625, 0.080596923828125, 0.19403076171875, 0.307464599609375, 0.4208984375, 0.534332275390625, 0.64776611328125, 0.761199951171875, 0.8746337890625, 0.988067626953125, 1.10150146484375, 1.214935302734375, 1.328369140625, 1.441802978515625, 1.55523681640625, 1.668670654296875, 1.7821044921875, 1.895538330078125, 2.00897216796875, 2.122406005859375, 2.23583984375, 2.349273681640625, 2.46270751953125, 2.576141357421875, 2.6895751953125, 2.803009033203125, 2.91644287109375, 3.029876708984375, 3.143310546875, 3.256744384765625, 3.37017822265625, 3.483612060546875, 3.5970458984375, 3.710479736328125, 3.82391357421875, 3.937347412109375, 4.05078125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 15.0, 16.0, 26.0, 50.0, 50.0, 74.0, 99.0, 146.0, 191.0, 325.0, 490.0, 757.0, 1191.0, 2057.0, 3662.0, 6525.0, 11963.0, 23049.0, 44396.0, 85892.0, 153464.0, 217060.0, 205989.0, 135610.0, 73421.0, 37987.0, 19700.0, 10545.0, 5716.0, 3187.0, 1854.0, 1023.0, 708.0, 418.0, 257.0, 176.0, 119.0, 99.0, 62.0, 54.0, 42.0, 30.0, 13.0, 16.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.60888671875, -2.5185546875, -2.42822265625, -2.337890625, -2.24755859375, -2.1572265625, -2.06689453125, -1.9765625, -1.88623046875, -1.7958984375, -1.70556640625, -1.615234375, -1.52490234375, -1.4345703125, -1.34423828125, -1.25390625, -1.16357421875, -1.0732421875, -0.98291015625, -0.892578125, -0.80224609375, -0.7119140625, -0.62158203125, -0.53125, -0.44091796875, -0.3505859375, -0.26025390625, -0.169921875, -0.07958984375, 0.0107421875, 0.10107421875, 0.19140625, 0.28173828125, 0.3720703125, 0.46240234375, 0.552734375, 0.64306640625, 0.7333984375, 0.82373046875, 0.9140625, 1.00439453125, 1.0947265625, 1.18505859375, 1.275390625, 1.36572265625, 1.4560546875, 1.54638671875, 1.63671875, 1.72705078125, 1.8173828125, 1.90771484375, 1.998046875, 2.08837890625, 2.1787109375, 2.26904296875, 2.359375, 2.44970703125, 2.5400390625, 2.63037109375, 2.720703125, 2.81103515625, 2.9013671875, 2.99169921875, 3.08203125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 5.0, 12.0, 4.0, 10.0, 9.0, 11.0, 15.0, 24.0, 18.0, 33.0, 30.0, 35.0, 46.0, 38.0, 36.0, 54.0, 36.0, 55.0, 52.0, 59.0, 48.0, 47.0, 47.0, 40.0, 32.0, 28.0, 25.0, 25.0, 23.0, 15.0, 13.0, 13.0, 11.0, 4.0, 10.0, 10.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017440319061279297, -0.00016897358000278473, -0.0001635439693927765, -0.00015811435878276825, -0.00015268474817276, -0.00014725513756275177, -0.00014182552695274353, -0.0001363959163427353, -0.00013096630573272705, -0.0001255366951227188, -0.00012010708451271057, -0.00011467747390270233, -0.00010924786329269409, -0.00010381825268268585, -9.838864207267761e-05, -9.295903146266937e-05, -8.752942085266113e-05, -8.209981024265289e-05, -7.667019963264465e-05, -7.124058902263641e-05, -6.581097841262817e-05, -6.0381367802619934e-05, -5.4951757192611694e-05, -4.9522146582603455e-05, -4.4092535972595215e-05, -3.8662925362586975e-05, -3.3233314752578735e-05, -2.7803704142570496e-05, -2.2374093532562256e-05, -1.6944482922554016e-05, -1.1514872312545776e-05, -6.085261702537537e-06, -6.556510925292969e-07, 4.773959517478943e-06, 1.0203570127487183e-05, 1.5633180737495422e-05, 2.1062791347503662e-05, 2.6492401957511902e-05, 3.192201256752014e-05, 3.735162317752838e-05, 4.278123378753662e-05, 4.821084439754486e-05, 5.36404550075531e-05, 5.907006561756134e-05, 6.449967622756958e-05, 6.992928683757782e-05, 7.535889744758606e-05, 8.07885080575943e-05, 8.621811866760254e-05, 9.164772927761078e-05, 9.707733988761902e-05, 0.00010250695049762726, 0.0001079365611076355, 0.00011336617171764374, 0.00011879578232765198, 0.00012422539293766022, 0.00012965500354766846, 0.0001350846141576767, 0.00014051422476768494, 0.00014594383537769318, 0.00015137344598770142, 0.00015680305659770966, 0.0001622326672077179, 0.00016766227781772614, 0.00017309188842773438]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 11.0, 10.0, 14.0, 20.0, 26.0, 33.0, 49.0, 54.0, 86.0, 151.0, 171.0, 265.0, 507.0, 844.0, 1609.0, 3299.0, 7060.0, 16246.0, 40014.0, 97698.0, 212139.0, 292363.0, 209654.0, 97023.0, 39170.0, 16094.0, 6972.0, 3218.0, 1619.0, 807.0, 428.0, 270.0, 169.0, 134.0, 90.0, 60.0, 59.0, 25.0, 24.0, 21.0, 14.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1796875, -3.06402587890625, -2.9483642578125, -2.83270263671875, -2.717041015625, -2.60137939453125, -2.4857177734375, -2.37005615234375, -2.25439453125, -2.13873291015625, -2.0230712890625, -1.90740966796875, -1.791748046875, -1.67608642578125, -1.5604248046875, -1.44476318359375, -1.3291015625, -1.21343994140625, -1.0977783203125, -0.98211669921875, -0.866455078125, -0.75079345703125, -0.6351318359375, -0.51947021484375, -0.40380859375, -0.28814697265625, -0.1724853515625, -0.05682373046875, 0.058837890625, 0.17449951171875, 0.2901611328125, 0.40582275390625, 0.521484375, 0.63714599609375, 0.7528076171875, 0.86846923828125, 0.984130859375, 1.09979248046875, 1.2154541015625, 1.33111572265625, 1.44677734375, 1.56243896484375, 1.6781005859375, 1.79376220703125, 1.909423828125, 2.02508544921875, 2.1407470703125, 2.25640869140625, 2.3720703125, 2.48773193359375, 2.6033935546875, 2.71905517578125, 2.834716796875, 2.95037841796875, 3.0660400390625, 3.18170166015625, 3.29736328125, 3.41302490234375, 3.5286865234375, 3.64434814453125, 3.760009765625, 3.87567138671875, 3.9913330078125, 4.10699462890625, 4.22265625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 8.0, 6.0, 7.0, 8.0, 12.0, 9.0, 11.0, 19.0, 20.0, 16.0, 25.0, 49.0, 27.0, 37.0, 44.0, 53.0, 58.0, 49.0, 63.0, 52.0, 51.0, 55.0, 48.0, 39.0, 44.0, 31.0, 34.0, 21.0, 24.0, 19.0, 12.0, 13.0, 13.0, 5.0, 8.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6347808837890625, -0.611358642578125, -0.5879364013671875, -0.56451416015625, -0.5410919189453125, -0.517669677734375, -0.4942474365234375, -0.4708251953125, -0.4474029541015625, -0.423980712890625, -0.4005584716796875, -0.37713623046875, -0.3537139892578125, -0.330291748046875, -0.3068695068359375, -0.283447265625, -0.2600250244140625, -0.236602783203125, -0.2131805419921875, -0.18975830078125, -0.1663360595703125, -0.142913818359375, -0.1194915771484375, -0.0960693359375, -0.0726470947265625, -0.049224853515625, -0.0258026123046875, -0.00238037109375, 0.0210418701171875, 0.044464111328125, 0.0678863525390625, 0.09130859375, 0.1147308349609375, 0.138153076171875, 0.1615753173828125, 0.18499755859375, 0.2084197998046875, 0.231842041015625, 0.2552642822265625, 0.2786865234375, 0.3021087646484375, 0.325531005859375, 0.3489532470703125, 0.37237548828125, 0.3957977294921875, 0.419219970703125, 0.4426422119140625, 0.466064453125, 0.4894866943359375, 0.512908935546875, 0.5363311767578125, 0.55975341796875, 0.5831756591796875, 0.606597900390625, 0.6300201416015625, 0.6534423828125, 0.6768646240234375, 0.700286865234375, 0.7237091064453125, 0.74713134765625, 0.7705535888671875, 0.793975830078125, 0.8173980712890625, 0.8408203125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 15.0, 15.0, 25.0, 51.0, 73.0, 116.0, 153.0, 134.0, 133.0, 103.0, 64.0, 35.0, 23.0, 15.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.390901565551758, -21.834444046020508, -21.27798843383789, -20.72153091430664, -20.16507339477539, -19.60861587524414, -19.052160263061523, -18.495702743530273, -17.939247131347656, -17.382789611816406, -16.82633399963379, -16.26987648010254, -15.713418960571289, -15.156962394714355, -14.600505828857422, -14.044048309326172, -13.487590789794922, -12.931134223937988, -12.374676704406738, -11.818220138549805, -11.261762619018555, -10.705306053161621, -10.148849487304688, -9.592391967773438, -9.035935401916504, -8.47947883605957, -7.92302131652832, -7.366564750671387, -6.810107707977295, -6.253650665283203, -5.6971940994262695, -5.140737056732178, -4.584280014038086, -4.027822971343994, -3.4713661670684814, -2.9149093627929688, -2.358452320098877, -1.8019952774047852, -1.2455384731292725, -0.6890816688537598, -0.13262462615966797, 0.4238322973251343, 0.9802892208099365, 1.5367461442947388, 2.093203067779541, 2.649660110473633, 3.2061169147491455, 3.762573719024658, 4.31903076171875, 4.875487804412842, 5.431944847106934, 5.988401412963867, 6.544858455657959, 7.101315498352051, 7.657772064208984, 8.214229583740234, 8.770686149597168, 9.327142715454102, 9.883600234985352, 10.440056800842285, 10.996513366699219, 11.552970886230469, 12.109427452087402, 12.665884017944336, 13.222341537475586]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 7.0, 10.0, 7.0, 17.0, 10.0, 15.0, 16.0, 24.0, 29.0, 26.0, 34.0, 27.0, 32.0, 45.0, 44.0, 24.0, 47.0, 43.0, 40.0, 42.0, 37.0, 48.0, 43.0, 34.0, 24.0, 26.0, 40.0, 24.0, 33.0, 21.0, 11.0, 13.0, 15.0, 14.0, 10.0, 13.0, 4.0, 5.0, 8.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-5.121384620666504, -4.95353364944458, -4.785682201385498, -4.617831230163574, -4.44998025894165, -4.282129287719727, -4.1142778396606445, -3.9464268684387207, -3.778575897216797, -3.610724687576294, -3.44287371635437, -3.275022506713867, -3.1071715354919434, -2.9393203258514404, -2.7714691162109375, -2.6036181449890137, -2.4357669353485107, -2.267915725708008, -2.100064754486084, -1.932213544845581, -1.7643625736236572, -1.5965113639831543, -1.428660273551941, -1.2608091831207275, -1.0929580926895142, -0.9251070022583008, -0.7572559118270874, -0.5894047617912292, -0.42155367136001587, -0.2537025809288025, -0.08585143089294434, 0.08199965953826904, 0.24985074996948242, 0.4177018404006958, 0.5855529308319092, 0.7534040808677673, 0.9212551712989807, 1.0891063213348389, 1.2569574117660522, 1.4248085021972656, 1.592659592628479, 1.7605106830596924, 1.9283617734909058, 2.096212863922119, 2.264064073562622, 2.431915044784546, 2.599766254425049, 2.7676172256469727, 2.9354684352874756, 3.1033196449279785, 3.2711706161499023, 3.4390218257904053, 3.606872797012329, 3.774724006652832, 3.942574977874756, 4.11042594909668, 4.278277397155762, 4.4461283683776855, 4.613979816436768, 4.781830787658691, 4.949681758880615, 5.117532730102539, 5.285384178161621, 5.453235149383545, 5.621086120605469]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 10.0, 12.0, 10.0, 20.0, 29.0, 41.0, 57.0, 85.0, 116.0, 177.0, 288.0, 355.0, 599.0, 879.0, 1493.0, 2363.0, 3821.0, 6575.0, 12141.0, 25232.0, 64131.0, 223690.0, 932350.0, 1871904.0, 760020.0, 179736.0, 55171.0, 23322.0, 11923.0, 6687.0, 3897.0, 2439.0, 1528.0, 1039.0, 681.0, 433.0, 290.0, 213.0, 160.0, 107.0, 75.0, 54.0, 35.0, 36.0, 16.0, 14.0, 9.0, 6.0, 8.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0], "bins": [-12.9765625, -12.576416015625, -12.17626953125, -11.776123046875, -11.3759765625, -10.975830078125, -10.57568359375, -10.175537109375, -9.775390625, -9.375244140625, -8.97509765625, -8.574951171875, -8.1748046875, -7.774658203125, -7.37451171875, -6.974365234375, -6.57421875, -6.174072265625, -5.77392578125, -5.373779296875, -4.9736328125, -4.573486328125, -4.17333984375, -3.773193359375, -3.373046875, -2.972900390625, -2.57275390625, -2.172607421875, -1.7724609375, -1.372314453125, -0.97216796875, -0.572021484375, -0.171875, 0.228271484375, 0.62841796875, 1.028564453125, 1.4287109375, 1.828857421875, 2.22900390625, 2.629150390625, 3.029296875, 3.429443359375, 3.82958984375, 4.229736328125, 4.6298828125, 5.030029296875, 5.43017578125, 5.830322265625, 6.23046875, 6.630615234375, 7.03076171875, 7.430908203125, 7.8310546875, 8.231201171875, 8.63134765625, 9.031494140625, 9.431640625, 9.831787109375, 10.23193359375, 10.632080078125, 11.0322265625, 11.432373046875, 11.83251953125, 12.232666015625, 12.6328125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 7.0, 7.0, 5.0, 17.0, 19.0, 14.0, 12.0, 10.0, 20.0, 29.0, 34.0, 37.0, 38.0, 43.0, 59.0, 40.0, 36.0, 47.0, 40.0, 54.0, 48.0, 42.0, 47.0, 32.0, 36.0, 28.0, 37.0, 20.0, 25.0, 18.0, 13.0, 11.0, 15.0, 13.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.34375, -4.20880126953125, -4.0738525390625, -3.93890380859375, -3.803955078125, -3.66900634765625, -3.5340576171875, -3.39910888671875, -3.26416015625, -3.12921142578125, -2.9942626953125, -2.85931396484375, -2.724365234375, -2.58941650390625, -2.4544677734375, -2.31951904296875, -2.1845703125, -2.04962158203125, -1.9146728515625, -1.77972412109375, -1.644775390625, -1.50982666015625, -1.3748779296875, -1.23992919921875, -1.10498046875, -0.97003173828125, -0.8350830078125, -0.70013427734375, -0.565185546875, -0.43023681640625, -0.2952880859375, -0.16033935546875, -0.025390625, 0.10955810546875, 0.2445068359375, 0.37945556640625, 0.514404296875, 0.64935302734375, 0.7843017578125, 0.91925048828125, 1.05419921875, 1.18914794921875, 1.3240966796875, 1.45904541015625, 1.593994140625, 1.72894287109375, 1.8638916015625, 1.99884033203125, 2.1337890625, 2.26873779296875, 2.4036865234375, 2.53863525390625, 2.673583984375, 2.80853271484375, 2.9434814453125, 3.07843017578125, 3.21337890625, 3.34832763671875, 3.4832763671875, 3.61822509765625, 3.753173828125, 3.88812255859375, 4.0230712890625, 4.15802001953125, 4.29296875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 6.0, 24.0, 25.0, 35.0, 55.0, 77.0, 139.0, 229.0, 343.0, 553.0, 913.0, 1525.0, 2553.0, 4294.0, 7599.0, 13629.0, 26086.0, 56007.0, 144541.0, 472255.0, 1407689.0, 1360993.0, 445860.0, 138213.0, 54084.0, 25620.0, 13104.0, 7350.0, 4251.0, 2475.0, 1450.0, 876.0, 535.0, 343.0, 196.0, 121.0, 90.0, 46.0, 36.0, 10.0, 17.0, 7.0, 4.0, 6.0, 7.0, 6.0, 1.0, 0.0, 3.0], "bins": [-13.921875, -13.534912109375, -13.14794921875, -12.760986328125, -12.3740234375, -11.987060546875, -11.60009765625, -11.213134765625, -10.826171875, -10.439208984375, -10.05224609375, -9.665283203125, -9.2783203125, -8.891357421875, -8.50439453125, -8.117431640625, -7.73046875, -7.343505859375, -6.95654296875, -6.569580078125, -6.1826171875, -5.795654296875, -5.40869140625, -5.021728515625, -4.634765625, -4.247802734375, -3.86083984375, -3.473876953125, -3.0869140625, -2.699951171875, -2.31298828125, -1.926025390625, -1.5390625, -1.152099609375, -0.76513671875, -0.378173828125, 0.0087890625, 0.395751953125, 0.78271484375, 1.169677734375, 1.556640625, 1.943603515625, 2.33056640625, 2.717529296875, 3.1044921875, 3.491455078125, 3.87841796875, 4.265380859375, 4.65234375, 5.039306640625, 5.42626953125, 5.813232421875, 6.2001953125, 6.587158203125, 6.97412109375, 7.361083984375, 7.748046875, 8.135009765625, 8.52197265625, 8.908935546875, 9.2958984375, 9.682861328125, 10.06982421875, 10.456787109375, 10.84375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 6.0, 13.0, 13.0, 16.0, 26.0, 26.0, 35.0, 39.0, 59.0, 71.0, 96.0, 129.0, 174.0, 219.0, 264.0, 321.0, 350.0, 373.0, 333.0, 304.0, 247.0, 217.0, 154.0, 129.0, 112.0, 60.0, 65.0, 38.0, 45.0, 33.0, 18.0, 14.0, 14.0, 16.0, 9.0, 5.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.921875, -2.832122802734375, -2.74237060546875, -2.652618408203125, -2.5628662109375, -2.473114013671875, -2.38336181640625, -2.293609619140625, -2.203857421875, -2.114105224609375, -2.02435302734375, -1.934600830078125, -1.8448486328125, -1.755096435546875, -1.66534423828125, -1.575592041015625, -1.48583984375, -1.396087646484375, -1.30633544921875, -1.216583251953125, -1.1268310546875, -1.037078857421875, -0.94732666015625, -0.857574462890625, -0.767822265625, -0.678070068359375, -0.58831787109375, -0.498565673828125, -0.4088134765625, -0.319061279296875, -0.22930908203125, -0.139556884765625, -0.0498046875, 0.039947509765625, 0.12969970703125, 0.219451904296875, 0.3092041015625, 0.398956298828125, 0.48870849609375, 0.578460693359375, 0.668212890625, 0.757965087890625, 0.84771728515625, 0.937469482421875, 1.0272216796875, 1.116973876953125, 1.20672607421875, 1.296478271484375, 1.38623046875, 1.475982666015625, 1.56573486328125, 1.655487060546875, 1.7452392578125, 1.834991455078125, 1.92474365234375, 2.014495849609375, 2.104248046875, 2.194000244140625, 2.28375244140625, 2.373504638671875, 2.4632568359375, 2.553009033203125, 2.64276123046875, 2.732513427734375, 2.822265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 11.0, 8.0, 8.0, 18.0, 32.0, 33.0, 57.0, 91.0, 152.0, 145.0, 130.0, 115.0, 62.0, 51.0, 32.0, 22.0, 8.0, 12.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.550376892089844, -20.00428581237793, -19.458194732666016, -18.9121036529541, -18.366012573242188, -17.819923400878906, -17.27383041381836, -16.727741241455078, -16.181650161743164, -15.63555908203125, -15.089468002319336, -14.543376922607422, -13.997286796569824, -13.45119571685791, -12.905104637145996, -12.359013557434082, -11.812922477722168, -11.266831398010254, -10.72074031829834, -10.174650192260742, -9.628559112548828, -9.082468032836914, -8.536376953125, -7.990285873413086, -7.44419527053833, -6.898104190826416, -6.35201358795166, -5.805922508239746, -5.259831428527832, -4.713740825653076, -4.167649745941162, -3.621558904647827, -3.0754690170288086, -2.5293781757354736, -1.9832872152328491, -1.4371962547302246, -0.8911054134368896, -0.3450145721435547, 0.20107650756835938, 0.7471673488616943, 1.2932581901550293, 1.8393490314483643, 2.385439872741699, 2.9315309524536133, 3.4776217937469482, 4.023712635040283, 4.569803714752197, 5.115894317626953, 5.661985397338867, 6.208076477050781, 6.754167079925537, 7.300258159637451, 7.846348762512207, 8.392439842224121, 8.938530921936035, 9.48462200164795, 10.030712127685547, 10.576803207397461, 11.122894287109375, 11.668985366821289, 12.215075492858887, 12.7611665725708, 13.307257652282715, 13.853348731994629, 14.399439811706543]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 11.0, 5.0, 13.0, 13.0, 12.0, 18.0, 12.0, 12.0, 29.0, 29.0, 32.0, 39.0, 45.0, 52.0, 37.0, 52.0, 42.0, 46.0, 42.0, 45.0, 34.0, 50.0, 45.0, 32.0, 41.0, 28.0, 24.0, 15.0, 27.0, 16.0, 19.0, 9.0, 14.0, 9.0, 12.0, 12.0, 3.0, 1.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.3932414054870605, -5.21558141708374, -5.03792142868042, -4.8602614402771, -4.682601451873779, -4.504941463470459, -4.327281951904297, -4.149621963500977, -3.971961736679077, -3.794301748275757, -3.6166417598724365, -3.4389820098876953, -3.261322021484375, -3.0836620330810547, -2.9060020446777344, -2.728342056274414, -2.5506820678710938, -2.3730220794677734, -2.195362091064453, -2.017702102661133, -1.840042233467102, -1.6623822450637817, -1.484722375869751, -1.3070623874664307, -1.1294023990631104, -0.95174241065979, -0.7740824818611145, -0.596422553062439, -0.41876256465911865, -0.24110257625579834, -0.06344270706176758, 0.11421728134155273, 0.29187774658203125, 0.4695377051830292, 0.6471976637840271, 0.8248575925827026, 1.002517580986023, 1.1801775693893433, 1.357837438583374, 1.5354974269866943, 1.7131574153900146, 1.890817403793335, 2.0684773921966553, 2.2461371421813965, 2.423797130584717, 2.601457118988037, 2.7791171073913574, 2.9567770957946777, 3.134437084197998, 3.3120970726013184, 3.4897570610046387, 3.667417049407959, 3.8450770378112793, 4.0227370262146, 4.200396537780762, 4.378056526184082, 4.555716514587402, 4.733376502990723, 4.911036491394043, 5.088696479797363, 5.266356468200684, 5.444016456604004, 5.621676445007324, 5.7993364334106445, 5.976996421813965]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 5.0, 11.0, 15.0, 21.0, 34.0, 42.0, 71.0, 113.0, 148.0, 234.0, 313.0, 522.0, 781.0, 1228.0, 1945.0, 3232.0, 5237.0, 8964.0, 15778.0, 28061.0, 51888.0, 95986.0, 167766.0, 223434.0, 189945.0, 113315.0, 60878.0, 33337.0, 18640.0, 10471.0, 6254.0, 3686.0, 2235.0, 1429.0, 903.0, 567.0, 380.0, 212.0, 150.0, 110.0, 67.0, 49.0, 26.0, 33.0, 10.0, 7.0, 11.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.548828125, -2.46563720703125, -2.3824462890625, -2.29925537109375, -2.216064453125, -2.13287353515625, -2.0496826171875, -1.96649169921875, -1.88330078125, -1.80010986328125, -1.7169189453125, -1.63372802734375, -1.550537109375, -1.46734619140625, -1.3841552734375, -1.30096435546875, -1.2177734375, -1.13458251953125, -1.0513916015625, -0.96820068359375, -0.885009765625, -0.80181884765625, -0.7186279296875, -0.63543701171875, -0.55224609375, -0.46905517578125, -0.3858642578125, -0.30267333984375, -0.219482421875, -0.13629150390625, -0.0531005859375, 0.03009033203125, 0.11328125, 0.19647216796875, 0.2796630859375, 0.36285400390625, 0.446044921875, 0.52923583984375, 0.6124267578125, 0.69561767578125, 0.77880859375, 0.86199951171875, 0.9451904296875, 1.02838134765625, 1.111572265625, 1.19476318359375, 1.2779541015625, 1.36114501953125, 1.4443359375, 1.52752685546875, 1.6107177734375, 1.69390869140625, 1.777099609375, 1.86029052734375, 1.9434814453125, 2.02667236328125, 2.10986328125, 2.19305419921875, 2.2762451171875, 2.35943603515625, 2.442626953125, 2.52581787109375, 2.6090087890625, 2.69219970703125, 2.775390625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 3.0, 8.0, 6.0, 10.0, 12.0, 14.0, 13.0, 21.0, 21.0, 21.0, 25.0, 50.0, 35.0, 38.0, 37.0, 46.0, 43.0, 37.0, 51.0, 53.0, 47.0, 51.0, 36.0, 39.0, 35.0, 35.0, 22.0, 30.0, 17.0, 25.0, 15.0, 18.0, 14.0, 10.0, 11.0, 6.0, 8.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.591064453125, -5.39697265625, -5.202880859375, -5.0087890625, -4.814697265625, -4.62060546875, -4.426513671875, -4.232421875, -4.038330078125, -3.84423828125, -3.650146484375, -3.4560546875, -3.261962890625, -3.06787109375, -2.873779296875, -2.6796875, -2.485595703125, -2.29150390625, -2.097412109375, -1.9033203125, -1.709228515625, -1.51513671875, -1.321044921875, -1.126953125, -0.932861328125, -0.73876953125, -0.544677734375, -0.3505859375, -0.156494140625, 0.03759765625, 0.231689453125, 0.42578125, 0.619873046875, 0.81396484375, 1.008056640625, 1.2021484375, 1.396240234375, 1.59033203125, 1.784423828125, 1.978515625, 2.172607421875, 2.36669921875, 2.560791015625, 2.7548828125, 2.948974609375, 3.14306640625, 3.337158203125, 3.53125, 3.725341796875, 3.91943359375, 4.113525390625, 4.3076171875, 4.501708984375, 4.69580078125, 4.889892578125, 5.083984375, 5.278076171875, 5.47216796875, 5.666259765625, 5.8603515625, 6.054443359375, 6.24853515625, 6.442626953125, 6.63671875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 14.0, 16.0, 16.0, 40.0, 56.0, 81.0, 137.0, 190.0, 298.0, 442.0, 708.0, 1054.0, 1731.0, 2836.0, 4658.0, 7940.0, 13910.0, 25070.0, 45288.0, 83133.0, 148019.0, 219186.0, 204188.0, 128598.0, 70903.0, 38729.0, 21234.0, 12154.0, 6958.0, 4186.0, 2493.0, 1582.0, 957.0, 584.0, 377.0, 257.0, 188.0, 124.0, 77.0, 45.0, 29.0, 31.0, 14.0, 7.0, 5.0, 3.0, 3.0, 0.0, 6.0, 3.0, 1.0], "bins": [-3.181640625, -3.09039306640625, -2.9991455078125, -2.90789794921875, -2.816650390625, -2.72540283203125, -2.6341552734375, -2.54290771484375, -2.45166015625, -2.36041259765625, -2.2691650390625, -2.17791748046875, -2.086669921875, -1.99542236328125, -1.9041748046875, -1.81292724609375, -1.7216796875, -1.63043212890625, -1.5391845703125, -1.44793701171875, -1.356689453125, -1.26544189453125, -1.1741943359375, -1.08294677734375, -0.99169921875, -0.90045166015625, -0.8092041015625, -0.71795654296875, -0.626708984375, -0.53546142578125, -0.4442138671875, -0.35296630859375, -0.26171875, -0.17047119140625, -0.0792236328125, 0.01202392578125, 0.103271484375, 0.19451904296875, 0.2857666015625, 0.37701416015625, 0.46826171875, 0.55950927734375, 0.6507568359375, 0.74200439453125, 0.833251953125, 0.92449951171875, 1.0157470703125, 1.10699462890625, 1.1982421875, 1.28948974609375, 1.3807373046875, 1.47198486328125, 1.563232421875, 1.65447998046875, 1.7457275390625, 1.83697509765625, 1.92822265625, 2.01947021484375, 2.1107177734375, 2.20196533203125, 2.293212890625, 2.38446044921875, 2.4757080078125, 2.56695556640625, 2.658203125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 3.0, 8.0, 16.0, 11.0, 16.0, 19.0, 17.0, 24.0, 16.0, 35.0, 28.0, 30.0, 33.0, 42.0, 35.0, 33.0, 38.0, 47.0, 40.0, 47.0, 42.0, 47.0, 43.0, 33.0, 28.0, 35.0, 28.0, 33.0, 34.0, 23.0, 26.0, 21.0, 16.0, 12.0, 2.0, 7.0, 9.0, 7.0, 4.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.421875, -3.3111572265625, -3.200439453125, -3.0897216796875, -2.97900390625, -2.8682861328125, -2.757568359375, -2.6468505859375, -2.5361328125, -2.4254150390625, -2.314697265625, -2.2039794921875, -2.09326171875, -1.9825439453125, -1.871826171875, -1.7611083984375, -1.650390625, -1.5396728515625, -1.428955078125, -1.3182373046875, -1.20751953125, -1.0968017578125, -0.986083984375, -0.8753662109375, -0.7646484375, -0.6539306640625, -0.543212890625, -0.4324951171875, -0.32177734375, -0.2110595703125, -0.100341796875, 0.0103759765625, 0.12109375, 0.2318115234375, 0.342529296875, 0.4532470703125, 0.56396484375, 0.6746826171875, 0.785400390625, 0.8961181640625, 1.0068359375, 1.1175537109375, 1.228271484375, 1.3389892578125, 1.44970703125, 1.5604248046875, 1.671142578125, 1.7818603515625, 1.892578125, 2.0032958984375, 2.114013671875, 2.2247314453125, 2.33544921875, 2.4461669921875, 2.556884765625, 2.6676025390625, 2.7783203125, 2.8890380859375, 2.999755859375, 3.1104736328125, 3.22119140625, 3.3319091796875, 3.442626953125, 3.5533447265625, 3.6640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 7.0, 12.0, 10.0, 19.0, 28.0, 40.0, 59.0, 110.0, 140.0, 212.0, 337.0, 503.0, 831.0, 1324.0, 2190.0, 3526.0, 6337.0, 11223.0, 21065.0, 41669.0, 86252.0, 183396.0, 288517.0, 203576.0, 97735.0, 46746.0, 23485.0, 12340.0, 6781.0, 3777.0, 2415.0, 1360.0, 866.0, 550.0, 369.0, 240.0, 147.0, 119.0, 70.0, 48.0, 36.0, 19.0, 29.0, 15.0, 10.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.290771484375, -1.24560546875, -1.200439453125, -1.1552734375, -1.110107421875, -1.06494140625, -1.019775390625, -0.974609375, -0.929443359375, -0.88427734375, -0.839111328125, -0.7939453125, -0.748779296875, -0.70361328125, -0.658447265625, -0.61328125, -0.568115234375, -0.52294921875, -0.477783203125, -0.4326171875, -0.387451171875, -0.34228515625, -0.297119140625, -0.251953125, -0.206787109375, -0.16162109375, -0.116455078125, -0.0712890625, -0.026123046875, 0.01904296875, 0.064208984375, 0.109375, 0.154541015625, 0.19970703125, 0.244873046875, 0.2900390625, 0.335205078125, 0.38037109375, 0.425537109375, 0.470703125, 0.515869140625, 0.56103515625, 0.606201171875, 0.6513671875, 0.696533203125, 0.74169921875, 0.786865234375, 0.83203125, 0.877197265625, 0.92236328125, 0.967529296875, 1.0126953125, 1.057861328125, 1.10302734375, 1.148193359375, 1.193359375, 1.238525390625, 1.28369140625, 1.328857421875, 1.3740234375, 1.419189453125, 1.46435546875, 1.509521484375, 1.5546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 0.0, 4.0, 4.0, 12.0, 13.0, 16.0, 25.0, 38.0, 25.0, 46.0, 55.0, 84.0, 66.0, 71.0, 81.0, 85.0, 72.0, 70.0, 51.0, 51.0, 26.0, 24.0, 29.0, 12.0, 10.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.115436553955078e-05, -5.862768739461899e-05, -5.6101009249687195e-05, -5.35743311047554e-05, -5.104765295982361e-05, -4.8520974814891815e-05, -4.599429666996002e-05, -4.346761852502823e-05, -4.0940940380096436e-05, -3.841426223516464e-05, -3.588758409023285e-05, -3.3360905945301056e-05, -3.083422780036926e-05, -2.830754965543747e-05, -2.5780871510505676e-05, -2.3254193365573883e-05, -2.072751522064209e-05, -1.8200837075710297e-05, -1.5674158930778503e-05, -1.314748078584671e-05, -1.0620802640914917e-05, -8.094124495983124e-06, -5.5674463510513306e-06, -3.0407682061195374e-06, -5.140900611877441e-07, 2.012588083744049e-06, 4.539266228675842e-06, 7.0659443736076355e-06, 9.592622518539429e-06, 1.2119300663471222e-05, 1.4645978808403015e-05, 1.717265695333481e-05, 1.96993350982666e-05, 2.2226013243198395e-05, 2.4752691388130188e-05, 2.727936953306198e-05, 2.9806047677993774e-05, 3.233272582292557e-05, 3.485940396785736e-05, 3.7386082112789154e-05, 3.991276025772095e-05, 4.243943840265274e-05, 4.4966116547584534e-05, 4.749279469251633e-05, 5.001947283744812e-05, 5.254615098237991e-05, 5.5072829127311707e-05, 5.75995072722435e-05, 6.012618541717529e-05, 6.265286356210709e-05, 6.517954170703888e-05, 6.770621985197067e-05, 7.023289799690247e-05, 7.275957614183426e-05, 7.528625428676605e-05, 7.781293243169785e-05, 8.033961057662964e-05, 8.286628872156143e-05, 8.539296686649323e-05, 8.791964501142502e-05, 9.044632315635681e-05, 9.29730013012886e-05, 9.54996794462204e-05, 9.802635759115219e-05, 0.00010055303573608398]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 15.0, 20.0, 24.0, 30.0, 65.0, 104.0, 180.0, 313.0, 555.0, 880.0, 1609.0, 2770.0, 5202.0, 10626.0, 22395.0, 49745.0, 114703.0, 237027.0, 288863.0, 171968.0, 76332.0, 33402.0, 15474.0, 7509.0, 3898.0, 2003.0, 1206.0, 676.0, 365.0, 247.0, 137.0, 73.0, 45.0, 27.0, 20.0, 14.0, 11.0, 11.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6064453125, -1.556640625, -1.5068359375, -1.45703125, -1.4072265625, -1.357421875, -1.3076171875, -1.2578125, -1.2080078125, -1.158203125, -1.1083984375, -1.05859375, -1.0087890625, -0.958984375, -0.9091796875, -0.859375, -0.8095703125, -0.759765625, -0.7099609375, -0.66015625, -0.6103515625, -0.560546875, -0.5107421875, -0.4609375, -0.4111328125, -0.361328125, -0.3115234375, -0.26171875, -0.2119140625, -0.162109375, -0.1123046875, -0.0625, -0.0126953125, 0.037109375, 0.0869140625, 0.13671875, 0.1865234375, 0.236328125, 0.2861328125, 0.3359375, 0.3857421875, 0.435546875, 0.4853515625, 0.53515625, 0.5849609375, 0.634765625, 0.6845703125, 0.734375, 0.7841796875, 0.833984375, 0.8837890625, 0.93359375, 0.9833984375, 1.033203125, 1.0830078125, 1.1328125, 1.1826171875, 1.232421875, 1.2822265625, 1.33203125, 1.3818359375, 1.431640625, 1.4814453125, 1.53125, 1.5810546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 2.0, 3.0, 3.0, 10.0, 11.0, 8.0, 12.0, 10.0, 16.0, 23.0, 26.0, 31.0, 28.0, 37.0, 31.0, 48.0, 62.0, 53.0, 78.0, 60.0, 67.0, 40.0, 47.0, 49.0, 47.0, 33.0, 36.0, 17.0, 21.0, 18.0, 14.0, 8.0, 13.0, 6.0, 3.0, 5.0, 6.0, 5.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3701171875, -0.3580360412597656, -0.34595489501953125, -0.3338737487792969, -0.3217926025390625, -0.3097114562988281, -0.29763031005859375, -0.2855491638183594, -0.273468017578125, -0.2613868713378906, -0.24930572509765625, -0.23722457885742188, -0.2251434326171875, -0.21306228637695312, -0.20098114013671875, -0.18889999389648438, -0.17681884765625, -0.16473770141601562, -0.15265655517578125, -0.14057540893554688, -0.1284942626953125, -0.11641311645507812, -0.10433197021484375, -0.09225082397460938, -0.080169677734375, -0.06808853149414062, -0.05600738525390625, -0.043926239013671875, -0.0318450927734375, -0.019763946533203125, -0.00768280029296875, 0.004398345947265625, 0.0164794921875, 0.028560638427734375, 0.04064178466796875, 0.052722930908203125, 0.0648040771484375, 0.07688522338867188, 0.08896636962890625, 0.10104751586914062, 0.113128662109375, 0.12520980834960938, 0.13729095458984375, 0.14937210083007812, 0.1614532470703125, 0.17353439331054688, 0.18561553955078125, 0.19769668579101562, 0.20977783203125, 0.22185897827148438, 0.23394012451171875, 0.24602127075195312, 0.2581024169921875, 0.2701835632324219, 0.28226470947265625, 0.2943458557128906, 0.306427001953125, 0.3185081481933594, 0.33058929443359375, 0.3426704406738281, 0.3547515869140625, 0.3668327331542969, 0.37891387939453125, 0.3909950256347656, 0.403076171875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 11.0, 6.0, 8.0, 26.0, 30.0, 48.0, 63.0, 112.0, 167.0, 137.0, 129.0, 95.0, 45.0, 50.0, 29.0, 12.0, 10.0, 13.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.687089920043945, -20.13101577758789, -19.57494354248047, -19.018869400024414, -18.462797164916992, -17.906723022460938, -17.350650787353516, -16.79457664489746, -16.238502502441406, -15.682429313659668, -15.12635612487793, -14.570282936096191, -14.014209747314453, -13.458135604858398, -12.90206241607666, -12.345989227294922, -11.7899169921875, -11.233843803405762, -10.677770614624023, -10.121697425842285, -9.565624237060547, -9.009550094604492, -8.453476905822754, -7.897403717041016, -7.341330528259277, -6.785257339477539, -6.229184150695801, -5.673110485076904, -5.117037296295166, -4.560964107513428, -4.004890441894531, -3.448817253112793, -2.892742156982422, -2.3366689682006836, -1.7805955410003662, -1.2245222330093384, -0.6684489250183105, -0.11237573623657227, 0.4436976909637451, 0.9997711181640625, 1.5558443069458008, 2.111917495727539, 2.6679909229278564, 3.224064350128174, 3.780137538909912, 4.33621072769165, 4.892284393310547, 5.448357582092285, 6.004430770874023, 6.560503959655762, 7.1165771484375, 7.6726508140563965, 8.228723526000977, 8.784797668457031, 9.34087085723877, 9.896944046020508, 10.453017234802246, 11.009090423583984, 11.565163612365723, 12.121236801147461, 12.677310943603516, 13.233383178710938, 13.789457321166992, 14.34553050994873, 14.901603698730469]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 10.0, 3.0, 10.0, 17.0, 10.0, 19.0, 13.0, 11.0, 27.0, 31.0, 32.0, 38.0, 42.0, 49.0, 44.0, 50.0, 44.0, 47.0, 44.0, 42.0, 47.0, 41.0, 44.0, 39.0, 36.0, 26.0, 23.0, 18.0, 28.0, 14.0, 19.0, 12.0, 15.0, 4.0, 13.0, 12.0, 2.0, 3.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.409811973571777, -5.231508255004883, -5.053204536437988, -4.874900817871094, -4.696597099304199, -4.518293380737305, -4.33998966217041, -4.161685943603516, -3.983381986618042, -3.8050782680511475, -3.626774549484253, -3.4484705924987793, -3.2701668739318848, -3.0918631553649902, -2.9135594367980957, -2.735255718231201, -2.5569519996643066, -2.378648281097412, -2.2003445625305176, -2.022040843963623, -1.843737006187439, -1.6654332876205444, -1.4871294498443604, -1.3088257312774658, -1.1305220127105713, -0.9522182941436768, -0.7739145159721375, -0.5956107378005981, -0.4173070192337036, -0.23900330066680908, -0.060699462890625, 0.11760425567626953, 0.29590845108032227, 0.4742121994495392, 0.6525159478187561, 0.8308197259902954, 1.00912344455719, 1.1874271631240845, 1.3657310009002686, 1.544034719467163, 1.7223384380340576, 1.9006421566009521, 2.0789458751678467, 2.2572498321533203, 2.435553550720215, 2.6138572692871094, 2.792160987854004, 2.9704647064208984, 3.148768424987793, 3.3270721435546875, 3.505375862121582, 3.6836795806884766, 3.861983299255371, 4.040287017822266, 4.21859073638916, 4.396894454956055, 4.575198173522949, 4.753501892089844, 4.931805610656738, 5.110109329223633, 5.288413047790527, 5.466716766357422, 5.645020484924316, 5.823324203491211, 6.001628398895264]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 9.0, 10.0, 27.0, 16.0, 37.0, 47.0, 69.0, 116.0, 149.0, 195.0, 344.0, 504.0, 826.0, 1237.0, 2005.0, 3076.0, 5054.0, 8207.0, 14395.0, 25203.0, 46073.0, 85212.0, 146706.0, 204086.0, 196716.0, 135226.0, 76079.0, 40931.0, 22587.0, 12909.0, 7688.0, 4727.0, 2882.0, 1775.0, 1192.0, 730.0, 511.0, 285.0, 227.0, 171.0, 116.0, 69.0, 31.0, 27.0, 26.0, 12.0, 14.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.73785400390625, -5.5460205078125, -5.35418701171875, -5.162353515625, -4.97052001953125, -4.7786865234375, -4.58685302734375, -4.39501953125, -4.20318603515625, -4.0113525390625, -3.81951904296875, -3.627685546875, -3.43585205078125, -3.2440185546875, -3.05218505859375, -2.8603515625, -2.66851806640625, -2.4766845703125, -2.28485107421875, -2.093017578125, -1.90118408203125, -1.7093505859375, -1.51751708984375, -1.32568359375, -1.13385009765625, -0.9420166015625, -0.75018310546875, -0.558349609375, -0.36651611328125, -0.1746826171875, 0.01715087890625, 0.208984375, 0.40081787109375, 0.5926513671875, 0.78448486328125, 0.976318359375, 1.16815185546875, 1.3599853515625, 1.55181884765625, 1.74365234375, 1.93548583984375, 2.1273193359375, 2.31915283203125, 2.510986328125, 2.70281982421875, 2.8946533203125, 3.08648681640625, 3.2783203125, 3.47015380859375, 3.6619873046875, 3.85382080078125, 4.045654296875, 4.23748779296875, 4.4293212890625, 4.62115478515625, 4.81298828125, 5.00482177734375, 5.1966552734375, 5.38848876953125, 5.580322265625, 5.77215576171875, 5.9639892578125, 6.15582275390625, 6.34765625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 7.0, 9.0, 9.0, 10.0, 5.0, 10.0, 18.0, 25.0, 30.0, 28.0, 38.0, 28.0, 43.0, 45.0, 34.0, 61.0, 52.0, 52.0, 52.0, 47.0, 43.0, 31.0, 49.0, 35.0, 36.0, 16.0, 22.0, 29.0, 17.0, 20.0, 15.0, 14.0, 6.0, 10.0, 9.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.74609375, -5.54779052734375, -5.3494873046875, -5.15118408203125, -4.952880859375, -4.75457763671875, -4.5562744140625, -4.35797119140625, -4.15966796875, -3.96136474609375, -3.7630615234375, -3.56475830078125, -3.366455078125, -3.16815185546875, -2.9698486328125, -2.77154541015625, -2.5732421875, -2.37493896484375, -2.1766357421875, -1.97833251953125, -1.780029296875, -1.58172607421875, -1.3834228515625, -1.18511962890625, -0.98681640625, -0.78851318359375, -0.5902099609375, -0.39190673828125, -0.193603515625, 0.00469970703125, 0.2030029296875, 0.40130615234375, 0.599609375, 0.79791259765625, 0.9962158203125, 1.19451904296875, 1.392822265625, 1.59112548828125, 1.7894287109375, 1.98773193359375, 2.18603515625, 2.38433837890625, 2.5826416015625, 2.78094482421875, 2.979248046875, 3.17755126953125, 3.3758544921875, 3.57415771484375, 3.7724609375, 3.97076416015625, 4.1690673828125, 4.36737060546875, 4.565673828125, 4.76397705078125, 4.9622802734375, 5.16058349609375, 5.35888671875, 5.55718994140625, 5.7554931640625, 5.95379638671875, 6.152099609375, 6.35040283203125, 6.5487060546875, 6.74700927734375, 6.9453125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 9.0, 9.0, 19.0, 28.0, 33.0, 60.0, 79.0, 124.0, 224.0, 346.0, 518.0, 774.0, 1294.0, 2080.0, 3532.0, 5756.0, 9737.0, 16360.0, 27774.0, 48325.0, 81047.0, 126411.0, 171101.0, 178320.0, 142424.0, 93766.0, 56983.0, 33313.0, 19427.0, 11281.0, 6768.0, 3997.0, 2496.0, 1498.0, 967.0, 601.0, 381.0, 254.0, 139.0, 90.0, 75.0, 50.0, 31.0, 16.0, 14.0, 3.0, 11.0, 10.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.765625, -4.59637451171875, -4.4271240234375, -4.25787353515625, -4.088623046875, -3.91937255859375, -3.7501220703125, -3.58087158203125, -3.41162109375, -3.24237060546875, -3.0731201171875, -2.90386962890625, -2.734619140625, -2.56536865234375, -2.3961181640625, -2.22686767578125, -2.0576171875, -1.88836669921875, -1.7191162109375, -1.54986572265625, -1.380615234375, -1.21136474609375, -1.0421142578125, -0.87286376953125, -0.70361328125, -0.53436279296875, -0.3651123046875, -0.19586181640625, -0.026611328125, 0.14263916015625, 0.3118896484375, 0.48114013671875, 0.650390625, 0.81964111328125, 0.9888916015625, 1.15814208984375, 1.327392578125, 1.49664306640625, 1.6658935546875, 1.83514404296875, 2.00439453125, 2.17364501953125, 2.3428955078125, 2.51214599609375, 2.681396484375, 2.85064697265625, 3.0198974609375, 3.18914794921875, 3.3583984375, 3.52764892578125, 3.6968994140625, 3.86614990234375, 4.035400390625, 4.20465087890625, 4.3739013671875, 4.54315185546875, 4.71240234375, 4.88165283203125, 5.0509033203125, 5.22015380859375, 5.389404296875, 5.55865478515625, 5.7279052734375, 5.89715576171875, 6.06640625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 10.0, 7.0, 14.0, 12.0, 14.0, 18.0, 8.0, 18.0, 18.0, 37.0, 34.0, 34.0, 38.0, 33.0, 42.0, 40.0, 39.0, 28.0, 39.0, 35.0, 39.0, 25.0, 41.0, 39.0, 46.0, 35.0, 24.0, 35.0, 29.0, 21.0, 13.0, 13.0, 21.0, 18.0, 16.0, 11.0, 16.0, 7.0, 3.0, 11.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.537109375, -3.431396484375, -3.32568359375, -3.219970703125, -3.1142578125, -3.008544921875, -2.90283203125, -2.797119140625, -2.69140625, -2.585693359375, -2.47998046875, -2.374267578125, -2.2685546875, -2.162841796875, -2.05712890625, -1.951416015625, -1.845703125, -1.739990234375, -1.63427734375, -1.528564453125, -1.4228515625, -1.317138671875, -1.21142578125, -1.105712890625, -1.0, -0.894287109375, -0.78857421875, -0.682861328125, -0.5771484375, -0.471435546875, -0.36572265625, -0.260009765625, -0.154296875, -0.048583984375, 0.05712890625, 0.162841796875, 0.2685546875, 0.374267578125, 0.47998046875, 0.585693359375, 0.69140625, 0.797119140625, 0.90283203125, 1.008544921875, 1.1142578125, 1.219970703125, 1.32568359375, 1.431396484375, 1.537109375, 1.642822265625, 1.74853515625, 1.854248046875, 1.9599609375, 2.065673828125, 2.17138671875, 2.277099609375, 2.3828125, 2.488525390625, 2.59423828125, 2.699951171875, 2.8056640625, 2.911376953125, 3.01708984375, 3.122802734375, 3.228515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 10.0, 12.0, 28.0, 46.0, 83.0, 128.0, 238.0, 399.0, 713.0, 1317.0, 2390.0, 4660.0, 9410.0, 19544.0, 43760.0, 100926.0, 215071.0, 292830.0, 195306.0, 88075.0, 38699.0, 17423.0, 8375.0, 4181.0, 2158.0, 1262.0, 637.0, 366.0, 203.0, 124.0, 78.0, 40.0, 15.0, 16.0, 12.0, 7.0, 4.0, 0.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.826171875, -3.70440673828125, -3.5826416015625, -3.46087646484375, -3.339111328125, -3.21734619140625, -3.0955810546875, -2.97381591796875, -2.85205078125, -2.73028564453125, -2.6085205078125, -2.48675537109375, -2.364990234375, -2.24322509765625, -2.1214599609375, -1.99969482421875, -1.8779296875, -1.75616455078125, -1.6343994140625, -1.51263427734375, -1.390869140625, -1.26910400390625, -1.1473388671875, -1.02557373046875, -0.90380859375, -0.78204345703125, -0.6602783203125, -0.53851318359375, -0.416748046875, -0.29498291015625, -0.1732177734375, -0.05145263671875, 0.0703125, 0.19207763671875, 0.3138427734375, 0.43560791015625, 0.557373046875, 0.67913818359375, 0.8009033203125, 0.92266845703125, 1.04443359375, 1.16619873046875, 1.2879638671875, 1.40972900390625, 1.531494140625, 1.65325927734375, 1.7750244140625, 1.89678955078125, 2.0185546875, 2.14031982421875, 2.2620849609375, 2.38385009765625, 2.505615234375, 2.62738037109375, 2.7491455078125, 2.87091064453125, 2.99267578125, 3.11444091796875, 3.2362060546875, 3.35797119140625, 3.479736328125, 3.60150146484375, 3.7232666015625, 3.84503173828125, 3.966796875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 3.0, 11.0, 13.0, 17.0, 22.0, 25.0, 39.0, 55.0, 74.0, 84.0, 107.0, 93.0, 98.0, 76.0, 71.0, 58.0, 39.0, 36.0, 18.0, 13.0, 17.0, 11.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000308990478515625, -0.0002985522150993347, -0.00028811395168304443, -0.00027767568826675415, -0.00026723742485046387, -0.0002567991614341736, -0.0002463608980178833, -0.00023592263460159302, -0.00022548437118530273, -0.00021504610776901245, -0.00020460784435272217, -0.00019416958093643188, -0.0001837313175201416, -0.00017329305410385132, -0.00016285479068756104, -0.00015241652727127075, -0.00014197826385498047, -0.00013154000043869019, -0.0001211017370223999, -0.00011066347360610962, -0.00010022521018981934, -8.978694677352905e-05, -7.934868335723877e-05, -6.891041994094849e-05, -5.84721565246582e-05, -4.803389310836792e-05, -3.759562969207764e-05, -2.7157366275787354e-05, -1.671910285949707e-05, -6.280839443206787e-06, 4.157423973083496e-06, 1.459568738937378e-05, 2.5033950805664062e-05, 3.5472214221954346e-05, 4.591047763824463e-05, 5.634874105453491e-05, 6.67870044708252e-05, 7.722526788711548e-05, 8.766353130340576e-05, 9.810179471969604e-05, 0.00010854005813598633, 0.00011897832155227661, 0.0001294165849685669, 0.00013985484838485718, 0.00015029311180114746, 0.00016073137521743774, 0.00017116963863372803, 0.0001816079020500183, 0.0001920461654663086, 0.00020248442888259888, 0.00021292269229888916, 0.00022336095571517944, 0.00023379921913146973, 0.00024423748254776, 0.0002546757459640503, 0.0002651140093803406, 0.00027555227279663086, 0.00028599053621292114, 0.0002964287996292114, 0.0003068670630455017, 0.000317305326461792, 0.0003277435898780823, 0.00033818185329437256, 0.00034862011671066284, 0.0003590583801269531]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 8.0, 11.0, 17.0, 32.0, 50.0, 59.0, 111.0, 166.0, 292.0, 458.0, 869.0, 1553.0, 2765.0, 5329.0, 10905.0, 23021.0, 51293.0, 113212.0, 220454.0, 273010.0, 182596.0, 87322.0, 39039.0, 17839.0, 8530.0, 4385.0, 2241.0, 1249.0, 670.0, 389.0, 236.0, 165.0, 86.0, 55.0, 42.0, 30.0, 27.0, 12.0, 8.0, 6.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.685546875, -3.574981689453125, -3.46441650390625, -3.353851318359375, -3.2432861328125, -3.132720947265625, -3.02215576171875, -2.911590576171875, -2.801025390625, -2.690460205078125, -2.57989501953125, -2.469329833984375, -2.3587646484375, -2.248199462890625, -2.13763427734375, -2.027069091796875, -1.91650390625, -1.805938720703125, -1.69537353515625, -1.584808349609375, -1.4742431640625, -1.363677978515625, -1.25311279296875, -1.142547607421875, -1.031982421875, -0.921417236328125, -0.81085205078125, -0.700286865234375, -0.5897216796875, -0.479156494140625, -0.36859130859375, -0.258026123046875, -0.1474609375, -0.036895751953125, 0.07366943359375, 0.184234619140625, 0.2947998046875, 0.405364990234375, 0.51593017578125, 0.626495361328125, 0.737060546875, 0.847625732421875, 0.95819091796875, 1.068756103515625, 1.1793212890625, 1.289886474609375, 1.40045166015625, 1.511016845703125, 1.62158203125, 1.732147216796875, 1.84271240234375, 1.953277587890625, 2.0638427734375, 2.174407958984375, 2.28497314453125, 2.395538330078125, 2.506103515625, 2.616668701171875, 2.72723388671875, 2.837799072265625, 2.9483642578125, 3.058929443359375, 3.16949462890625, 3.280059814453125, 3.390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 3.0, 8.0, 10.0, 11.0, 11.0, 18.0, 17.0, 29.0, 26.0, 25.0, 45.0, 42.0, 44.0, 53.0, 60.0, 68.0, 57.0, 59.0, 55.0, 55.0, 63.0, 41.0, 28.0, 30.0, 36.0, 12.0, 25.0, 16.0, 9.0, 9.0, 11.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6720123291015625, -0.646270751953125, -0.6205291748046875, -0.59478759765625, -0.5690460205078125, -0.543304443359375, -0.5175628662109375, -0.4918212890625, -0.4660797119140625, -0.440338134765625, -0.4145965576171875, -0.38885498046875, -0.3631134033203125, -0.337371826171875, -0.3116302490234375, -0.285888671875, -0.2601470947265625, -0.234405517578125, -0.2086639404296875, -0.18292236328125, -0.1571807861328125, -0.131439208984375, -0.1056976318359375, -0.0799560546875, -0.0542144775390625, -0.028472900390625, -0.0027313232421875, 0.02301025390625, 0.0487518310546875, 0.074493408203125, 0.1002349853515625, 0.1259765625, 0.1517181396484375, 0.177459716796875, 0.2032012939453125, 0.22894287109375, 0.2546844482421875, 0.280426025390625, 0.3061676025390625, 0.3319091796875, 0.3576507568359375, 0.383392333984375, 0.4091339111328125, 0.43487548828125, 0.4606170654296875, 0.486358642578125, 0.5121002197265625, 0.537841796875, 0.5635833740234375, 0.589324951171875, 0.6150665283203125, 0.64080810546875, 0.6665496826171875, 0.692291259765625, 0.7180328369140625, 0.7437744140625, 0.7695159912109375, 0.795257568359375, 0.8209991455078125, 0.84674072265625, 0.8724822998046875, 0.898223876953125, 0.9239654541015625, 0.94970703125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 10.0, 12.0, 27.0, 35.0, 46.0, 81.0, 121.0, 160.0, 137.0, 113.0, 93.0, 53.0, 41.0, 16.0, 17.0, 16.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.06598472595215, -19.508255004882812, -18.950525283813477, -18.39279556274414, -17.835065841674805, -17.27733612060547, -16.719606399536133, -16.161876678466797, -15.604147911071777, -15.046418190002441, -14.488688468933105, -13.93095874786377, -13.37322998046875, -12.815500259399414, -12.257770538330078, -11.700040817260742, -11.142311096191406, -10.58458137512207, -10.026851654052734, -9.469121932983398, -8.911392211914062, -8.353662490844727, -7.795933723449707, -7.238204002380371, -6.680474281311035, -6.122744560241699, -5.565014839172363, -5.0072855949401855, -4.44955587387085, -3.8918261528015137, -3.334096670150757, -2.7763671875, -2.2186365127563477, -1.6609069108963013, -1.1031773090362549, -0.5454477071762085, 0.01228189468383789, 0.5700116157531738, 1.1277410984039307, 1.6854705810546875, 2.2432003021240234, 2.8009300231933594, 3.358659505844116, 3.916388988494873, 4.474118709564209, 5.031848430633545, 5.589577674865723, 6.147307395935059, 6.7050371170043945, 7.2627668380737305, 7.820496559143066, 8.378226280212402, 8.935955047607422, 9.493684768676758, 10.051414489746094, 10.60914421081543, 11.166873931884766, 11.724603652954102, 12.282333374023438, 12.840063095092773, 13.39779281616211, 13.955522537231445, 14.513251304626465, 15.0709810256958, 15.628710746765137]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 10.0, 8.0, 12.0, 18.0, 13.0, 17.0, 19.0, 25.0, 44.0, 34.0, 33.0, 35.0, 48.0, 56.0, 55.0, 44.0, 43.0, 51.0, 44.0, 55.0, 36.0, 38.0, 33.0, 35.0, 26.0, 26.0, 18.0, 17.0, 15.0, 21.0, 12.0, 14.0, 5.0, 9.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.087007522583008, -5.894461631774902, -5.701915740966797, -5.509369850158691, -5.316823959350586, -5.1242780685424805, -4.931732177734375, -4.7391862869262695, -4.546640396118164, -4.354094505310059, -4.161548614501953, -3.9690027236938477, -3.776456832885742, -3.5839109420776367, -3.3913652896881104, -3.198819398880005, -3.0062737464904785, -2.813727855682373, -2.6211819648742676, -2.428636074066162, -2.2360901832580566, -2.043544292449951, -1.8509986400604248, -1.6584527492523193, -1.4659068584442139, -1.2733609676361084, -1.080815076828003, -0.888269305229187, -0.6957234144210815, -0.5031775236129761, -0.31063175201416016, -0.11808586120605469, 0.07445955276489258, 0.26700541377067566, 0.45955127477645874, 0.6520971059799194, 0.8446429967880249, 1.0371888875961304, 1.2297346591949463, 1.4222805500030518, 1.6148264408111572, 1.8073723316192627, 1.9999182224273682, 2.1924638748168945, 2.385009765625, 2.5775556564331055, 2.770101547241211, 2.9626474380493164, 3.155193328857422, 3.3477392196655273, 3.540285110473633, 3.7328310012817383, 3.9253768920898438, 4.117922782897949, 4.310468673706055, 4.50301456451416, 4.695560455322266, 4.888106346130371, 5.080652236938477, 5.273198127746582, 5.4657440185546875, 5.658289909362793, 5.850835800170898, 6.043381690979004, 6.235927104949951]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 8.0, 19.0, 22.0, 36.0, 50.0, 65.0, 125.0, 191.0, 306.0, 487.0, 831.0, 1352.0, 2463.0, 4417.0, 8154.0, 16809.0, 40339.0, 126505.0, 552500.0, 1868822.0, 1190665.0, 255359.0, 69516.0, 26788.0, 12748.0, 6750.0, 3629.0, 2159.0, 1225.0, 767.0, 423.0, 244.0, 197.0, 111.0, 60.0, 49.0, 31.0, 28.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.6171875, -14.1710205078125, -13.724853515625, -13.2786865234375, -12.83251953125, -12.3863525390625, -11.940185546875, -11.4940185546875, -11.0478515625, -10.6016845703125, -10.155517578125, -9.7093505859375, -9.26318359375, -8.8170166015625, -8.370849609375, -7.9246826171875, -7.478515625, -7.0323486328125, -6.586181640625, -6.1400146484375, -5.69384765625, -5.2476806640625, -4.801513671875, -4.3553466796875, -3.9091796875, -3.4630126953125, -3.016845703125, -2.5706787109375, -2.12451171875, -1.6783447265625, -1.232177734375, -0.7860107421875, -0.33984375, 0.1063232421875, 0.552490234375, 0.9986572265625, 1.44482421875, 1.8909912109375, 2.337158203125, 2.7833251953125, 3.2294921875, 3.6756591796875, 4.121826171875, 4.5679931640625, 5.01416015625, 5.4603271484375, 5.906494140625, 6.3526611328125, 6.798828125, 7.2449951171875, 7.691162109375, 8.1373291015625, 8.58349609375, 9.0296630859375, 9.475830078125, 9.9219970703125, 10.3681640625, 10.8143310546875, 11.260498046875, 11.7066650390625, 12.15283203125, 12.5989990234375, 13.045166015625, 13.4913330078125, 13.9375]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 8.0, 0.0, 6.0, 8.0, 5.0, 17.0, 9.0, 14.0, 21.0, 18.0, 26.0, 32.0, 40.0, 37.0, 35.0, 43.0, 53.0, 41.0, 49.0, 50.0, 59.0, 46.0, 40.0, 38.0, 41.0, 41.0, 34.0, 34.0, 32.0, 20.0, 20.0, 16.0, 9.0, 14.0, 15.0, 11.0, 5.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.8828125, -4.735107421875, -4.58740234375, -4.439697265625, -4.2919921875, -4.144287109375, -3.99658203125, -3.848876953125, -3.701171875, -3.553466796875, -3.40576171875, -3.258056640625, -3.1103515625, -2.962646484375, -2.81494140625, -2.667236328125, -2.51953125, -2.371826171875, -2.22412109375, -2.076416015625, -1.9287109375, -1.781005859375, -1.63330078125, -1.485595703125, -1.337890625, -1.190185546875, -1.04248046875, -0.894775390625, -0.7470703125, -0.599365234375, -0.45166015625, -0.303955078125, -0.15625, -0.008544921875, 0.13916015625, 0.286865234375, 0.4345703125, 0.582275390625, 0.72998046875, 0.877685546875, 1.025390625, 1.173095703125, 1.32080078125, 1.468505859375, 1.6162109375, 1.763916015625, 1.91162109375, 2.059326171875, 2.20703125, 2.354736328125, 2.50244140625, 2.650146484375, 2.7978515625, 2.945556640625, 3.09326171875, 3.240966796875, 3.388671875, 3.536376953125, 3.68408203125, 3.831787109375, 3.9794921875, 4.127197265625, 4.27490234375, 4.422607421875, 4.5703125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 0.0, 5.0, 8.0, 10.0, 5.0, 19.0, 26.0, 32.0, 44.0, 77.0, 135.0, 218.0, 311.0, 474.0, 710.0, 1033.0, 1695.0, 2512.0, 3875.0, 6205.0, 9902.0, 16566.0, 29506.0, 57571.0, 127713.0, 327277.0, 862588.0, 1385073.0, 809094.0, 304184.0, 120422.0, 55681.0, 28796.0, 15986.0, 9655.0, 5914.0, 3810.0, 2508.0, 1600.0, 1109.0, 674.0, 426.0, 283.0, 184.0, 122.0, 92.0, 52.0, 33.0, 25.0, 23.0, 8.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.3515625, -10.0225830078125, -9.693603515625, -9.3646240234375, -9.03564453125, -8.7066650390625, -8.377685546875, -8.0487060546875, -7.7197265625, -7.3907470703125, -7.061767578125, -6.7327880859375, -6.40380859375, -6.0748291015625, -5.745849609375, -5.4168701171875, -5.087890625, -4.7589111328125, -4.429931640625, -4.1009521484375, -3.77197265625, -3.4429931640625, -3.114013671875, -2.7850341796875, -2.4560546875, -2.1270751953125, -1.798095703125, -1.4691162109375, -1.14013671875, -0.8111572265625, -0.482177734375, -0.1531982421875, 0.17578125, 0.5047607421875, 0.833740234375, 1.1627197265625, 1.49169921875, 1.8206787109375, 2.149658203125, 2.4786376953125, 2.8076171875, 3.1365966796875, 3.465576171875, 3.7945556640625, 4.12353515625, 4.4525146484375, 4.781494140625, 5.1104736328125, 5.439453125, 5.7684326171875, 6.097412109375, 6.4263916015625, 6.75537109375, 7.0843505859375, 7.413330078125, 7.7423095703125, 8.0712890625, 8.4002685546875, 8.729248046875, 9.0582275390625, 9.38720703125, 9.7161865234375, 10.045166015625, 10.3741455078125, 10.703125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 19.0, 18.0, 20.0, 28.0, 25.0, 35.0, 65.0, 77.0, 103.0, 152.0, 203.0, 225.0, 288.0, 326.0, 363.0, 374.0, 351.0, 310.0, 232.0, 188.0, 156.0, 119.0, 83.0, 61.0, 58.0, 36.0, 31.0, 27.0, 21.0, 13.0, 12.0, 14.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.994140625, -2.89825439453125, -2.8023681640625, -2.70648193359375, -2.610595703125, -2.51470947265625, -2.4188232421875, -2.32293701171875, -2.22705078125, -2.13116455078125, -2.0352783203125, -1.93939208984375, -1.843505859375, -1.74761962890625, -1.6517333984375, -1.55584716796875, -1.4599609375, -1.36407470703125, -1.2681884765625, -1.17230224609375, -1.076416015625, -0.98052978515625, -0.8846435546875, -0.78875732421875, -0.69287109375, -0.59698486328125, -0.5010986328125, -0.40521240234375, -0.309326171875, -0.21343994140625, -0.1175537109375, -0.02166748046875, 0.07421875, 0.17010498046875, 0.2659912109375, 0.36187744140625, 0.457763671875, 0.55364990234375, 0.6495361328125, 0.74542236328125, 0.84130859375, 0.93719482421875, 1.0330810546875, 1.12896728515625, 1.224853515625, 1.32073974609375, 1.4166259765625, 1.51251220703125, 1.6083984375, 1.70428466796875, 1.8001708984375, 1.89605712890625, 1.991943359375, 2.08782958984375, 2.1837158203125, 2.27960205078125, 2.37548828125, 2.47137451171875, 2.5672607421875, 2.66314697265625, 2.759033203125, 2.85491943359375, 2.9508056640625, 3.04669189453125, 3.142578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 8.0, 11.0, 8.0, 16.0, 25.0, 18.0, 45.0, 59.0, 86.0, 102.0, 112.0, 99.0, 85.0, 87.0, 58.0, 47.0, 38.0, 24.0, 14.0, 12.0, 8.0, 10.0, 7.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.78668975830078, -16.36717987060547, -15.947669982910156, -15.528160095214844, -15.108650207519531, -14.689140319824219, -14.269630432128906, -13.850119590759277, -13.430609703063965, -13.011099815368652, -12.59158992767334, -12.172080039978027, -11.752570152282715, -11.333059310913086, -10.913549423217773, -10.494039535522461, -10.074529647827148, -9.655019760131836, -9.235509872436523, -8.815999984741211, -8.396490097045898, -7.976979732513428, -7.557469844818115, -7.1379594802856445, -6.718450546264648, -6.298940658569336, -5.879430770874023, -5.459920883178711, -5.04041051864624, -4.620900630950928, -4.201390743255615, -3.7818806171417236, -3.362370491027832, -2.9428606033325195, -2.523350477218628, -2.1038405895233154, -1.6843305826187134, -1.2648205757141113, -0.8453106880187988, -0.4258005619049072, -0.0062906742095947266, 0.41321930289268494, 0.8327292799949646, 1.2522392272949219, 1.671749234199524, 2.091259241104126, 2.5107691287994385, 2.93027925491333, 3.3497891426086426, 3.769299030303955, 4.188808917999268, 4.608319282531738, 5.027829170227051, 5.447339057922363, 5.866848945617676, 6.286358833312988, 6.705868721008301, 7.125378608703613, 7.544888496398926, 7.964398384094238, 8.38390827178955, 8.80341911315918, 9.222929000854492, 9.642438888549805, 10.061948776245117]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 5.0, 8.0, 8.0, 9.0, 10.0, 9.0, 15.0, 12.0, 13.0, 12.0, 20.0, 31.0, 29.0, 33.0, 45.0, 54.0, 48.0, 57.0, 32.0, 53.0, 43.0, 43.0, 36.0, 54.0, 36.0, 18.0, 39.0, 27.0, 19.0, 19.0, 23.0, 22.0, 24.0, 12.0, 21.0, 10.0, 8.0, 7.0, 7.0, 7.0, 8.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-5.5707597732543945, -5.3931732177734375, -5.2155866622924805, -5.037999629974365, -4.860413074493408, -4.682826519012451, -4.505239486694336, -4.327652931213379, -4.150066375732422, -3.972479820251465, -3.7948930263519287, -3.6173062324523926, -3.4397196769714355, -3.2621331214904785, -3.0845463275909424, -2.9069595336914062, -2.729372978210449, -2.551786422729492, -2.374199628829956, -2.19661283493042, -2.019026279449463, -1.8414396047592163, -1.6638529300689697, -1.4862662553787231, -1.3086795806884766, -1.13109290599823, -0.9535062313079834, -0.7759195566177368, -0.5983328819274902, -0.42074620723724365, -0.24315953254699707, -0.06557285785675049, 0.11201333999633789, 0.2896000146865845, 0.46718668937683105, 0.6447733640670776, 0.8223600387573242, 0.9999467134475708, 1.1775333881378174, 1.355120062828064, 1.5327067375183105, 1.7102934122085571, 1.8878800868988037, 2.06546688079834, 2.243053436279297, 2.420639991760254, 2.59822678565979, 2.775813579559326, 2.953400135040283, 3.1309866905212402, 3.3085734844207764, 3.4861602783203125, 3.6637468338012695, 3.8413333892822266, 4.018919944763184, 4.196506977081299, 4.374093532562256, 4.551680088043213, 4.729267120361328, 4.906853675842285, 5.084440231323242, 5.262026786804199, 5.439613342285156, 5.6172003746032715, 5.7947869300842285]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 9.0, 11.0, 8.0, 16.0, 31.0, 33.0, 65.0, 69.0, 102.0, 168.0, 213.0, 325.0, 567.0, 886.0, 1410.0, 2279.0, 4028.0, 7049.0, 13017.0, 25841.0, 53692.0, 116743.0, 229037.0, 271589.0, 166900.0, 77805.0, 36093.0, 17767.0, 9573.0, 5218.0, 2974.0, 1912.0, 1078.0, 705.0, 439.0, 279.0, 214.0, 146.0, 59.0, 77.0, 34.0, 28.0, 20.0, 9.0, 13.0, 9.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.951171875, -3.832305908203125, -3.71343994140625, -3.594573974609375, -3.4757080078125, -3.356842041015625, -3.23797607421875, -3.119110107421875, -3.000244140625, -2.881378173828125, -2.76251220703125, -2.643646240234375, -2.5247802734375, -2.405914306640625, -2.28704833984375, -2.168182373046875, -2.04931640625, -1.930450439453125, -1.81158447265625, -1.692718505859375, -1.5738525390625, -1.454986572265625, -1.33612060546875, -1.217254638671875, -1.098388671875, -0.979522705078125, -0.86065673828125, -0.741790771484375, -0.6229248046875, -0.504058837890625, -0.38519287109375, -0.266326904296875, -0.1474609375, -0.028594970703125, 0.09027099609375, 0.209136962890625, 0.3280029296875, 0.446868896484375, 0.56573486328125, 0.684600830078125, 0.803466796875, 0.922332763671875, 1.04119873046875, 1.160064697265625, 1.2789306640625, 1.397796630859375, 1.51666259765625, 1.635528564453125, 1.75439453125, 1.873260498046875, 1.99212646484375, 2.110992431640625, 2.2298583984375, 2.348724365234375, 2.46759033203125, 2.586456298828125, 2.705322265625, 2.824188232421875, 2.94305419921875, 3.061920166015625, 3.1807861328125, 3.299652099609375, 3.41851806640625, 3.537384033203125, 3.65625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 9.0, 13.0, 17.0, 15.0, 14.0, 17.0, 21.0, 29.0, 35.0, 41.0, 40.0, 59.0, 48.0, 53.0, 69.0, 45.0, 40.0, 50.0, 36.0, 34.0, 36.0, 33.0, 29.0, 22.0, 24.0, 25.0, 21.0, 18.0, 12.0, 18.0, 9.0, 11.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-6.53125, -6.32598876953125, -6.1207275390625, -5.91546630859375, -5.710205078125, -5.50494384765625, -5.2996826171875, -5.09442138671875, -4.88916015625, -4.68389892578125, -4.4786376953125, -4.27337646484375, -4.068115234375, -3.86285400390625, -3.6575927734375, -3.45233154296875, -3.2470703125, -3.04180908203125, -2.8365478515625, -2.63128662109375, -2.426025390625, -2.22076416015625, -2.0155029296875, -1.81024169921875, -1.60498046875, -1.39971923828125, -1.1944580078125, -0.98919677734375, -0.783935546875, -0.57867431640625, -0.3734130859375, -0.16815185546875, 0.037109375, 0.24237060546875, 0.4476318359375, 0.65289306640625, 0.858154296875, 1.06341552734375, 1.2686767578125, 1.47393798828125, 1.67919921875, 1.88446044921875, 2.0897216796875, 2.29498291015625, 2.500244140625, 2.70550537109375, 2.9107666015625, 3.11602783203125, 3.3212890625, 3.52655029296875, 3.7318115234375, 3.93707275390625, 4.142333984375, 4.34759521484375, 4.5528564453125, 4.75811767578125, 4.96337890625, 5.16864013671875, 5.3739013671875, 5.57916259765625, 5.784423828125, 5.98968505859375, 6.1949462890625, 6.40020751953125, 6.60546875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 7.0, 12.0, 20.0, 28.0, 39.0, 51.0, 76.0, 87.0, 147.0, 262.0, 397.0, 633.0, 1047.0, 1807.0, 3488.0, 6705.0, 13986.0, 32610.0, 85409.0, 233418.0, 366787.0, 183807.0, 67159.0, 26309.0, 11637.0, 5665.0, 2854.0, 1623.0, 931.0, 550.0, 323.0, 216.0, 138.0, 91.0, 78.0, 51.0, 24.0, 19.0, 13.0, 14.0, 9.0, 12.0, 8.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4140625, -5.24151611328125, -5.0689697265625, -4.89642333984375, -4.723876953125, -4.55133056640625, -4.3787841796875, -4.20623779296875, -4.03369140625, -3.86114501953125, -3.6885986328125, -3.51605224609375, -3.343505859375, -3.17095947265625, -2.9984130859375, -2.82586669921875, -2.6533203125, -2.48077392578125, -2.3082275390625, -2.13568115234375, -1.963134765625, -1.79058837890625, -1.6180419921875, -1.44549560546875, -1.27294921875, -1.10040283203125, -0.9278564453125, -0.75531005859375, -0.582763671875, -0.41021728515625, -0.2376708984375, -0.06512451171875, 0.107421875, 0.27996826171875, 0.4525146484375, 0.62506103515625, 0.797607421875, 0.97015380859375, 1.1427001953125, 1.31524658203125, 1.48779296875, 1.66033935546875, 1.8328857421875, 2.00543212890625, 2.177978515625, 2.35052490234375, 2.5230712890625, 2.69561767578125, 2.8681640625, 3.04071044921875, 3.2132568359375, 3.38580322265625, 3.558349609375, 3.73089599609375, 3.9034423828125, 4.07598876953125, 4.24853515625, 4.42108154296875, 4.5936279296875, 4.76617431640625, 4.938720703125, 5.11126708984375, 5.2838134765625, 5.45635986328125, 5.62890625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 6.0, 11.0, 8.0, 17.0, 6.0, 13.0, 19.0, 18.0, 12.0, 36.0, 33.0, 37.0, 34.0, 38.0, 33.0, 29.0, 40.0, 30.0, 38.0, 38.0, 43.0, 43.0, 41.0, 40.0, 41.0, 35.0, 31.0, 30.0, 24.0, 20.0, 23.0, 22.0, 21.0, 15.0, 8.0, 12.0, 12.0, 5.0, 9.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.115234375, -3.015777587890625, -2.91632080078125, -2.816864013671875, -2.7174072265625, -2.617950439453125, -2.51849365234375, -2.419036865234375, -2.319580078125, -2.220123291015625, -2.12066650390625, -2.021209716796875, -1.9217529296875, -1.822296142578125, -1.72283935546875, -1.623382568359375, -1.52392578125, -1.424468994140625, -1.32501220703125, -1.225555419921875, -1.1260986328125, -1.026641845703125, -0.92718505859375, -0.827728271484375, -0.728271484375, -0.628814697265625, -0.52935791015625, -0.429901123046875, -0.3304443359375, -0.230987548828125, -0.13153076171875, -0.032073974609375, 0.0673828125, 0.166839599609375, 0.26629638671875, 0.365753173828125, 0.4652099609375, 0.564666748046875, 0.66412353515625, 0.763580322265625, 0.863037109375, 0.962493896484375, 1.06195068359375, 1.161407470703125, 1.2608642578125, 1.360321044921875, 1.45977783203125, 1.559234619140625, 1.65869140625, 1.758148193359375, 1.85760498046875, 1.957061767578125, 2.0565185546875, 2.155975341796875, 2.25543212890625, 2.354888916015625, 2.454345703125, 2.553802490234375, 2.65325927734375, 2.752716064453125, 2.8521728515625, 2.951629638671875, 3.05108642578125, 3.150543212890625, 3.25]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 11.0, 16.0, 23.0, 26.0, 56.0, 75.0, 100.0, 178.0, 233.0, 364.0, 631.0, 1084.0, 1948.0, 4369.0, 14569.0, 112339.0, 753259.0, 133996.0, 15873.0, 4556.0, 1952.0, 1099.0, 650.0, 350.0, 268.0, 162.0, 114.0, 78.0, 49.0, 33.0, 28.0, 23.0, 9.0, 6.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12890625, -4.942626953125, -4.75634765625, -4.570068359375, -4.3837890625, -4.197509765625, -4.01123046875, -3.824951171875, -3.638671875, -3.452392578125, -3.26611328125, -3.079833984375, -2.8935546875, -2.707275390625, -2.52099609375, -2.334716796875, -2.1484375, -1.962158203125, -1.77587890625, -1.589599609375, -1.4033203125, -1.217041015625, -1.03076171875, -0.844482421875, -0.658203125, -0.471923828125, -0.28564453125, -0.099365234375, 0.0869140625, 0.273193359375, 0.45947265625, 0.645751953125, 0.83203125, 1.018310546875, 1.20458984375, 1.390869140625, 1.5771484375, 1.763427734375, 1.94970703125, 2.135986328125, 2.322265625, 2.508544921875, 2.69482421875, 2.881103515625, 3.0673828125, 3.253662109375, 3.43994140625, 3.626220703125, 3.8125, 3.998779296875, 4.18505859375, 4.371337890625, 4.5576171875, 4.743896484375, 4.93017578125, 5.116455078125, 5.302734375, 5.489013671875, 5.67529296875, 5.861572265625, 6.0478515625, 6.234130859375, 6.42041015625, 6.606689453125, 6.79296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 12.0, 14.0, 33.0, 38.0, 78.0, 106.0, 111.0, 140.0, 145.0, 90.0, 68.0, 44.0, 31.0, 24.0, 6.0, 14.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00015854835510253906, -0.0001535024493932724, -0.00014845654368400574, -0.00014341063797473907, -0.0001383647322654724, -0.00013331882655620575, -0.0001282729208469391, -0.00012322701513767242, -0.00011818110942840576, -0.0001131352037191391, -0.00010808929800987244, -0.00010304339230060577, -9.799748659133911e-05, -9.295158088207245e-05, -8.790567517280579e-05, -8.285976946353912e-05, -7.781386375427246e-05, -7.27679580450058e-05, -6.772205233573914e-05, -6.267614662647247e-05, -5.763024091720581e-05, -5.258433520793915e-05, -4.7538429498672485e-05, -4.249252378940582e-05, -3.744661808013916e-05, -3.24007123708725e-05, -2.7354806661605835e-05, -2.2308900952339172e-05, -1.726299524307251e-05, -1.2217089533805847e-05, -7.1711838245391846e-06, -2.125278115272522e-06, 2.9206275939941406e-06, 7.966533303260803e-06, 1.3012439012527466e-05, 1.805834472179413e-05, 2.310425043106079e-05, 2.8150156140327454e-05, 3.3196061849594116e-05, 3.824196755886078e-05, 4.328787326812744e-05, 4.8333778977394104e-05, 5.3379684686660767e-05, 5.842559039592743e-05, 6.347149610519409e-05, 6.851740181446075e-05, 7.356330752372742e-05, 7.860921323299408e-05, 8.365511894226074e-05, 8.87010246515274e-05, 9.374693036079407e-05, 9.879283607006073e-05, 0.00010383874177932739, 0.00010888464748859406, 0.00011393055319786072, 0.00011897645890712738, 0.00012402236461639404, 0.0001290682703256607, 0.00013411417603492737, 0.00013916008174419403, 0.0001442059874534607, 0.00014925189316272736, 0.00015429779887199402, 0.00015934370458126068, 0.00016438961029052734]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 6.0, 10.0, 19.0, 24.0, 28.0, 44.0, 69.0, 76.0, 147.0, 173.0, 257.0, 414.0, 555.0, 841.0, 1250.0, 1782.0, 2698.0, 4405.0, 7731.0, 17595.0, 50507.0, 178522.0, 419372.0, 246006.0, 69524.0, 22679.0, 9539.0, 4901.0, 3065.0, 1987.0, 1377.0, 894.0, 636.0, 401.0, 323.0, 221.0, 148.0, 97.0, 49.0, 42.0, 48.0, 22.0, 16.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0], "bins": [-2.66796875, -2.586212158203125, -2.50445556640625, -2.422698974609375, -2.3409423828125, -2.259185791015625, -2.17742919921875, -2.095672607421875, -2.013916015625, -1.932159423828125, -1.85040283203125, -1.768646240234375, -1.6868896484375, -1.605133056640625, -1.52337646484375, -1.441619873046875, -1.35986328125, -1.278106689453125, -1.19635009765625, -1.114593505859375, -1.0328369140625, -0.951080322265625, -0.86932373046875, -0.787567138671875, -0.705810546875, -0.624053955078125, -0.54229736328125, -0.460540771484375, -0.3787841796875, -0.297027587890625, -0.21527099609375, -0.133514404296875, -0.0517578125, 0.029998779296875, 0.11175537109375, 0.193511962890625, 0.2752685546875, 0.357025146484375, 0.43878173828125, 0.520538330078125, 0.602294921875, 0.684051513671875, 0.76580810546875, 0.847564697265625, 0.9293212890625, 1.011077880859375, 1.09283447265625, 1.174591064453125, 1.25634765625, 1.338104248046875, 1.41986083984375, 1.501617431640625, 1.5833740234375, 1.665130615234375, 1.74688720703125, 1.828643798828125, 1.910400390625, 1.992156982421875, 2.07391357421875, 2.155670166015625, 2.2374267578125, 2.319183349609375, 2.40093994140625, 2.482696533203125, 2.564453125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 9.0, 12.0, 21.0, 28.0, 45.0, 62.0, 72.0, 91.0, 124.0, 114.0, 104.0, 84.0, 69.0, 52.0, 36.0, 21.0, 15.0, 14.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71533203125, -0.6910781860351562, -0.6668243408203125, -0.6425704956054688, -0.618316650390625, -0.5940628051757812, -0.5698089599609375, -0.5455551147460938, -0.52130126953125, -0.49704742431640625, -0.4727935791015625, -0.44853973388671875, -0.424285888671875, -0.40003204345703125, -0.3757781982421875, -0.35152435302734375, -0.3272705078125, -0.30301666259765625, -0.2787628173828125, -0.25450897216796875, -0.230255126953125, -0.20600128173828125, -0.1817474365234375, -0.15749359130859375, -0.13323974609375, -0.10898590087890625, -0.0847320556640625, -0.06047821044921875, -0.036224365234375, -0.01197052001953125, 0.0122833251953125, 0.03653717041015625, 0.060791015625, 0.08504486083984375, 0.1092987060546875, 0.13355255126953125, 0.157806396484375, 0.18206024169921875, 0.2063140869140625, 0.23056793212890625, 0.25482177734375, 0.27907562255859375, 0.3033294677734375, 0.32758331298828125, 0.351837158203125, 0.37609100341796875, 0.4003448486328125, 0.42459869384765625, 0.4488525390625, 0.47310638427734375, 0.4973602294921875, 0.5216140747070312, 0.545867919921875, 0.5701217651367188, 0.5943756103515625, 0.6186294555664062, 0.64288330078125, 0.6671371459960938, 0.6913909912109375, 0.7156448364257812, 0.739898681640625, 0.7641525268554688, 0.7884063720703125, 0.8126602172851562, 0.8369140625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 6.0, 7.0, 5.0, 14.0, 8.0, 20.0, 21.0, 26.0, 42.0, 68.0, 89.0, 101.0, 88.0, 117.0, 78.0, 86.0, 58.0, 46.0, 36.0, 28.0, 10.0, 13.0, 7.0, 8.0, 8.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.774717330932617, -16.364784240722656, -15.954852104187012, -15.544919967651367, -15.134987831115723, -14.725055694580078, -14.315122604370117, -13.905190467834473, -13.495258331298828, -13.085326194763184, -12.675393104553223, -12.265460968017578, -11.855528831481934, -11.445596694946289, -11.035663604736328, -10.625731468200684, -10.215798377990723, -9.805866241455078, -9.395933151245117, -8.986001014709473, -8.576068878173828, -8.166135787963867, -7.756203651428223, -7.346271514892578, -6.936338901519775, -6.526406288146973, -6.116474151611328, -5.706541538238525, -5.296608924865723, -4.886676788330078, -4.476744174957275, -4.066811561584473, -3.656879425048828, -3.2469470500946045, -2.837014675140381, -2.427082061767578, -2.0171496868133545, -1.6072173118591309, -1.1972846984863281, -0.7873523235321045, -0.37741994857788086, 0.03251248598098755, 0.44244492053985596, 0.8523774147033691, 1.2623097896575928, 1.6722421646118164, 2.082174777984619, 2.4921071529388428, 2.9020395278930664, 3.31197190284729, 3.7219042778015137, 4.131836891174316, 4.541769027709961, 4.951701641082764, 5.361634254455566, 5.771566390991211, 6.181499004364014, 6.591431617736816, 7.001363754272461, 7.411296367645264, 7.821228981018066, 8.231161117553711, 8.641094207763672, 9.051026344299316, 9.460958480834961]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 4.0, 10.0, 10.0, 11.0, 9.0, 13.0, 17.0, 10.0, 13.0, 19.0, 27.0, 36.0, 32.0, 49.0, 49.0, 52.0, 51.0, 36.0, 53.0, 43.0, 43.0, 42.0, 53.0, 27.0, 34.0, 29.0, 27.0, 17.0, 25.0, 21.0, 21.0, 21.0, 18.0, 13.0, 14.0, 7.0, 3.0, 8.0, 7.0, 11.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.590302467346191, -5.411503791809082, -5.2327046394348145, -5.053905963897705, -4.8751068115234375, -4.696308135986328, -4.517509460449219, -4.338710308074951, -4.159911155700684, -3.981112241744995, -3.8023133277893066, -3.6235146522521973, -3.4447154998779297, -3.2659168243408203, -3.087117910385132, -2.9083189964294434, -2.729520320892334, -2.5507214069366455, -2.371922492980957, -2.1931238174438477, -2.01432466506958, -1.8355258703231812, -1.6567270755767822, -1.4779281616210938, -1.2991292476654053, -1.1203303337097168, -0.9415314793586731, -0.7627326250076294, -0.5839337110519409, -0.40513479709625244, -0.22633600234985352, -0.04753708839416504, 0.13126134872436523, 0.3100602328777313, 0.4888591170310974, 0.6676579713821411, 0.8464568853378296, 1.025255799293518, 1.204054594039917, 1.3828535079956055, 1.561652421951294, 1.7404513359069824, 1.919250249862671, 2.0980491638183594, 2.2768478393554688, 2.4556469917297363, 2.6344456672668457, 2.813244581222534, 2.9920434951782227, 3.170842409133911, 3.3496413230895996, 3.528439998626709, 3.7072391510009766, 3.886037826538086, 4.064836502075195, 4.243635654449463, 4.4224348068237305, 4.60123348236084, 4.780032634735107, 4.958831310272217, 5.137630462646484, 5.316429138183594, 5.495227813720703, 5.674026966094971, 5.85282564163208]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 15.0, 30.0, 25.0, 40.0, 57.0, 75.0, 144.0, 202.0, 302.0, 505.0, 752.0, 1211.0, 2033.0, 3406.0, 6069.0, 10282.0, 18800.0, 35587.0, 69496.0, 127710.0, 198160.0, 218023.0, 159242.0, 91630.0, 48007.0, 25108.0, 13253.0, 7380.0, 4307.0, 2554.0, 1503.0, 940.0, 567.0, 381.0, 248.0, 142.0, 124.0, 86.0, 56.0, 37.0, 18.0, 11.0, 12.0, 10.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.86328125, -6.6434326171875, -6.423583984375, -6.2037353515625, -5.98388671875, -5.7640380859375, -5.544189453125, -5.3243408203125, -5.1044921875, -4.8846435546875, -4.664794921875, -4.4449462890625, -4.22509765625, -4.0052490234375, -3.785400390625, -3.5655517578125, -3.345703125, -3.1258544921875, -2.906005859375, -2.6861572265625, -2.46630859375, -2.2464599609375, -2.026611328125, -1.8067626953125, -1.5869140625, -1.3670654296875, -1.147216796875, -0.9273681640625, -0.70751953125, -0.4876708984375, -0.267822265625, -0.0479736328125, 0.171875, 0.3917236328125, 0.611572265625, 0.8314208984375, 1.05126953125, 1.2711181640625, 1.490966796875, 1.7108154296875, 1.9306640625, 2.1505126953125, 2.370361328125, 2.5902099609375, 2.81005859375, 3.0299072265625, 3.249755859375, 3.4696044921875, 3.689453125, 3.9093017578125, 4.129150390625, 4.3489990234375, 4.56884765625, 4.7886962890625, 5.008544921875, 5.2283935546875, 5.4482421875, 5.6680908203125, 5.887939453125, 6.1077880859375, 6.32763671875, 6.5474853515625, 6.767333984375, 6.9871826171875, 7.20703125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 11.0, 6.0, 12.0, 9.0, 16.0, 13.0, 11.0, 28.0, 19.0, 33.0, 28.0, 47.0, 49.0, 52.0, 53.0, 52.0, 39.0, 50.0, 49.0, 48.0, 54.0, 46.0, 35.0, 22.0, 26.0, 21.0, 20.0, 16.0, 18.0, 23.0, 16.0, 9.0, 12.0, 10.0, 7.0, 6.0, 7.0, 3.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.9453125, -5.73651123046875, -5.5277099609375, -5.31890869140625, -5.110107421875, -4.90130615234375, -4.6925048828125, -4.48370361328125, -4.27490234375, -4.06610107421875, -3.8572998046875, -3.64849853515625, -3.439697265625, -3.23089599609375, -3.0220947265625, -2.81329345703125, -2.6044921875, -2.39569091796875, -2.1868896484375, -1.97808837890625, -1.769287109375, -1.56048583984375, -1.3516845703125, -1.14288330078125, -0.93408203125, -0.72528076171875, -0.5164794921875, -0.30767822265625, -0.098876953125, 0.10992431640625, 0.3187255859375, 0.52752685546875, 0.736328125, 0.94512939453125, 1.1539306640625, 1.36273193359375, 1.571533203125, 1.78033447265625, 1.9891357421875, 2.19793701171875, 2.40673828125, 2.61553955078125, 2.8243408203125, 3.03314208984375, 3.241943359375, 3.45074462890625, 3.6595458984375, 3.86834716796875, 4.0771484375, 4.28594970703125, 4.4947509765625, 4.70355224609375, 4.912353515625, 5.12115478515625, 5.3299560546875, 5.53875732421875, 5.74755859375, 5.95635986328125, 6.1651611328125, 6.37396240234375, 6.582763671875, 6.79156494140625, 7.0003662109375, 7.20916748046875, 7.41796875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 8.0, 18.0, 19.0, 38.0, 51.0, 107.0, 141.0, 193.0, 362.0, 512.0, 802.0, 1344.0, 2128.0, 3406.0, 5405.0, 8992.0, 14603.0, 24279.0, 40624.0, 66423.0, 104780.0, 147647.0, 170023.0, 155588.0, 114215.0, 73126.0, 44696.0, 26888.0, 16261.0, 9723.0, 5948.0, 3764.0, 2373.0, 1491.0, 974.0, 606.0, 367.0, 225.0, 160.0, 92.0, 62.0, 37.0, 25.0, 12.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.94140625, -5.76458740234375, -5.5877685546875, -5.41094970703125, -5.234130859375, -5.05731201171875, -4.8804931640625, -4.70367431640625, -4.52685546875, -4.35003662109375, -4.1732177734375, -3.99639892578125, -3.819580078125, -3.64276123046875, -3.4659423828125, -3.28912353515625, -3.1123046875, -2.93548583984375, -2.7586669921875, -2.58184814453125, -2.405029296875, -2.22821044921875, -2.0513916015625, -1.87457275390625, -1.69775390625, -1.52093505859375, -1.3441162109375, -1.16729736328125, -0.990478515625, -0.81365966796875, -0.6368408203125, -0.46002197265625, -0.283203125, -0.10638427734375, 0.0704345703125, 0.24725341796875, 0.424072265625, 0.60089111328125, 0.7777099609375, 0.95452880859375, 1.13134765625, 1.30816650390625, 1.4849853515625, 1.66180419921875, 1.838623046875, 2.01544189453125, 2.1922607421875, 2.36907958984375, 2.5458984375, 2.72271728515625, 2.8995361328125, 3.07635498046875, 3.253173828125, 3.42999267578125, 3.6068115234375, 3.78363037109375, 3.96044921875, 4.13726806640625, 4.3140869140625, 4.49090576171875, 4.667724609375, 4.84454345703125, 5.0213623046875, 5.19818115234375, 5.375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 8.0, 8.0, 4.0, 6.0, 11.0, 5.0, 13.0, 14.0, 8.0, 10.0, 18.0, 20.0, 24.0, 30.0, 30.0, 28.0, 36.0, 34.0, 38.0, 48.0, 44.0, 39.0, 36.0, 36.0, 32.0, 36.0, 49.0, 33.0, 29.0, 34.0, 29.0, 26.0, 17.0, 29.0, 27.0, 20.0, 18.0, 13.0, 9.0, 10.0, 8.0, 10.0, 3.0, 11.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.607421875, -3.500885009765625, -3.39434814453125, -3.287811279296875, -3.1812744140625, -3.074737548828125, -2.96820068359375, -2.861663818359375, -2.755126953125, -2.648590087890625, -2.54205322265625, -2.435516357421875, -2.3289794921875, -2.222442626953125, -2.11590576171875, -2.009368896484375, -1.90283203125, -1.796295166015625, -1.68975830078125, -1.583221435546875, -1.4766845703125, -1.370147705078125, -1.26361083984375, -1.157073974609375, -1.050537109375, -0.944000244140625, -0.83746337890625, -0.730926513671875, -0.6243896484375, -0.517852783203125, -0.41131591796875, -0.304779052734375, -0.1982421875, -0.091705322265625, 0.01483154296875, 0.121368408203125, 0.2279052734375, 0.334442138671875, 0.44097900390625, 0.547515869140625, 0.654052734375, 0.760589599609375, 0.86712646484375, 0.973663330078125, 1.0802001953125, 1.186737060546875, 1.29327392578125, 1.399810791015625, 1.50634765625, 1.612884521484375, 1.71942138671875, 1.825958251953125, 1.9324951171875, 2.039031982421875, 2.14556884765625, 2.252105712890625, 2.358642578125, 2.465179443359375, 2.57171630859375, 2.678253173828125, 2.7847900390625, 2.891326904296875, 2.99786376953125, 3.104400634765625, 3.2109375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 11.0, 9.0, 19.0, 32.0, 38.0, 60.0, 90.0, 134.0, 253.0, 364.0, 625.0, 1016.0, 1850.0, 3329.0, 6545.0, 13539.0, 32502.0, 86202.0, 233350.0, 354851.0, 192993.0, 69633.0, 26817.0, 11591.0, 5651.0, 3002.0, 1690.0, 930.0, 516.0, 321.0, 203.0, 152.0, 72.0, 52.0, 35.0, 28.0, 16.0, 11.0, 7.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.55780029296875, -4.3851318359375, -4.21246337890625, -4.039794921875, -3.86712646484375, -3.6944580078125, -3.52178955078125, -3.34912109375, -3.17645263671875, -3.0037841796875, -2.83111572265625, -2.658447265625, -2.48577880859375, -2.3131103515625, -2.14044189453125, -1.9677734375, -1.79510498046875, -1.6224365234375, -1.44976806640625, -1.277099609375, -1.10443115234375, -0.9317626953125, -0.75909423828125, -0.58642578125, -0.41375732421875, -0.2410888671875, -0.06842041015625, 0.104248046875, 0.27691650390625, 0.4495849609375, 0.62225341796875, 0.794921875, 0.96759033203125, 1.1402587890625, 1.31292724609375, 1.485595703125, 1.65826416015625, 1.8309326171875, 2.00360107421875, 2.17626953125, 2.34893798828125, 2.5216064453125, 2.69427490234375, 2.866943359375, 3.03961181640625, 3.2122802734375, 3.38494873046875, 3.5576171875, 3.73028564453125, 3.9029541015625, 4.07562255859375, 4.248291015625, 4.42095947265625, 4.5936279296875, 4.76629638671875, 4.93896484375, 5.11163330078125, 5.2843017578125, 5.45697021484375, 5.629638671875, 5.80230712890625, 5.9749755859375, 6.14764404296875, 6.3203125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 8.0, 14.0, 11.0, 18.0, 22.0, 28.0, 29.0, 52.0, 66.0, 80.0, 97.0, 115.0, 93.0, 97.0, 62.0, 52.0, 37.0, 27.0, 21.0, 20.0, 12.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004901885986328125, -0.000474683940410614, -0.00045917928218841553, -0.00044367462396621704, -0.00042816996574401855, -0.00041266530752182007, -0.0003971606492996216, -0.0003816559910774231, -0.0003661513328552246, -0.0003506466746330261, -0.00033514201641082764, -0.00031963735818862915, -0.00030413269996643066, -0.0002886280417442322, -0.0002731233835220337, -0.0002576187252998352, -0.00024211406707763672, -0.00022660940885543823, -0.00021110475063323975, -0.00019560009241104126, -0.00018009543418884277, -0.0001645907759666443, -0.0001490861177444458, -0.00013358145952224731, -0.00011807680130004883, -0.00010257214307785034, -8.706748485565186e-05, -7.156282663345337e-05, -5.605816841125488e-05, -4.0553510189056396e-05, -2.504885196685791e-05, -9.544193744659424e-06, 5.9604644775390625e-06, 2.146512269973755e-05, 3.6969780921936035e-05, 5.247443914413452e-05, 6.797909736633301e-05, 8.34837555885315e-05, 9.898841381072998e-05, 0.00011449307203292847, 0.00012999773025512695, 0.00014550238847732544, 0.00016100704669952393, 0.0001765117049217224, 0.0001920163631439209, 0.00020752102136611938, 0.00022302567958831787, 0.00023853033781051636, 0.00025403499603271484, 0.00026953965425491333, 0.0002850443124771118, 0.0003005489706993103, 0.0003160536289215088, 0.0003315582871437073, 0.00034706294536590576, 0.00036256760358810425, 0.00037807226181030273, 0.0003935769200325012, 0.0004090815782546997, 0.0004245862364768982, 0.0004400908946990967, 0.00045559555292129517, 0.00047110021114349365, 0.00048660486936569214, 0.0005021095275878906]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 9.0, 11.0, 9.0, 8.0, 16.0, 24.0, 26.0, 39.0, 66.0, 82.0, 135.0, 179.0, 286.0, 406.0, 634.0, 1088.0, 1724.0, 3135.0, 5845.0, 11313.0, 23942.0, 53273.0, 119490.0, 227504.0, 270080.0, 174149.0, 82495.0, 36669.0, 16937.0, 8459.0, 4349.0, 2308.0, 1373.0, 884.0, 532.0, 342.0, 222.0, 147.0, 121.0, 76.0, 46.0, 31.0, 27.0, 19.0, 14.0, 13.0, 8.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.548675537109375, -3.42742919921875, -3.306182861328125, -3.1849365234375, -3.063690185546875, -2.94244384765625, -2.821197509765625, -2.699951171875, -2.578704833984375, -2.45745849609375, -2.336212158203125, -2.2149658203125, -2.093719482421875, -1.97247314453125, -1.851226806640625, -1.72998046875, -1.608734130859375, -1.48748779296875, -1.366241455078125, -1.2449951171875, -1.123748779296875, -1.00250244140625, -0.881256103515625, -0.760009765625, -0.638763427734375, -0.51751708984375, -0.396270751953125, -0.2750244140625, -0.153778076171875, -0.03253173828125, 0.088714599609375, 0.2099609375, 0.331207275390625, 0.45245361328125, 0.573699951171875, 0.6949462890625, 0.816192626953125, 0.93743896484375, 1.058685302734375, 1.179931640625, 1.301177978515625, 1.42242431640625, 1.543670654296875, 1.6649169921875, 1.786163330078125, 1.90740966796875, 2.028656005859375, 2.14990234375, 2.271148681640625, 2.39239501953125, 2.513641357421875, 2.6348876953125, 2.756134033203125, 2.87738037109375, 2.998626708984375, 3.119873046875, 3.241119384765625, 3.36236572265625, 3.483612060546875, 3.6048583984375, 3.726104736328125, 3.84735107421875, 3.968597412109375, 4.08984375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 11.0, 16.0, 19.0, 27.0, 42.0, 46.0, 39.0, 42.0, 66.0, 77.0, 67.0, 66.0, 87.0, 73.0, 66.0, 57.0, 50.0, 33.0, 25.0, 17.0, 23.0, 19.0, 6.0, 8.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1171875, -1.0828857421875, -1.048583984375, -1.0142822265625, -0.97998046875, -0.9456787109375, -0.911376953125, -0.8770751953125, -0.8427734375, -0.8084716796875, -0.774169921875, -0.7398681640625, -0.70556640625, -0.6712646484375, -0.636962890625, -0.6026611328125, -0.568359375, -0.5340576171875, -0.499755859375, -0.4654541015625, -0.43115234375, -0.3968505859375, -0.362548828125, -0.3282470703125, -0.2939453125, -0.2596435546875, -0.225341796875, -0.1910400390625, -0.15673828125, -0.1224365234375, -0.088134765625, -0.0538330078125, -0.01953125, 0.0147705078125, 0.049072265625, 0.0833740234375, 0.11767578125, 0.1519775390625, 0.186279296875, 0.2205810546875, 0.2548828125, 0.2891845703125, 0.323486328125, 0.3577880859375, 0.39208984375, 0.4263916015625, 0.460693359375, 0.4949951171875, 0.529296875, 0.5635986328125, 0.597900390625, 0.6322021484375, 0.66650390625, 0.7008056640625, 0.735107421875, 0.7694091796875, 0.8037109375, 0.8380126953125, 0.872314453125, 0.9066162109375, 0.94091796875, 0.9752197265625, 1.009521484375, 1.0438232421875, 1.078125]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 6.0, 4.0, 4.0, 8.0, 6.0, 8.0, 11.0, 23.0, 21.0, 33.0, 46.0, 69.0, 94.0, 94.0, 98.0, 119.0, 76.0, 75.0, 63.0, 45.0, 27.0, 19.0, 10.0, 17.0, 6.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.112650871276855, -14.689648628234863, -14.266647338867188, -13.843645095825195, -13.420642852783203, -12.997641563415527, -12.574639320373535, -12.15163803100586, -11.728635787963867, -11.305633544921875, -10.8826322555542, -10.459630012512207, -10.036628723144531, -9.613626480102539, -9.190624237060547, -8.767621994018555, -8.344620704650879, -7.921618938446045, -7.498617172241211, -7.075614929199219, -6.652613162994385, -6.229611396789551, -5.806609153747559, -5.383607387542725, -4.960605621337891, -4.537603855133057, -4.114602088928223, -3.6915998458862305, -3.2685980796813965, -2.8455963134765625, -2.4225943088531494, -1.9995923042297363, -1.5765914916992188, -1.1535896062850952, -0.7305877208709717, -0.30758583545684814, 0.11541604995727539, 0.5384178161621094, 0.9614198207855225, 1.3844218254089355, 1.8074235916137695, 2.2304253578186035, 2.6534273624420166, 3.0764293670654297, 3.4994311332702637, 3.9224328994750977, 4.34543514251709, 4.768436908721924, 5.191438674926758, 5.614440441131592, 6.037442207336426, 6.460444450378418, 6.883446216583252, 7.306447982788086, 7.729450225830078, 8.15245246887207, 8.575453758239746, 8.998456001281738, 9.421457290649414, 9.844459533691406, 10.267461776733398, 10.690463066101074, 11.113465309143066, 11.536466598510742, 11.959468841552734]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 1.0, 6.0, 7.0, 4.0, 14.0, 10.0, 9.0, 15.0, 15.0, 25.0, 18.0, 24.0, 23.0, 39.0, 37.0, 45.0, 34.0, 39.0, 42.0, 45.0, 49.0, 50.0, 45.0, 46.0, 30.0, 36.0, 37.0, 35.0, 32.0, 19.0, 29.0, 16.0, 22.0, 21.0, 14.0, 11.0, 11.0, 11.0, 8.0, 5.0, 4.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.358779430389404, -5.175360202789307, -4.991940498352051, -4.808521270751953, -4.625101566314697, -4.4416823387146, -4.258262634277344, -4.074843406677246, -3.8914239406585693, -3.7080044746398926, -3.524585008621216, -3.341165542602539, -3.1577463150024414, -2.9743266105651855, -2.790907382965088, -2.607487916946411, -2.4240684509277344, -2.2406489849090576, -2.057229518890381, -1.8738101720809937, -1.690390706062317, -1.5069712400436401, -1.323551893234253, -1.1401324272155762, -0.9567129611968994, -0.7732934951782227, -0.5898740887641907, -0.4064546823501587, -0.22303521633148193, -0.039615750312805176, 0.14380359649658203, 0.3272230625152588, 0.5106430053710938, 0.6940624713897705, 0.8774818778038025, 1.0609012842178345, 1.2443207502365112, 1.427740216255188, 1.6111595630645752, 1.794579029083252, 1.9779984951019287, 2.1614179611206055, 2.3448374271392822, 2.528256893157959, 2.7116761207580566, 2.8950958251953125, 3.07851505279541, 3.261934518814087, 3.4453539848327637, 3.6287734508514404, 3.812192916870117, 3.995612144470215, 4.179031848907471, 4.362451076507568, 4.545870780944824, 4.729290008544922, 4.9127092361450195, 5.096128463745117, 5.279548168182373, 5.462967395782471, 5.646387100219727, 5.829806327819824, 6.013225555419922, 6.196645259857178, 6.380064964294434]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [5.0, 5.0, 10.0, 12.0, 22.0, 18.0, 39.0, 38.0, 62.0, 62.0, 106.0, 110.0, 185.0, 246.0, 315.0, 468.0, 726.0, 1081.0, 1481.0, 2164.0, 3266.0, 5118.0, 8057.0, 13691.0, 24979.0, 52693.0, 131531.0, 395882.0, 1119774.0, 1446652.0, 634057.0, 199218.0, 73613.0, 32729.0, 17169.0, 9748.0, 6123.0, 4091.0, 2698.0, 1814.0, 1218.0, 822.0, 643.0, 413.0, 324.0, 214.0, 147.0, 135.0, 96.0, 66.0, 33.0, 39.0, 22.0, 16.0, 18.0, 6.0, 4.0, 8.0, 8.0, 7.0, 2.0, 1.0, 1.0, 3.0], "bins": [-9.9375, -9.5972900390625, -9.257080078125, -8.9168701171875, -8.57666015625, -8.2364501953125, -7.896240234375, -7.5560302734375, -7.2158203125, -6.8756103515625, -6.535400390625, -6.1951904296875, -5.85498046875, -5.5147705078125, -5.174560546875, -4.8343505859375, -4.494140625, -4.1539306640625, -3.813720703125, -3.4735107421875, -3.13330078125, -2.7930908203125, -2.452880859375, -2.1126708984375, -1.7724609375, -1.4322509765625, -1.092041015625, -0.7518310546875, -0.41162109375, -0.0714111328125, 0.268798828125, 0.6090087890625, 0.94921875, 1.2894287109375, 1.629638671875, 1.9698486328125, 2.31005859375, 2.6502685546875, 2.990478515625, 3.3306884765625, 3.6708984375, 4.0111083984375, 4.351318359375, 4.6915283203125, 5.03173828125, 5.3719482421875, 5.712158203125, 6.0523681640625, 6.392578125, 6.7327880859375, 7.072998046875, 7.4132080078125, 7.75341796875, 8.0936279296875, 8.433837890625, 8.7740478515625, 9.1142578125, 9.4544677734375, 9.794677734375, 10.1348876953125, 10.47509765625, 10.8153076171875, 11.155517578125, 11.4957275390625, 11.8359375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 4.0, 8.0, 6.0, 8.0, 6.0, 14.0, 11.0, 20.0, 28.0, 19.0, 26.0, 22.0, 30.0, 30.0, 41.0, 46.0, 46.0, 42.0, 50.0, 54.0, 48.0, 45.0, 41.0, 33.0, 35.0, 36.0, 27.0, 28.0, 20.0, 26.0, 27.0, 17.0, 16.0, 12.0, 15.0, 7.0, 7.0, 12.0, 7.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2578125, -4.11669921875, -3.9755859375, -3.83447265625, -3.693359375, -3.55224609375, -3.4111328125, -3.27001953125, -3.12890625, -2.98779296875, -2.8466796875, -2.70556640625, -2.564453125, -2.42333984375, -2.2822265625, -2.14111328125, -2.0, -1.85888671875, -1.7177734375, -1.57666015625, -1.435546875, -1.29443359375, -1.1533203125, -1.01220703125, -0.87109375, -0.72998046875, -0.5888671875, -0.44775390625, -0.306640625, -0.16552734375, -0.0244140625, 0.11669921875, 0.2578125, 0.39892578125, 0.5400390625, 0.68115234375, 0.822265625, 0.96337890625, 1.1044921875, 1.24560546875, 1.38671875, 1.52783203125, 1.6689453125, 1.81005859375, 1.951171875, 2.09228515625, 2.2333984375, 2.37451171875, 2.515625, 2.65673828125, 2.7978515625, 2.93896484375, 3.080078125, 3.22119140625, 3.3623046875, 3.50341796875, 3.64453125, 3.78564453125, 3.9267578125, 4.06787109375, 4.208984375, 4.35009765625, 4.4912109375, 4.63232421875, 4.7734375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 10.0, 16.0, 26.0, 37.0, 41.0, 64.0, 116.0, 169.0, 237.0, 318.0, 517.0, 756.0, 1168.0, 1838.0, 2886.0, 4624.0, 7738.0, 13341.0, 23641.0, 46836.0, 105669.0, 292107.0, 900650.0, 1574979.0, 773121.0, 251936.0, 94994.0, 42929.0, 21896.0, 12219.0, 7246.0, 4300.0, 2709.0, 1814.0, 1159.0, 718.0, 451.0, 332.0, 226.0, 138.0, 96.0, 74.0, 47.0, 31.0, 20.0, 18.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.3125, -12.914306640625, -12.51611328125, -12.117919921875, -11.7197265625, -11.321533203125, -10.92333984375, -10.525146484375, -10.126953125, -9.728759765625, -9.33056640625, -8.932373046875, -8.5341796875, -8.135986328125, -7.73779296875, -7.339599609375, -6.94140625, -6.543212890625, -6.14501953125, -5.746826171875, -5.3486328125, -4.950439453125, -4.55224609375, -4.154052734375, -3.755859375, -3.357666015625, -2.95947265625, -2.561279296875, -2.1630859375, -1.764892578125, -1.36669921875, -0.968505859375, -0.5703125, -0.172119140625, 0.22607421875, 0.624267578125, 1.0224609375, 1.420654296875, 1.81884765625, 2.217041015625, 2.615234375, 3.013427734375, 3.41162109375, 3.809814453125, 4.2080078125, 4.606201171875, 5.00439453125, 5.402587890625, 5.80078125, 6.198974609375, 6.59716796875, 6.995361328125, 7.3935546875, 7.791748046875, 8.18994140625, 8.588134765625, 8.986328125, 9.384521484375, 9.78271484375, 10.180908203125, 10.5791015625, 10.977294921875, 11.37548828125, 11.773681640625, 12.171875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 6.0, 10.0, 13.0, 17.0, 14.0, 14.0, 37.0, 43.0, 62.0, 63.0, 91.0, 136.0, 149.0, 207.0, 286.0, 308.0, 329.0, 457.0, 398.0, 307.0, 258.0, 195.0, 160.0, 101.0, 99.0, 72.0, 39.0, 41.0, 32.0, 30.0, 17.0, 18.0, 11.0, 13.0, 8.0, 6.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.283203125, -3.1790771484375, -3.074951171875, -2.9708251953125, -2.86669921875, -2.7625732421875, -2.658447265625, -2.5543212890625, -2.4501953125, -2.3460693359375, -2.241943359375, -2.1378173828125, -2.03369140625, -1.9295654296875, -1.825439453125, -1.7213134765625, -1.6171875, -1.5130615234375, -1.408935546875, -1.3048095703125, -1.20068359375, -1.0965576171875, -0.992431640625, -0.8883056640625, -0.7841796875, -0.6800537109375, -0.575927734375, -0.4718017578125, -0.36767578125, -0.2635498046875, -0.159423828125, -0.0552978515625, 0.048828125, 0.1529541015625, 0.257080078125, 0.3612060546875, 0.46533203125, 0.5694580078125, 0.673583984375, 0.7777099609375, 0.8818359375, 0.9859619140625, 1.090087890625, 1.1942138671875, 1.29833984375, 1.4024658203125, 1.506591796875, 1.6107177734375, 1.71484375, 1.8189697265625, 1.923095703125, 2.0272216796875, 2.13134765625, 2.2354736328125, 2.339599609375, 2.4437255859375, 2.5478515625, 2.6519775390625, 2.756103515625, 2.8602294921875, 2.96435546875, 3.0684814453125, 3.172607421875, 3.2767333984375, 3.380859375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 6.0, 4.0, 2.0, 3.0, 10.0, 7.0, 10.0, 17.0, 28.0, 34.0, 44.0, 56.0, 74.0, 90.0, 85.0, 103.0, 99.0, 79.0, 53.0, 43.0, 32.0, 30.0, 23.0, 14.0, 8.0, 10.0, 4.0, 8.0, 4.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.243199348449707, -10.845352172851562, -10.447504997253418, -10.04965877532959, -9.651811599731445, -9.2539644241333, -8.856117248535156, -8.458271026611328, -8.060423851013184, -7.662576675415039, -7.264729976654053, -6.866882801055908, -6.469036102294922, -6.071188926696777, -5.673341751098633, -5.2754950523376465, -4.877647876739502, -4.479800701141357, -4.081954002380371, -3.6841068267822266, -3.2862601280212402, -2.8884129524230957, -2.4905660152435303, -2.092719078063965, -1.6948721408843994, -1.297025203704834, -0.8991782069206238, -0.5013312101364136, -0.10348427295684814, 0.2943626642227173, 0.6922097206115723, 1.0900566577911377, 1.4879035949707031, 1.8857505321502686, 2.283597469329834, 2.6814446449279785, 3.079291343688965, 3.4771385192871094, 3.874985456466675, 4.27283239364624, 4.670679092407227, 5.068526268005371, 5.466372966766357, 5.864220142364502, 6.262066841125488, 6.659914016723633, 7.057761192321777, 7.455607891082764, 7.853455066680908, 8.251301765441895, 8.649148941040039, 9.046996116638184, 9.444843292236328, 9.842689514160156, 10.2405366897583, 10.638383865356445, 11.03623104095459, 11.434078216552734, 11.831925392150879, 12.229771614074707, 12.627618789672852, 13.025465965270996, 13.42331314086914, 13.821159362792969, 14.219006538391113]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 8.0, 12.0, 19.0, 13.0, 15.0, 27.0, 23.0, 24.0, 30.0, 25.0, 49.0, 40.0, 42.0, 35.0, 51.0, 45.0, 48.0, 40.0, 42.0, 43.0, 50.0, 46.0, 33.0, 37.0, 33.0, 18.0, 18.0, 19.0, 10.0, 17.0, 14.0, 11.0, 11.0, 11.0, 5.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.619811058044434, -6.416428565979004, -6.213045597076416, -6.009663105010986, -5.806280136108398, -5.602897644042969, -5.399515151977539, -5.196132183074951, -4.992749214172363, -4.789366722106934, -4.585983753204346, -4.382601261138916, -4.179218292236328, -3.9758358001708984, -3.7724530696868896, -3.569070339202881, -3.365687847137451, -3.1623051166534424, -2.9589223861694336, -2.755539894104004, -2.552156925201416, -2.3487744331359863, -2.1453917026519775, -1.9420089721679688, -1.73862624168396, -1.5352435111999512, -1.3318607807159424, -1.1284781694412231, -0.9250954389572144, -0.7217127084732056, -0.5183300971984863, -0.31494736671447754, -0.11156511306762695, 0.09181758761405945, 0.29520028829574585, 0.49858295917510986, 0.7019656896591187, 0.9053484201431274, 1.1087310314178467, 1.3121137619018555, 1.5154964923858643, 1.718879222869873, 1.9222619533538818, 2.1256446838378906, 2.3290271759033203, 2.532410144805908, 2.735792636871338, 2.9391753673553467, 3.1425580978393555, 3.3459408283233643, 3.549323558807373, 3.7527060508728027, 3.9560890197753906, 4.15947151184082, 4.36285400390625, 4.566236972808838, 4.769619941711426, 4.9730024337768555, 5.176385402679443, 5.379767894744873, 5.583150863647461, 5.786533355712891, 5.98991584777832, 6.193298816680908, 6.396681308746338]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 14.0, 17.0, 25.0, 37.0, 66.0, 115.0, 180.0, 287.0, 459.0, 864.0, 1664.0, 2885.0, 5339.0, 10808.0, 22532.0, 51957.0, 126479.0, 268143.0, 292636.0, 150130.0, 61948.0, 26167.0, 12326.0, 6101.0, 3229.0, 1738.0, 1019.0, 577.0, 306.0, 191.0, 122.0, 71.0, 39.0, 24.0, 15.0, 11.0, 12.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.904296875, -3.770111083984375, -3.63592529296875, -3.501739501953125, -3.3675537109375, -3.233367919921875, -3.09918212890625, -2.964996337890625, -2.830810546875, -2.696624755859375, -2.56243896484375, -2.428253173828125, -2.2940673828125, -2.159881591796875, -2.02569580078125, -1.891510009765625, -1.75732421875, -1.623138427734375, -1.48895263671875, -1.354766845703125, -1.2205810546875, -1.086395263671875, -0.95220947265625, -0.818023681640625, -0.683837890625, -0.549652099609375, -0.41546630859375, -0.281280517578125, -0.1470947265625, -0.012908935546875, 0.12127685546875, 0.255462646484375, 0.3896484375, 0.523834228515625, 0.65802001953125, 0.792205810546875, 0.9263916015625, 1.060577392578125, 1.19476318359375, 1.328948974609375, 1.463134765625, 1.597320556640625, 1.73150634765625, 1.865692138671875, 1.9998779296875, 2.134063720703125, 2.26824951171875, 2.402435302734375, 2.53662109375, 2.670806884765625, 2.80499267578125, 2.939178466796875, 3.0733642578125, 3.207550048828125, 3.34173583984375, 3.475921630859375, 3.610107421875, 3.744293212890625, 3.87847900390625, 4.012664794921875, 4.1468505859375, 4.281036376953125, 4.41522216796875, 4.549407958984375, 4.68359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 4.0, 6.0, 7.0, 11.0, 10.0, 14.0, 11.0, 17.0, 16.0, 23.0, 38.0, 39.0, 35.0, 35.0, 31.0, 36.0, 38.0, 52.0, 41.0, 54.0, 35.0, 39.0, 47.0, 37.0, 35.0, 36.0, 44.0, 31.0, 27.0, 21.0, 23.0, 15.0, 10.0, 15.0, 9.0, 9.0, 14.0, 6.0, 2.0, 5.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.9691162109375, -5.754638671875, -5.5401611328125, -5.32568359375, -5.1112060546875, -4.896728515625, -4.6822509765625, -4.4677734375, -4.2532958984375, -4.038818359375, -3.8243408203125, -3.60986328125, -3.3953857421875, -3.180908203125, -2.9664306640625, -2.751953125, -2.5374755859375, -2.322998046875, -2.1085205078125, -1.89404296875, -1.6795654296875, -1.465087890625, -1.2506103515625, -1.0361328125, -0.8216552734375, -0.607177734375, -0.3927001953125, -0.17822265625, 0.0362548828125, 0.250732421875, 0.4652099609375, 0.6796875, 0.8941650390625, 1.108642578125, 1.3231201171875, 1.53759765625, 1.7520751953125, 1.966552734375, 2.1810302734375, 2.3955078125, 2.6099853515625, 2.824462890625, 3.0389404296875, 3.25341796875, 3.4678955078125, 3.682373046875, 3.8968505859375, 4.111328125, 4.3258056640625, 4.540283203125, 4.7547607421875, 4.96923828125, 5.1837158203125, 5.398193359375, 5.6126708984375, 5.8271484375, 6.0416259765625, 6.256103515625, 6.4705810546875, 6.68505859375, 6.8995361328125, 7.114013671875, 7.3284912109375, 7.54296875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 10.0, 11.0, 11.0, 18.0, 26.0, 37.0, 62.0, 83.0, 124.0, 199.0, 268.0, 491.0, 706.0, 1182.0, 2001.0, 3281.0, 6008.0, 11264.0, 22823.0, 48024.0, 109720.0, 239330.0, 298801.0, 164578.0, 72008.0, 32699.0, 15926.0, 8079.0, 4299.0, 2506.0, 1472.0, 915.0, 548.0, 350.0, 246.0, 127.0, 120.0, 58.0, 51.0, 33.0, 22.0, 13.0, 14.0, 4.0, 0.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.634033203125, -4.49462890625, -4.355224609375, -4.2158203125, -4.076416015625, -3.93701171875, -3.797607421875, -3.658203125, -3.518798828125, -3.37939453125, -3.239990234375, -3.1005859375, -2.961181640625, -2.82177734375, -2.682373046875, -2.54296875, -2.403564453125, -2.26416015625, -2.124755859375, -1.9853515625, -1.845947265625, -1.70654296875, -1.567138671875, -1.427734375, -1.288330078125, -1.14892578125, -1.009521484375, -0.8701171875, -0.730712890625, -0.59130859375, -0.451904296875, -0.3125, -0.173095703125, -0.03369140625, 0.105712890625, 0.2451171875, 0.384521484375, 0.52392578125, 0.663330078125, 0.802734375, 0.942138671875, 1.08154296875, 1.220947265625, 1.3603515625, 1.499755859375, 1.63916015625, 1.778564453125, 1.91796875, 2.057373046875, 2.19677734375, 2.336181640625, 2.4755859375, 2.614990234375, 2.75439453125, 2.893798828125, 3.033203125, 3.172607421875, 3.31201171875, 3.451416015625, 3.5908203125, 3.730224609375, 3.86962890625, 4.009033203125, 4.1484375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 2.0, 6.0, 5.0, 11.0, 9.0, 10.0, 8.0, 14.0, 19.0, 16.0, 18.0, 23.0, 26.0, 32.0, 36.0, 27.0, 39.0, 36.0, 39.0, 32.0, 37.0, 34.0, 55.0, 39.0, 45.0, 28.0, 41.0, 37.0, 38.0, 33.0, 27.0, 22.0, 21.0, 16.0, 20.0, 16.0, 16.0, 12.0, 11.0, 9.0, 7.0, 5.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.572265625, -3.4583740234375, -3.344482421875, -3.2305908203125, -3.11669921875, -3.0028076171875, -2.888916015625, -2.7750244140625, -2.6611328125, -2.5472412109375, -2.433349609375, -2.3194580078125, -2.20556640625, -2.0916748046875, -1.977783203125, -1.8638916015625, -1.75, -1.6361083984375, -1.522216796875, -1.4083251953125, -1.29443359375, -1.1805419921875, -1.066650390625, -0.9527587890625, -0.8388671875, -0.7249755859375, -0.611083984375, -0.4971923828125, -0.38330078125, -0.2694091796875, -0.155517578125, -0.0416259765625, 0.072265625, 0.1861572265625, 0.300048828125, 0.4139404296875, 0.52783203125, 0.6417236328125, 0.755615234375, 0.8695068359375, 0.9833984375, 1.0972900390625, 1.211181640625, 1.3250732421875, 1.43896484375, 1.5528564453125, 1.666748046875, 1.7806396484375, 1.89453125, 2.0084228515625, 2.122314453125, 2.2362060546875, 2.35009765625, 2.4639892578125, 2.577880859375, 2.6917724609375, 2.8056640625, 2.9195556640625, 3.033447265625, 3.1473388671875, 3.26123046875, 3.3751220703125, 3.489013671875, 3.6029052734375, 3.716796875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 4.0, 12.0, 8.0, 18.0, 30.0, 27.0, 35.0, 44.0, 80.0, 147.0, 204.0, 331.0, 557.0, 869.0, 1612.0, 2817.0, 5302.0, 9989.0, 19836.0, 42365.0, 94755.0, 213089.0, 312344.0, 187283.0, 81982.0, 37029.0, 17904.0, 8852.0, 4717.0, 2586.0, 1521.0, 835.0, 497.0, 313.0, 180.0, 129.0, 83.0, 62.0, 39.0, 30.0, 13.0, 15.0, 4.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.537109375, -1.478912353515625, -1.42071533203125, -1.362518310546875, -1.3043212890625, -1.246124267578125, -1.18792724609375, -1.129730224609375, -1.071533203125, -1.013336181640625, -0.95513916015625, -0.896942138671875, -0.8387451171875, -0.780548095703125, -0.72235107421875, -0.664154052734375, -0.60595703125, -0.547760009765625, -0.48956298828125, -0.431365966796875, -0.3731689453125, -0.314971923828125, -0.25677490234375, -0.198577880859375, -0.140380859375, -0.082183837890625, -0.02398681640625, 0.034210205078125, 0.0924072265625, 0.150604248046875, 0.20880126953125, 0.266998291015625, 0.3251953125, 0.383392333984375, 0.44158935546875, 0.499786376953125, 0.5579833984375, 0.616180419921875, 0.67437744140625, 0.732574462890625, 0.790771484375, 0.848968505859375, 0.90716552734375, 0.965362548828125, 1.0235595703125, 1.081756591796875, 1.13995361328125, 1.198150634765625, 1.25634765625, 1.314544677734375, 1.37274169921875, 1.430938720703125, 1.4891357421875, 1.547332763671875, 1.60552978515625, 1.663726806640625, 1.721923828125, 1.780120849609375, 1.83831787109375, 1.896514892578125, 1.9547119140625, 2.012908935546875, 2.07110595703125, 2.129302978515625, 2.1875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 6.0, 9.0, 9.0, 14.0, 19.0, 12.0, 29.0, 30.0, 40.0, 34.0, 42.0, 61.0, 62.0, 78.0, 74.0, 98.0, 75.0, 50.0, 56.0, 34.0, 32.0, 15.0, 16.0, 21.0, 16.0, 11.0, 9.0, 6.0, 4.0, 8.0, 3.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.683038711547852e-05, -7.397402077913284e-05, -7.111765444278717e-05, -6.82612881064415e-05, -6.540492177009583e-05, -6.254855543375015e-05, -5.969218909740448e-05, -5.683582276105881e-05, -5.3979456424713135e-05, -5.112309008836746e-05, -4.826672375202179e-05, -4.541035741567612e-05, -4.2553991079330444e-05, -3.969762474298477e-05, -3.68412584066391e-05, -3.3984892070293427e-05, -3.1128525733947754e-05, -2.827215939760208e-05, -2.541579306125641e-05, -2.2559426724910736e-05, -1.9703060388565063e-05, -1.684669405221939e-05, -1.3990327715873718e-05, -1.1133961379528046e-05, -8.277595043182373e-06, -5.4212287068367004e-06, -2.564862370491028e-06, 2.915039658546448e-07, 3.1478703022003174e-06, 6.00423663854599e-06, 8.860602974891663e-06, 1.1716969311237335e-05, 1.4573335647583008e-05, 1.742970198392868e-05, 2.0286068320274353e-05, 2.3142434656620026e-05, 2.5998800992965698e-05, 2.885516732931137e-05, 3.1711533665657043e-05, 3.4567900002002716e-05, 3.742426633834839e-05, 4.028063267469406e-05, 4.3136999011039734e-05, 4.5993365347385406e-05, 4.884973168373108e-05, 5.170609802007675e-05, 5.4562464356422424e-05, 5.74188306927681e-05, 6.027519702911377e-05, 6.313156336545944e-05, 6.598792970180511e-05, 6.884429603815079e-05, 7.170066237449646e-05, 7.455702871084213e-05, 7.74133950471878e-05, 8.026976138353348e-05, 8.312612771987915e-05, 8.598249405622482e-05, 8.88388603925705e-05, 9.169522672891617e-05, 9.455159306526184e-05, 9.740795940160751e-05, 0.00010026432573795319, 0.00010312069207429886, 0.00010597705841064453]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 11.0, 26.0, 35.0, 48.0, 68.0, 87.0, 127.0, 182.0, 265.0, 441.0, 590.0, 892.0, 1335.0, 1957.0, 3013.0, 4679.0, 7401.0, 11880.0, 19055.0, 31177.0, 52951.0, 87158.0, 135755.0, 180966.0, 175507.0, 127328.0, 80007.0, 48168.0, 29041.0, 17773.0, 10719.0, 6951.0, 4397.0, 2864.0, 1853.0, 1185.0, 869.0, 554.0, 448.0, 251.0, 192.0, 105.0, 64.0, 55.0, 41.0, 33.0, 26.0, 14.0, 5.0, 8.0, 1.0, 3.0], "bins": [-1.2646484375, -1.2294387817382812, -1.1942291259765625, -1.1590194702148438, -1.123809814453125, -1.0886001586914062, -1.0533905029296875, -1.0181808471679688, -0.98297119140625, -0.9477615356445312, -0.9125518798828125, -0.8773422241210938, -0.842132568359375, -0.8069229125976562, -0.7717132568359375, -0.7365036010742188, -0.7012939453125, -0.6660842895507812, -0.6308746337890625, -0.5956649780273438, -0.560455322265625, -0.5252456665039062, -0.4900360107421875, -0.45482635498046875, -0.41961669921875, -0.38440704345703125, -0.3491973876953125, -0.31398773193359375, -0.278778076171875, -0.24356842041015625, -0.2083587646484375, -0.17314910888671875, -0.137939453125, -0.10272979736328125, -0.0675201416015625, -0.03231048583984375, 0.002899169921875, 0.03810882568359375, 0.0733184814453125, 0.10852813720703125, 0.14373779296875, 0.17894744873046875, 0.2141571044921875, 0.24936676025390625, 0.284576416015625, 0.31978607177734375, 0.3549957275390625, 0.39020538330078125, 0.4254150390625, 0.46062469482421875, 0.4958343505859375, 0.5310440063476562, 0.566253662109375, 0.6014633178710938, 0.6366729736328125, 0.6718826293945312, 0.70709228515625, 0.7423019409179688, 0.7775115966796875, 0.8127212524414062, 0.847930908203125, 0.8831405639648438, 0.9183502197265625, 0.9535598754882812, 0.98876953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 4.0, 7.0, 8.0, 11.0, 18.0, 24.0, 12.0, 25.0, 28.0, 47.0, 46.0, 40.0, 62.0, 57.0, 59.0, 73.0, 65.0, 50.0, 43.0, 50.0, 33.0, 47.0, 38.0, 38.0, 24.0, 23.0, 13.0, 12.0, 11.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453857421875, -0.4390678405761719, -0.42427825927734375, -0.4094886779785156, -0.3946990966796875, -0.3799095153808594, -0.36511993408203125, -0.3503303527832031, -0.335540771484375, -0.3207511901855469, -0.30596160888671875, -0.2911720275878906, -0.2763824462890625, -0.2615928649902344, -0.24680328369140625, -0.23201370239257812, -0.21722412109375, -0.20243453979492188, -0.18764495849609375, -0.17285537719726562, -0.1580657958984375, -0.14327621459960938, -0.12848663330078125, -0.11369705200195312, -0.098907470703125, -0.08411788940429688, -0.06932830810546875, -0.054538726806640625, -0.0397491455078125, -0.024959564208984375, -0.01016998291015625, 0.004619598388671875, 0.0194091796875, 0.034198760986328125, 0.04898834228515625, 0.06377792358398438, 0.0785675048828125, 0.09335708618164062, 0.10814666748046875, 0.12293624877929688, 0.137725830078125, 0.15251541137695312, 0.16730499267578125, 0.18209457397460938, 0.1968841552734375, 0.21167373657226562, 0.22646331787109375, 0.24125289916992188, 0.25604248046875, 0.2708320617675781, 0.28562164306640625, 0.3004112243652344, 0.3152008056640625, 0.3299903869628906, 0.34477996826171875, 0.3595695495605469, 0.374359130859375, 0.3891487121582031, 0.40393829345703125, 0.4187278747558594, 0.4335174560546875, 0.4483070373535156, 0.46309661865234375, 0.4778861999511719, 0.49267578125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 1.0, 4.0, 6.0, 8.0, 10.0, 15.0, 17.0, 37.0, 44.0, 46.0, 64.0, 85.0, 77.0, 100.0, 113.0, 87.0, 59.0, 51.0, 39.0, 31.0, 21.0, 14.0, 14.0, 8.0, 7.0, 5.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.886992454528809, -11.485967636108398, -11.084942817687988, -10.683918952941895, -10.282894134521484, -9.881869316101074, -9.480844497680664, -9.07982063293457, -8.67879581451416, -8.27777099609375, -7.876746654510498, -7.475721836090088, -7.074697494506836, -6.673672676086426, -6.272647857666016, -5.871623516082764, -5.4705986976623535, -5.069573879241943, -4.668549537658691, -4.267524719238281, -3.8665003776550293, -3.465475559234619, -3.064450979232788, -2.663426399230957, -2.262401819229126, -1.861377239227295, -1.4603526592254639, -1.0593279600143433, -0.6583033800125122, -0.2572786808013916, 0.14374589920043945, 0.5447704792022705, 0.9457950592041016, 1.3468196392059326, 1.7478442192077637, 2.148869037628174, 2.549893379211426, 2.950918197631836, 3.351942777633667, 3.752967357635498, 4.15399169921875, 4.55501651763916, 4.956040859222412, 5.357065677642822, 5.758090019226074, 6.159114837646484, 6.5601396560668945, 6.9611639976501465, 7.362188816070557, 7.763213634490967, 8.164237976074219, 8.565262794494629, 8.966287612915039, 9.367311477661133, 9.768336296081543, 10.169361114501953, 10.570385932922363, 10.971410751342773, 11.372435569763184, 11.773459434509277, 12.174484252929688, 12.575509071350098, 12.976533889770508, 13.377557754516602, 13.778582572937012]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 4.0, 11.0, 10.0, 14.0, 18.0, 17.0, 27.0, 19.0, 31.0, 24.0, 32.0, 43.0, 42.0, 41.0, 43.0, 43.0, 50.0, 41.0, 50.0, 38.0, 42.0, 52.0, 42.0, 34.0, 41.0, 27.0, 21.0, 19.0, 18.0, 16.0, 11.0, 12.0, 16.0, 7.0, 10.0, 8.0, 5.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.692758083343506, -6.487729072570801, -6.282700061798096, -6.077670574188232, -5.872641563415527, -5.667612552642822, -5.462583541870117, -5.257554054260254, -5.052525043487549, -4.847496032714844, -4.642467021942139, -4.437437534332275, -4.23240852355957, -4.027379512786865, -3.82235050201416, -3.617321252822876, -3.412292242050171, -3.207263231277466, -3.0022339820861816, -2.7972049713134766, -2.5921757221221924, -2.3871467113494873, -2.182117462158203, -1.977088451385498, -1.7720593214035034, -1.5670301914215088, -1.3620010614395142, -1.1569719314575195, -0.9519428610801697, -0.7469137907028198, -0.5418846607208252, -0.33685553073883057, -0.13182640075683594, 0.0732027143239975, 0.27823182940483093, 0.4832609295845032, 0.6882900595664978, 0.8933191299438477, 1.0983482599258423, 1.303377389907837, 1.5084065198898315, 1.7134356498718262, 1.9184647798538208, 2.1234939098358154, 2.3285229206085205, 2.5335521697998047, 2.7385811805725098, 2.943610191345215, 3.148639440536499, 3.353668451309204, 3.5586977005004883, 3.7637267112731934, 3.9687559604644775, 4.173785209655762, 4.378814220428467, 4.583843231201172, 4.788872241973877, 4.993901252746582, 5.198930263519287, 5.40395975112915, 5.6089887619018555, 5.8140177726745605, 6.019046783447266, 6.224076271057129, 6.429105281829834]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 3.0, 11.0, 22.0, 28.0, 45.0, 58.0, 102.0, 193.0, 276.0, 492.0, 775.0, 1511.0, 2792.0, 5228.0, 9924.0, 20563.0, 45467.0, 105193.0, 217887.0, 283480.0, 191770.0, 88065.0, 38146.0, 17687.0, 8662.0, 4503.0, 2431.0, 1317.0, 787.0, 428.0, 295.0, 133.0, 99.0, 60.0, 39.0, 28.0, 20.0, 10.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.0711669921875, -8.751708984375, -8.4322509765625, -8.11279296875, -7.7933349609375, -7.473876953125, -7.1544189453125, -6.8349609375, -6.5155029296875, -6.196044921875, -5.8765869140625, -5.55712890625, -5.2376708984375, -4.918212890625, -4.5987548828125, -4.279296875, -3.9598388671875, -3.640380859375, -3.3209228515625, -3.00146484375, -2.6820068359375, -2.362548828125, -2.0430908203125, -1.7236328125, -1.4041748046875, -1.084716796875, -0.7652587890625, -0.44580078125, -0.1263427734375, 0.193115234375, 0.5125732421875, 0.83203125, 1.1514892578125, 1.470947265625, 1.7904052734375, 2.10986328125, 2.4293212890625, 2.748779296875, 3.0682373046875, 3.3876953125, 3.7071533203125, 4.026611328125, 4.3460693359375, 4.66552734375, 4.9849853515625, 5.304443359375, 5.6239013671875, 5.943359375, 6.2628173828125, 6.582275390625, 6.9017333984375, 7.22119140625, 7.5406494140625, 7.860107421875, 8.1795654296875, 8.4990234375, 8.8184814453125, 9.137939453125, 9.4573974609375, 9.77685546875, 10.0963134765625, 10.415771484375, 10.7352294921875, 11.0546875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 5.0, 12.0, 11.0, 15.0, 14.0, 24.0, 16.0, 24.0, 29.0, 36.0, 46.0, 31.0, 41.0, 51.0, 42.0, 50.0, 51.0, 40.0, 48.0, 43.0, 39.0, 49.0, 48.0, 34.0, 37.0, 21.0, 25.0, 10.0, 19.0, 11.0, 14.0, 15.0, 14.0, 3.0, 9.0, 1.0, 2.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.390625, -7.1602783203125, -6.929931640625, -6.6995849609375, -6.46923828125, -6.2388916015625, -6.008544921875, -5.7781982421875, -5.5478515625, -5.3175048828125, -5.087158203125, -4.8568115234375, -4.62646484375, -4.3961181640625, -4.165771484375, -3.9354248046875, -3.705078125, -3.4747314453125, -3.244384765625, -3.0140380859375, -2.78369140625, -2.5533447265625, -2.322998046875, -2.0926513671875, -1.8623046875, -1.6319580078125, -1.401611328125, -1.1712646484375, -0.94091796875, -0.7105712890625, -0.480224609375, -0.2498779296875, -0.01953125, 0.2108154296875, 0.441162109375, 0.6715087890625, 0.90185546875, 1.1322021484375, 1.362548828125, 1.5928955078125, 1.8232421875, 2.0535888671875, 2.283935546875, 2.5142822265625, 2.74462890625, 2.9749755859375, 3.205322265625, 3.4356689453125, 3.666015625, 3.8963623046875, 4.126708984375, 4.3570556640625, 4.58740234375, 4.8177490234375, 5.048095703125, 5.2784423828125, 5.5087890625, 5.7391357421875, 5.969482421875, 6.1998291015625, 6.43017578125, 6.6605224609375, 6.890869140625, 7.1212158203125, 7.3515625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 8.0, 7.0, 15.0, 31.0, 38.0, 39.0, 74.0, 90.0, 118.0, 205.0, 309.0, 420.0, 628.0, 902.0, 1330.0, 1947.0, 2933.0, 4206.0, 6453.0, 9537.0, 15009.0, 23234.0, 36270.0, 56728.0, 86297.0, 120430.0, 148615.0, 149512.0, 125178.0, 89698.0, 59289.0, 38030.0, 24302.0, 15595.0, 10252.0, 6726.0, 4573.0, 3071.0, 2056.0, 1356.0, 992.0, 651.0, 457.0, 301.0, 215.0, 131.0, 82.0, 62.0, 49.0, 40.0, 23.0, 17.0, 11.0, 8.0, 3.0, 1.0, 3.0, 2.0], "bins": [-5.87109375, -5.6934814453125, -5.515869140625, -5.3382568359375, -5.16064453125, -4.9830322265625, -4.805419921875, -4.6278076171875, -4.4501953125, -4.2725830078125, -4.094970703125, -3.9173583984375, -3.73974609375, -3.5621337890625, -3.384521484375, -3.2069091796875, -3.029296875, -2.8516845703125, -2.674072265625, -2.4964599609375, -2.31884765625, -2.1412353515625, -1.963623046875, -1.7860107421875, -1.6083984375, -1.4307861328125, -1.253173828125, -1.0755615234375, -0.89794921875, -0.7203369140625, -0.542724609375, -0.3651123046875, -0.1875, -0.0098876953125, 0.167724609375, 0.3453369140625, 0.52294921875, 0.7005615234375, 0.878173828125, 1.0557861328125, 1.2333984375, 1.4110107421875, 1.588623046875, 1.7662353515625, 1.94384765625, 2.1214599609375, 2.299072265625, 2.4766845703125, 2.654296875, 2.8319091796875, 3.009521484375, 3.1871337890625, 3.36474609375, 3.5423583984375, 3.719970703125, 3.8975830078125, 4.0751953125, 4.2528076171875, 4.430419921875, 4.6080322265625, 4.78564453125, 4.9632568359375, 5.140869140625, 5.3184814453125, 5.49609375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 5.0, 1.0, 7.0, 6.0, 9.0, 15.0, 14.0, 15.0, 20.0, 14.0, 34.0, 26.0, 20.0, 36.0, 36.0, 33.0, 26.0, 32.0, 39.0, 38.0, 47.0, 33.0, 34.0, 32.0, 31.0, 43.0, 28.0, 34.0, 42.0, 39.0, 26.0, 26.0, 27.0, 15.0, 20.0, 14.0, 17.0, 8.0, 11.0, 13.0, 12.0, 3.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.447265625, -3.33770751953125, -3.2281494140625, -3.11859130859375, -3.009033203125, -2.89947509765625, -2.7899169921875, -2.68035888671875, -2.57080078125, -2.46124267578125, -2.3516845703125, -2.24212646484375, -2.132568359375, -2.02301025390625, -1.9134521484375, -1.80389404296875, -1.6943359375, -1.58477783203125, -1.4752197265625, -1.36566162109375, -1.256103515625, -1.14654541015625, -1.0369873046875, -0.92742919921875, -0.81787109375, -0.70831298828125, -0.5987548828125, -0.48919677734375, -0.379638671875, -0.27008056640625, -0.1605224609375, -0.05096435546875, 0.05859375, 0.16815185546875, 0.2777099609375, 0.38726806640625, 0.496826171875, 0.60638427734375, 0.7159423828125, 0.82550048828125, 0.93505859375, 1.04461669921875, 1.1541748046875, 1.26373291015625, 1.373291015625, 1.48284912109375, 1.5924072265625, 1.70196533203125, 1.8115234375, 1.92108154296875, 2.0306396484375, 2.14019775390625, 2.249755859375, 2.35931396484375, 2.4688720703125, 2.57843017578125, 2.68798828125, 2.79754638671875, 2.9071044921875, 3.01666259765625, 3.126220703125, 3.23577880859375, 3.3453369140625, 3.45489501953125, 3.564453125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 4.0, 14.0, 21.0, 25.0, 32.0, 46.0, 51.0, 86.0, 135.0, 182.0, 272.0, 368.0, 561.0, 909.0, 1501.0, 2530.0, 4871.0, 9877.0, 24879.0, 74628.0, 240596.0, 402327.0, 188422.0, 57827.0, 19786.0, 8440.0, 4070.0, 2247.0, 1283.0, 821.0, 555.0, 360.0, 250.0, 164.0, 109.0, 77.0, 62.0, 38.0, 33.0, 24.0, 14.0, 10.0, 16.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0], "bins": [-8.8515625, -8.6014404296875, -8.351318359375, -8.1011962890625, -7.85107421875, -7.6009521484375, -7.350830078125, -7.1007080078125, -6.8505859375, -6.6004638671875, -6.350341796875, -6.1002197265625, -5.85009765625, -5.5999755859375, -5.349853515625, -5.0997314453125, -4.849609375, -4.5994873046875, -4.349365234375, -4.0992431640625, -3.84912109375, -3.5989990234375, -3.348876953125, -3.0987548828125, -2.8486328125, -2.5985107421875, -2.348388671875, -2.0982666015625, -1.84814453125, -1.5980224609375, -1.347900390625, -1.0977783203125, -0.84765625, -0.5975341796875, -0.347412109375, -0.0972900390625, 0.15283203125, 0.4029541015625, 0.653076171875, 0.9031982421875, 1.1533203125, 1.4034423828125, 1.653564453125, 1.9036865234375, 2.15380859375, 2.4039306640625, 2.654052734375, 2.9041748046875, 3.154296875, 3.4044189453125, 3.654541015625, 3.9046630859375, 4.15478515625, 4.4049072265625, 4.655029296875, 4.9051513671875, 5.1552734375, 5.4053955078125, 5.655517578125, 5.9056396484375, 6.15576171875, 6.4058837890625, 6.656005859375, 6.9061279296875, 7.15625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 11.0, 23.0, 33.0, 33.0, 57.0, 83.0, 113.0, 115.0, 133.0, 112.0, 75.0, 66.0, 46.0, 29.0, 16.0, 8.0, 7.0, 5.0, 8.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0008387565612792969, -0.0008166208863258362, -0.0007944852113723755, -0.0007723495364189148, -0.0007502138614654541, -0.0007280781865119934, -0.0007059425115585327, -0.000683806836605072, -0.0006616711616516113, -0.0006395354866981506, -0.0006173998117446899, -0.0005952641367912292, -0.0005731284618377686, -0.0005509927868843079, -0.0005288571119308472, -0.0005067214369773865, -0.0004845857620239258, -0.0004624500870704651, -0.0004403144121170044, -0.0004181787371635437, -0.000396043062210083, -0.0003739073872566223, -0.0003517717123031616, -0.00032963603734970093, -0.00030750036239624023, -0.00028536468744277954, -0.00026322901248931885, -0.00024109333753585815, -0.00021895766258239746, -0.00019682198762893677, -0.00017468631267547607, -0.00015255063772201538, -0.0001304149627685547, -0.000108279287815094, -8.61436128616333e-05, -6.400793790817261e-05, -4.1872262954711914e-05, -1.973658800125122e-05, 2.3990869522094727e-06, 2.4534761905670166e-05, 4.667043685913086e-05, 6.880611181259155e-05, 9.094178676605225e-05, 0.00011307746171951294, 0.00013521313667297363, 0.00015734881162643433, 0.00017948448657989502, 0.0002016201615333557, 0.0002237558364868164, 0.0002458915114402771, 0.0002680271863937378, 0.0002901628613471985, 0.0003122985363006592, 0.0003344342112541199, 0.00035656988620758057, 0.00037870556116104126, 0.00040084123611450195, 0.00042297691106796265, 0.00044511258602142334, 0.00046724826097488403, 0.0004893839359283447, 0.0005115196108818054, 0.0005336552858352661, 0.0005557909607887268, 0.0005779266357421875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 3.0, 7.0, 14.0, 12.0, 17.0, 18.0, 28.0, 50.0, 51.0, 65.0, 97.0, 113.0, 159.0, 239.0, 354.0, 548.0, 868.0, 1398.0, 2335.0, 4552.0, 9224.0, 20685.0, 49610.0, 125809.0, 266374.0, 295385.0, 158301.0, 62888.0, 25484.0, 11189.0, 5344.0, 2824.0, 1587.0, 958.0, 621.0, 380.0, 272.0, 193.0, 129.0, 87.0, 70.0, 45.0, 32.0, 32.0, 20.0, 19.0, 20.0, 17.0, 8.0, 3.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.3671875, -5.19476318359375, -5.0223388671875, -4.84991455078125, -4.677490234375, -4.50506591796875, -4.3326416015625, -4.16021728515625, -3.98779296875, -3.81536865234375, -3.6429443359375, -3.47052001953125, -3.298095703125, -3.12567138671875, -2.9532470703125, -2.78082275390625, -2.6083984375, -2.43597412109375, -2.2635498046875, -2.09112548828125, -1.918701171875, -1.74627685546875, -1.5738525390625, -1.40142822265625, -1.22900390625, -1.05657958984375, -0.8841552734375, -0.71173095703125, -0.539306640625, -0.36688232421875, -0.1944580078125, -0.02203369140625, 0.150390625, 0.32281494140625, 0.4952392578125, 0.66766357421875, 0.840087890625, 1.01251220703125, 1.1849365234375, 1.35736083984375, 1.52978515625, 1.70220947265625, 1.8746337890625, 2.04705810546875, 2.219482421875, 2.39190673828125, 2.5643310546875, 2.73675537109375, 2.9091796875, 3.08160400390625, 3.2540283203125, 3.42645263671875, 3.598876953125, 3.77130126953125, 3.9437255859375, 4.11614990234375, 4.28857421875, 4.46099853515625, 4.6334228515625, 4.80584716796875, 4.978271484375, 5.15069580078125, 5.3231201171875, 5.49554443359375, 5.66796875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 10.0, 9.0, 10.0, 14.0, 23.0, 27.0, 29.0, 33.0, 46.0, 49.0, 57.0, 51.0, 50.0, 60.0, 53.0, 62.0, 66.0, 47.0, 33.0, 52.0, 45.0, 23.0, 21.0, 28.0, 13.0, 19.0, 10.0, 16.0, 6.0, 7.0, 5.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0251388549804688, -0.9955902099609375, -0.9660415649414062, -0.936492919921875, -0.9069442749023438, -0.8773956298828125, -0.8478469848632812, -0.81829833984375, -0.7887496948242188, -0.7592010498046875, -0.7296524047851562, -0.700103759765625, -0.6705551147460938, -0.6410064697265625, -0.6114578247070312, -0.5819091796875, -0.5523605346679688, -0.5228118896484375, -0.49326324462890625, -0.463714599609375, -0.43416595458984375, -0.4046173095703125, -0.37506866455078125, -0.34552001953125, -0.31597137451171875, -0.2864227294921875, -0.25687408447265625, -0.227325439453125, -0.19777679443359375, -0.1682281494140625, -0.13867950439453125, -0.109130859375, -0.07958221435546875, -0.0500335693359375, -0.02048492431640625, 0.009063720703125, 0.03861236572265625, 0.0681610107421875, 0.09770965576171875, 0.12725830078125, 0.15680694580078125, 0.1863555908203125, 0.21590423583984375, 0.245452880859375, 0.27500152587890625, 0.3045501708984375, 0.33409881591796875, 0.3636474609375, 0.39319610595703125, 0.4227447509765625, 0.45229339599609375, 0.481842041015625, 0.5113906860351562, 0.5409393310546875, 0.5704879760742188, 0.60003662109375, 0.6295852661132812, 0.6591339111328125, 0.6886825561523438, 0.718231201171875, 0.7477798461914062, 0.7773284912109375, 0.8068771362304688, 0.83642578125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 10.0, 7.0, 15.0, 17.0, 20.0, 31.0, 34.0, 40.0, 49.0, 52.0, 67.0, 76.0, 78.0, 91.0, 83.0, 68.0, 59.0, 47.0, 29.0, 21.0, 15.0, 18.0, 7.0, 11.0, 9.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.766605377197266, -12.398869514465332, -12.031133651733398, -11.663397789001465, -11.295661926269531, -10.927926063537598, -10.560190200805664, -10.192453384399414, -9.824718475341797, -9.456982612609863, -9.08924674987793, -8.721510887145996, -8.353775024414062, -7.986039161682129, -7.618302822113037, -7.2505669593811035, -6.882830619812012, -6.515094757080078, -6.1473588943481445, -5.779623031616211, -5.411887168884277, -5.044151306152344, -4.676414966583252, -4.308679103851318, -3.9409432411193848, -3.573207378387451, -3.2054715156555176, -2.837735414505005, -2.4699995517730713, -2.1022636890411377, -1.734527587890625, -1.3667917251586914, -0.9990549087524414, -0.631318986415863, -0.26358306407928467, 0.10415291786193848, 0.47188878059387207, 0.8396246433258057, 1.2073607444763184, 1.575096607208252, 1.9428324699401855, 2.310568332672119, 2.6783041954040527, 3.0460402965545654, 3.413776159286499, 3.7815120220184326, 4.149248123168945, 4.516983985900879, 4.8847198486328125, 5.252455711364746, 5.62019157409668, 5.987927436828613, 6.355663299560547, 6.7233991622924805, 7.091135501861572, 7.458871364593506, 7.8266072273254395, 8.194343566894531, 8.562079429626465, 8.929815292358398, 9.297551155090332, 9.665287017822266, 10.0330228805542, 10.400758743286133, 10.768494606018066]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 14.0, 10.0, 18.0, 14.0, 22.0, 16.0, 19.0, 31.0, 25.0, 37.0, 38.0, 28.0, 39.0, 41.0, 41.0, 48.0, 41.0, 53.0, 40.0, 48.0, 48.0, 42.0, 37.0, 40.0, 24.0, 21.0, 25.0, 27.0, 17.0, 16.0, 16.0, 11.0, 9.0, 13.0, 5.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.657054424285889, -6.4504265785217285, -6.24379825592041, -6.03717041015625, -5.83054256439209, -5.6239142417907715, -5.417286396026611, -5.210658073425293, -5.004030227661133, -4.797402381896973, -4.590774059295654, -4.384146213531494, -4.177517890930176, -3.9708900451660156, -3.7642621994018555, -3.557634115219116, -3.351006031036377, -3.1443779468536377, -2.9377498626708984, -2.7311220169067383, -2.524493932723999, -2.3178658485412598, -2.1112380027770996, -1.9046099185943604, -1.697981834411621, -1.4913537502288818, -1.2847257852554321, -1.0780978202819824, -0.8714697360992432, -0.6648416519165039, -0.4582136869430542, -0.2515857219696045, -0.044957637786865234, 0.16167038679122925, 0.36829841136932373, 0.5749264359474182, 0.7815544605255127, 0.988182544708252, 1.1948105096817017, 1.4014384746551514, 1.6080665588378906, 1.8146946430206299, 2.021322727203369, 2.2279505729675293, 2.4345786571502686, 2.641206741333008, 2.847834587097168, 3.0544626712799072, 3.2610907554626465, 3.4677188396453857, 3.674346923828125, 3.880974769592285, 4.087602615356445, 4.294230937957764, 4.500858783721924, 4.707487106323242, 4.914114952087402, 5.1207427978515625, 5.327371120452881, 5.533998966217041, 5.740627288818359, 5.9472551345825195, 6.15388298034668, 6.36051082611084, 6.567139148712158]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 13.0, 17.0, 23.0, 32.0, 46.0, 64.0, 96.0, 127.0, 166.0, 297.0, 428.0, 639.0, 931.0, 1464.0, 2358.0, 3799.0, 6331.0, 11409.0, 23234.0, 56169.0, 181894.0, 755632.0, 1896832.0, 923910.0, 210503.0, 61378.0, 24878.0, 12418.0, 7052.0, 4243.0, 2607.0, 1719.0, 1182.0, 729.0, 541.0, 372.0, 238.0, 161.0, 92.0, 75.0, 47.0, 44.0, 29.0, 12.0, 13.0, 12.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-14.140625, -13.662353515625, -13.18408203125, -12.705810546875, -12.2275390625, -11.749267578125, -11.27099609375, -10.792724609375, -10.314453125, -9.836181640625, -9.35791015625, -8.879638671875, -8.4013671875, -7.923095703125, -7.44482421875, -6.966552734375, -6.48828125, -6.010009765625, -5.53173828125, -5.053466796875, -4.5751953125, -4.096923828125, -3.61865234375, -3.140380859375, -2.662109375, -2.183837890625, -1.70556640625, -1.227294921875, -0.7490234375, -0.270751953125, 0.20751953125, 0.685791015625, 1.1640625, 1.642333984375, 2.12060546875, 2.598876953125, 3.0771484375, 3.555419921875, 4.03369140625, 4.511962890625, 4.990234375, 5.468505859375, 5.94677734375, 6.425048828125, 6.9033203125, 7.381591796875, 7.85986328125, 8.338134765625, 8.81640625, 9.294677734375, 9.77294921875, 10.251220703125, 10.7294921875, 11.207763671875, 11.68603515625, 12.164306640625, 12.642578125, 13.120849609375, 13.59912109375, 14.077392578125, 14.5556640625, 15.033935546875, 15.51220703125, 15.990478515625, 16.46875]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 9.0, 7.0, 15.0, 18.0, 12.0, 16.0, 22.0, 30.0, 29.0, 26.0, 24.0, 34.0, 43.0, 44.0, 55.0, 51.0, 47.0, 42.0, 46.0, 47.0, 39.0, 38.0, 49.0, 34.0, 32.0, 24.0, 31.0, 25.0, 15.0, 27.0, 15.0, 13.0, 6.0, 7.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.73455810546875, -4.5628662109375, -4.39117431640625, -4.219482421875, -4.04779052734375, -3.8760986328125, -3.70440673828125, -3.53271484375, -3.36102294921875, -3.1893310546875, -3.01763916015625, -2.845947265625, -2.67425537109375, -2.5025634765625, -2.33087158203125, -2.1591796875, -1.98748779296875, -1.8157958984375, -1.64410400390625, -1.472412109375, -1.30072021484375, -1.1290283203125, -0.95733642578125, -0.78564453125, -0.61395263671875, -0.4422607421875, -0.27056884765625, -0.098876953125, 0.07281494140625, 0.2445068359375, 0.41619873046875, 0.587890625, 0.75958251953125, 0.9312744140625, 1.10296630859375, 1.274658203125, 1.44635009765625, 1.6180419921875, 1.78973388671875, 1.96142578125, 2.13311767578125, 2.3048095703125, 2.47650146484375, 2.648193359375, 2.81988525390625, 2.9915771484375, 3.16326904296875, 3.3349609375, 3.50665283203125, 3.6783447265625, 3.85003662109375, 4.021728515625, 4.19342041015625, 4.3651123046875, 4.53680419921875, 4.70849609375, 4.88018798828125, 5.0518798828125, 5.22357177734375, 5.395263671875, 5.56695556640625, 5.7386474609375, 5.91033935546875, 6.08203125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 8.0, 14.0, 23.0, 28.0, 50.0, 56.0, 81.0, 106.0, 185.0, 235.0, 391.0, 509.0, 909.0, 1401.0, 2145.0, 3558.0, 5896.0, 10092.0, 17860.0, 35015.0, 74872.0, 188767.0, 558661.0, 1423087.0, 1185673.0, 413764.0, 144223.0, 60083.0, 29089.0, 15166.0, 8616.0, 5185.0, 3044.0, 1881.0, 1229.0, 817.0, 463.0, 344.0, 245.0, 146.0, 94.0, 82.0, 48.0, 48.0, 22.0, 18.0, 17.0, 8.0, 11.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.8509521484375, -12.420654296875, -11.9903564453125, -11.56005859375, -11.1297607421875, -10.699462890625, -10.2691650390625, -9.8388671875, -9.4085693359375, -8.978271484375, -8.5479736328125, -8.11767578125, -7.6873779296875, -7.257080078125, -6.8267822265625, -6.396484375, -5.9661865234375, -5.535888671875, -5.1055908203125, -4.67529296875, -4.2449951171875, -3.814697265625, -3.3843994140625, -2.9541015625, -2.5238037109375, -2.093505859375, -1.6632080078125, -1.23291015625, -0.8026123046875, -0.372314453125, 0.0579833984375, 0.48828125, 0.9185791015625, 1.348876953125, 1.7791748046875, 2.20947265625, 2.6397705078125, 3.070068359375, 3.5003662109375, 3.9306640625, 4.3609619140625, 4.791259765625, 5.2215576171875, 5.65185546875, 6.0821533203125, 6.512451171875, 6.9427490234375, 7.373046875, 7.8033447265625, 8.233642578125, 8.6639404296875, 9.09423828125, 9.5245361328125, 9.954833984375, 10.3851318359375, 10.8154296875, 11.2457275390625, 11.676025390625, 12.1063232421875, 12.53662109375, 12.9669189453125, 13.397216796875, 13.8275146484375, 14.2578125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 9.0, 13.0, 12.0, 22.0, 29.0, 41.0, 54.0, 75.0, 116.0, 119.0, 142.0, 215.0, 273.0, 302.0, 398.0, 370.0, 390.0, 323.0, 264.0, 218.0, 151.0, 117.0, 104.0, 77.0, 38.0, 45.0, 28.0, 24.0, 25.0, 11.0, 8.0, 9.0, 12.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.220703125, -3.10845947265625, -2.9962158203125, -2.88397216796875, -2.771728515625, -2.65948486328125, -2.5472412109375, -2.43499755859375, -2.32275390625, -2.21051025390625, -2.0982666015625, -1.98602294921875, -1.873779296875, -1.76153564453125, -1.6492919921875, -1.53704833984375, -1.4248046875, -1.31256103515625, -1.2003173828125, -1.08807373046875, -0.975830078125, -0.86358642578125, -0.7513427734375, -0.63909912109375, -0.52685546875, -0.41461181640625, -0.3023681640625, -0.19012451171875, -0.077880859375, 0.03436279296875, 0.1466064453125, 0.25885009765625, 0.37109375, 0.48333740234375, 0.5955810546875, 0.70782470703125, 0.820068359375, 0.93231201171875, 1.0445556640625, 1.15679931640625, 1.26904296875, 1.38128662109375, 1.4935302734375, 1.60577392578125, 1.718017578125, 1.83026123046875, 1.9425048828125, 2.05474853515625, 2.1669921875, 2.27923583984375, 2.3914794921875, 2.50372314453125, 2.615966796875, 2.72821044921875, 2.8404541015625, 2.95269775390625, 3.06494140625, 3.17718505859375, 3.2894287109375, 3.40167236328125, 3.513916015625, 3.62615966796875, 3.7384033203125, 3.85064697265625, 3.962890625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 5.0, 3.0, 8.0, 8.0, 13.0, 13.0, 16.0, 12.0, 20.0, 25.0, 28.0, 29.0, 37.0, 71.0, 66.0, 59.0, 90.0, 79.0, 64.0, 78.0, 50.0, 43.0, 47.0, 29.0, 20.0, 20.0, 8.0, 9.0, 15.0, 6.0, 4.0, 4.0, 1.0, 0.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.491689682006836, -11.13202953338623, -10.772369384765625, -10.412710189819336, -10.05305004119873, -9.693389892578125, -9.333730697631836, -8.97407054901123, -8.614410400390625, -8.25475025177002, -7.895090579986572, -7.535430908203125, -7.1757707595825195, -6.816110610961914, -6.456450939178467, -6.0967912673950195, -5.737131118774414, -5.377470970153809, -5.017811298370361, -4.658151626586914, -4.298491477966309, -3.9388315677642822, -3.579171657562256, -3.2195117473602295, -2.859851837158203, -2.5001919269561768, -2.1405320167541504, -1.780872106552124, -1.4212121963500977, -1.0615522861480713, -0.7018923759460449, -0.34223246574401855, 0.01742839813232422, 0.3770883083343506, 0.736748218536377, 1.0964081287384033, 1.4560680389404297, 1.815727949142456, 2.1753878593444824, 2.535047769546509, 2.894707679748535, 3.2543675899505615, 3.614027500152588, 3.9736874103546143, 4.333347320556641, 4.693007469177246, 5.052667140960693, 5.412326812744141, 5.771986961364746, 6.131647109985352, 6.491306781768799, 6.850966453552246, 7.210626602172852, 7.570286750793457, 7.929946422576904, 8.289606094360352, 8.649266242980957, 9.008926391601562, 9.368585586547852, 9.728245735168457, 10.087905883789062, 10.447566032409668, 10.807226181030273, 11.166885375976562, 11.526545524597168]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 9.0, 7.0, 10.0, 13.0, 14.0, 21.0, 19.0, 23.0, 31.0, 27.0, 18.0, 34.0, 39.0, 48.0, 45.0, 36.0, 39.0, 51.0, 47.0, 49.0, 51.0, 42.0, 35.0, 40.0, 28.0, 29.0, 32.0, 16.0, 30.0, 17.0, 20.0, 18.0, 10.0, 13.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 10.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.589496612548828, -6.378467559814453, -6.16743803024292, -5.956408977508545, -5.74537992477417, -5.534350395202637, -5.323321342468262, -5.112292289733887, -4.901263236999512, -4.690234184265137, -4.4792046546936035, -4.2681756019592285, -4.0571465492248535, -3.8461172580718994, -3.6350879669189453, -3.4240589141845703, -3.213029384613037, -3.002000093460083, -2.790971040725708, -2.579941749572754, -2.368912696838379, -2.157883405685425, -1.9468541145324707, -1.7358249425888062, -1.5247957706451416, -1.313766598701477, -1.1027374267578125, -0.8917081356048584, -0.6806789636611938, -0.4696497917175293, -0.2586205005645752, -0.047591328620910645, 0.1634373664855957, 0.37446656823158264, 0.5854957699775696, 0.7965250015258789, 1.0075541734695435, 1.218583345413208, 1.429612636566162, 1.6406418085098267, 1.8516709804534912, 2.0627002716064453, 2.2737293243408203, 2.4847586154937744, 2.6957879066467285, 2.9068169593811035, 3.1178462505340576, 3.3288755416870117, 3.5399045944213867, 3.750933885574341, 3.961962938308716, 4.17299222946167, 4.384021282196045, 4.595050811767578, 4.806079864501953, 5.017108917236328, 5.228137969970703, 5.439167022705078, 5.650196552276611, 5.861225605010986, 6.072254657745361, 6.2832841873168945, 6.4943132400512695, 6.7053422927856445, 6.916371822357178]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 7.0, 2.0, 10.0, 12.0, 17.0, 20.0, 30.0, 44.0, 61.0, 85.0, 126.0, 179.0, 296.0, 465.0, 792.0, 1357.0, 2295.0, 4328.0, 8437.0, 18189.0, 41483.0, 101676.0, 241635.0, 324343.0, 175003.0, 70466.0, 29286.0, 13451.0, 6469.0, 3385.0, 1862.0, 1014.0, 591.0, 381.0, 259.0, 158.0, 110.0, 63.0, 64.0, 29.0, 20.0, 20.0, 13.0, 5.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.2783203125, -5.091796875, -4.9052734375, -4.71875, -4.5322265625, -4.345703125, -4.1591796875, -3.97265625, -3.7861328125, -3.599609375, -3.4130859375, -3.2265625, -3.0400390625, -2.853515625, -2.6669921875, -2.48046875, -2.2939453125, -2.107421875, -1.9208984375, -1.734375, -1.5478515625, -1.361328125, -1.1748046875, -0.98828125, -0.8017578125, -0.615234375, -0.4287109375, -0.2421875, -0.0556640625, 0.130859375, 0.3173828125, 0.50390625, 0.6904296875, 0.876953125, 1.0634765625, 1.25, 1.4365234375, 1.623046875, 1.8095703125, 1.99609375, 2.1826171875, 2.369140625, 2.5556640625, 2.7421875, 2.9287109375, 3.115234375, 3.3017578125, 3.48828125, 3.6748046875, 3.861328125, 4.0478515625, 4.234375, 4.4208984375, 4.607421875, 4.7939453125, 4.98046875, 5.1669921875, 5.353515625, 5.5400390625, 5.7265625, 5.9130859375, 6.099609375, 6.2861328125, 6.47265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 9.0, 9.0, 14.0, 17.0, 22.0, 27.0, 24.0, 28.0, 26.0, 32.0, 39.0, 30.0, 42.0, 41.0, 53.0, 43.0, 39.0, 64.0, 47.0, 47.0, 40.0, 38.0, 20.0, 39.0, 25.0, 25.0, 30.0, 20.0, 21.0, 19.0, 13.0, 13.0, 5.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.9296875, -7.6927490234375, -7.455810546875, -7.2188720703125, -6.98193359375, -6.7449951171875, -6.508056640625, -6.2711181640625, -6.0341796875, -5.7972412109375, -5.560302734375, -5.3233642578125, -5.08642578125, -4.8494873046875, -4.612548828125, -4.3756103515625, -4.138671875, -3.9017333984375, -3.664794921875, -3.4278564453125, -3.19091796875, -2.9539794921875, -2.717041015625, -2.4801025390625, -2.2431640625, -2.0062255859375, -1.769287109375, -1.5323486328125, -1.29541015625, -1.0584716796875, -0.821533203125, -0.5845947265625, -0.34765625, -0.1107177734375, 0.126220703125, 0.3631591796875, 0.60009765625, 0.8370361328125, 1.073974609375, 1.3109130859375, 1.5478515625, 1.7847900390625, 2.021728515625, 2.2586669921875, 2.49560546875, 2.7325439453125, 2.969482421875, 3.2064208984375, 3.443359375, 3.6802978515625, 3.917236328125, 4.1541748046875, 4.39111328125, 4.6280517578125, 4.864990234375, 5.1019287109375, 5.3388671875, 5.5758056640625, 5.812744140625, 6.0496826171875, 6.28662109375, 6.5235595703125, 6.760498046875, 6.9974365234375, 7.234375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 2.0, 8.0, 10.0, 10.0, 21.0, 31.0, 37.0, 51.0, 80.0, 88.0, 142.0, 181.0, 309.0, 461.0, 635.0, 1119.0, 1884.0, 3577.0, 7527.0, 18517.0, 53972.0, 177150.0, 411685.0, 249450.0, 76587.0, 24757.0, 9842.0, 4497.0, 2293.0, 1249.0, 778.0, 532.0, 297.0, 230.0, 152.0, 107.0, 75.0, 56.0, 34.0, 32.0, 27.0, 20.0, 9.0, 10.0, 6.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.58984375, -7.35003662109375, -7.1102294921875, -6.87042236328125, -6.630615234375, -6.39080810546875, -6.1510009765625, -5.91119384765625, -5.67138671875, -5.43157958984375, -5.1917724609375, -4.95196533203125, -4.712158203125, -4.47235107421875, -4.2325439453125, -3.99273681640625, -3.7529296875, -3.51312255859375, -3.2733154296875, -3.03350830078125, -2.793701171875, -2.55389404296875, -2.3140869140625, -2.07427978515625, -1.83447265625, -1.59466552734375, -1.3548583984375, -1.11505126953125, -0.875244140625, -0.63543701171875, -0.3956298828125, -0.15582275390625, 0.083984375, 0.32379150390625, 0.5635986328125, 0.80340576171875, 1.043212890625, 1.28302001953125, 1.5228271484375, 1.76263427734375, 2.00244140625, 2.24224853515625, 2.4820556640625, 2.72186279296875, 2.961669921875, 3.20147705078125, 3.4412841796875, 3.68109130859375, 3.9208984375, 4.16070556640625, 4.4005126953125, 4.64031982421875, 4.880126953125, 5.11993408203125, 5.3597412109375, 5.59954833984375, 5.83935546875, 6.07916259765625, 6.3189697265625, 6.55877685546875, 6.798583984375, 7.03839111328125, 7.2781982421875, 7.51800537109375, 7.7578125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 8.0, 10.0, 8.0, 20.0, 16.0, 13.0, 24.0, 21.0, 35.0, 35.0, 39.0, 44.0, 44.0, 48.0, 59.0, 62.0, 44.0, 48.0, 41.0, 40.0, 47.0, 53.0, 37.0, 37.0, 22.0, 27.0, 25.0, 16.0, 27.0, 9.0, 12.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33984375, -4.192138671875, -4.04443359375, -3.896728515625, -3.7490234375, -3.601318359375, -3.45361328125, -3.305908203125, -3.158203125, -3.010498046875, -2.86279296875, -2.715087890625, -2.5673828125, -2.419677734375, -2.27197265625, -2.124267578125, -1.9765625, -1.828857421875, -1.68115234375, -1.533447265625, -1.3857421875, -1.238037109375, -1.09033203125, -0.942626953125, -0.794921875, -0.647216796875, -0.49951171875, -0.351806640625, -0.2041015625, -0.056396484375, 0.09130859375, 0.239013671875, 0.38671875, 0.534423828125, 0.68212890625, 0.829833984375, 0.9775390625, 1.125244140625, 1.27294921875, 1.420654296875, 1.568359375, 1.716064453125, 1.86376953125, 2.011474609375, 2.1591796875, 2.306884765625, 2.45458984375, 2.602294921875, 2.75, 2.897705078125, 3.04541015625, 3.193115234375, 3.3408203125, 3.488525390625, 3.63623046875, 3.783935546875, 3.931640625, 4.079345703125, 4.22705078125, 4.374755859375, 4.5224609375, 4.670166015625, 4.81787109375, 4.965576171875, 5.11328125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 2.0, 1.0, 3.0, 11.0, 14.0, 13.0, 15.0, 21.0, 30.0, 28.0, 47.0, 67.0, 102.0, 121.0, 198.0, 259.0, 351.0, 511.0, 712.0, 979.0, 1570.0, 2345.0, 4195.0, 8351.0, 25072.0, 260932.0, 663862.0, 52918.0, 11748.0, 5229.0, 2948.0, 1837.0, 1191.0, 840.0, 564.0, 407.0, 297.0, 209.0, 133.0, 117.0, 86.0, 56.0, 47.0, 31.0, 16.0, 17.0, 10.0, 12.0, 11.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-8.625, -8.357177734375, -8.08935546875, -7.821533203125, -7.5537109375, -7.285888671875, -7.01806640625, -6.750244140625, -6.482421875, -6.214599609375, -5.94677734375, -5.678955078125, -5.4111328125, -5.143310546875, -4.87548828125, -4.607666015625, -4.33984375, -4.072021484375, -3.80419921875, -3.536376953125, -3.2685546875, -3.000732421875, -2.73291015625, -2.465087890625, -2.197265625, -1.929443359375, -1.66162109375, -1.393798828125, -1.1259765625, -0.858154296875, -0.59033203125, -0.322509765625, -0.0546875, 0.213134765625, 0.48095703125, 0.748779296875, 1.0166015625, 1.284423828125, 1.55224609375, 1.820068359375, 2.087890625, 2.355712890625, 2.62353515625, 2.891357421875, 3.1591796875, 3.427001953125, 3.69482421875, 3.962646484375, 4.23046875, 4.498291015625, 4.76611328125, 5.033935546875, 5.3017578125, 5.569580078125, 5.83740234375, 6.105224609375, 6.373046875, 6.640869140625, 6.90869140625, 7.176513671875, 7.4443359375, 7.712158203125, 7.97998046875, 8.247802734375, 8.515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 22.0, 189.0, 569.0, 151.0, 23.0, 10.0, 4.0, 0.0, 3.0, 6.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007205009460449219, -0.0006897374987602234, -0.0006589740514755249, -0.0006282106041908264, -0.0005974471569061279, -0.0005666837096214294, -0.000535920262336731, -0.0005051568150520325, -0.000474393367767334, -0.0004436299204826355, -0.000412866473197937, -0.0003821030259132385, -0.00035133957862854004, -0.00032057613134384155, -0.00028981268405914307, -0.0002590492367744446, -0.0002282857894897461, -0.0001975223422050476, -0.00016675889492034912, -0.00013599544763565063, -0.00010523200035095215, -7.446855306625366e-05, -4.3705105781555176e-05, -1.294165849685669e-05, 1.7821788787841797e-05, 4.858523607254028e-05, 7.934868335723877e-05, 0.00011011213064193726, 0.00014087557792663574, 0.00017163902521133423, 0.00020240247249603271, 0.0002331659197807312, 0.0002639293670654297, 0.0002946928143501282, 0.00032545626163482666, 0.00035621970891952515, 0.00038698315620422363, 0.0004177466034889221, 0.0004485100507736206, 0.0004792734980583191, 0.0005100369453430176, 0.0005408003926277161, 0.0005715638399124146, 0.000602327287197113, 0.0006330907344818115, 0.00066385418176651, 0.0006946176290512085, 0.000725381076335907, 0.0007561445236206055, 0.000786907970905304, 0.0008176714181900024, 0.0008484348654747009, 0.0008791983127593994, 0.0009099617600440979, 0.0009407252073287964, 0.0009714886546134949, 0.0010022521018981934, 0.0010330155491828918, 0.0010637789964675903, 0.0010945424437522888, 0.0011253058910369873, 0.0011560693383216858, 0.0011868327856063843, 0.0012175962328910828, 0.0012483596801757812]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 9.0, 7.0, 14.0, 12.0, 40.0, 34.0, 55.0, 55.0, 112.0, 135.0, 184.0, 268.0, 408.0, 633.0, 845.0, 1339.0, 2150.0, 3346.0, 5266.0, 9995.0, 34310.0, 337643.0, 560556.0, 61174.0, 12865.0, 6181.0, 3824.0, 2372.0, 1527.0, 979.0, 676.0, 476.0, 317.0, 206.0, 156.0, 104.0, 72.0, 68.0, 43.0, 31.0, 27.0, 12.0, 13.0, 4.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0], "bins": [-8.125, -7.90020751953125, -7.6754150390625, -7.45062255859375, -7.225830078125, -7.00103759765625, -6.7762451171875, -6.55145263671875, -6.32666015625, -6.10186767578125, -5.8770751953125, -5.65228271484375, -5.427490234375, -5.20269775390625, -4.9779052734375, -4.75311279296875, -4.5283203125, -4.30352783203125, -4.0787353515625, -3.85394287109375, -3.629150390625, -3.40435791015625, -3.1795654296875, -2.95477294921875, -2.72998046875, -2.50518798828125, -2.2803955078125, -2.05560302734375, -1.830810546875, -1.60601806640625, -1.3812255859375, -1.15643310546875, -0.931640625, -0.70684814453125, -0.4820556640625, -0.25726318359375, -0.032470703125, 0.19232177734375, 0.4171142578125, 0.64190673828125, 0.86669921875, 1.09149169921875, 1.3162841796875, 1.54107666015625, 1.765869140625, 1.99066162109375, 2.2154541015625, 2.44024658203125, 2.6650390625, 2.88983154296875, 3.1146240234375, 3.33941650390625, 3.564208984375, 3.78900146484375, 4.0137939453125, 4.23858642578125, 4.46337890625, 4.68817138671875, 4.9129638671875, 5.13775634765625, 5.362548828125, 5.58734130859375, 5.8121337890625, 6.03692626953125, 6.26171875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 11.0, 11.0, 10.0, 24.0, 70.0, 103.0, 205.0, 239.0, 156.0, 84.0, 33.0, 15.0, 11.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.144195556640625, -2.07550048828125, -2.006805419921875, -1.9381103515625, -1.869415283203125, -1.80072021484375, -1.732025146484375, -1.663330078125, -1.594635009765625, -1.52593994140625, -1.457244873046875, -1.3885498046875, -1.319854736328125, -1.25115966796875, -1.182464599609375, -1.11376953125, -1.045074462890625, -0.97637939453125, -0.907684326171875, -0.8389892578125, -0.770294189453125, -0.70159912109375, -0.632904052734375, -0.564208984375, -0.495513916015625, -0.42681884765625, -0.358123779296875, -0.2894287109375, -0.220733642578125, -0.15203857421875, -0.083343505859375, -0.0146484375, 0.054046630859375, 0.12274169921875, 0.191436767578125, 0.2601318359375, 0.328826904296875, 0.39752197265625, 0.466217041015625, 0.534912109375, 0.603607177734375, 0.67230224609375, 0.740997314453125, 0.8096923828125, 0.878387451171875, 0.94708251953125, 1.015777587890625, 1.08447265625, 1.153167724609375, 1.22186279296875, 1.290557861328125, 1.3592529296875, 1.427947998046875, 1.49664306640625, 1.565338134765625, 1.634033203125, 1.702728271484375, 1.77142333984375, 1.840118408203125, 1.9088134765625, 1.977508544921875, 2.04620361328125, 2.114898681640625, 2.18359375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 7.0, 15.0, 15.0, 14.0, 19.0, 21.0, 27.0, 30.0, 35.0, 49.0, 59.0, 77.0, 79.0, 87.0, 83.0, 64.0, 71.0, 53.0, 32.0, 34.0, 23.0, 17.0, 15.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.94861888885498, -11.57848072052002, -11.208342552185059, -10.838205337524414, -10.468067169189453, -10.097929000854492, -9.727790832519531, -9.35765266418457, -8.98751449584961, -8.617376327514648, -8.247238159179688, -7.877100467681885, -7.506962776184082, -7.136824607849121, -6.76668643951416, -6.396548271179199, -6.026411056518555, -5.656272888183594, -5.286135196685791, -4.91599702835083, -4.545859336853027, -4.175721168518066, -3.8055830001831055, -3.4354450702667236, -3.065307140350342, -2.69516921043396, -2.325031280517578, -1.9548931121826172, -1.5847551822662354, -1.2146172523498535, -0.8444790840148926, -0.47434115409851074, -0.1042022705078125, 0.2659357190132141, 0.6360737085342407, 1.006211757659912, 1.376349687576294, 1.7464876174926758, 2.1166257858276367, 2.4867637157440186, 2.8569016456604004, 3.2270395755767822, 3.597177505493164, 3.967315673828125, 4.337453842163086, 4.707591533660889, 5.07772970199585, 5.447867393493652, 5.818005561828613, 6.188143730163574, 6.558281421661377, 6.928419589996338, 7.298557281494141, 7.668695449829102, 8.038833618164062, 8.408971786499023, 8.779109954833984, 9.149248123168945, 9.519386291503906, 9.889524459838867, 10.259661674499512, 10.629799842834473, 10.999938011169434, 11.370076179504395, 11.740213394165039]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 7.0, 16.0, 14.0, 19.0, 13.0, 27.0, 30.0, 22.0, 32.0, 23.0, 42.0, 39.0, 37.0, 49.0, 48.0, 43.0, 41.0, 53.0, 48.0, 52.0, 39.0, 36.0, 30.0, 36.0, 24.0, 19.0, 32.0, 20.0, 18.0, 17.0, 16.0, 5.0, 8.0, 11.0, 3.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.725652694702148, -6.512574195861816, -6.299495697021484, -6.086417198181152, -5.873338222503662, -5.66025972366333, -5.447181224822998, -5.234102725982666, -5.021024227142334, -4.807945728302002, -4.59486722946167, -4.38178825378418, -4.168709754943848, -3.9556312561035156, -3.7425527572631836, -3.5294742584228516, -3.3163955211639404, -3.1033170223236084, -2.8902382850646973, -2.6771597862243652, -2.464081287384033, -2.251002788543701, -2.03792405128479, -1.824845552444458, -1.6117669343948364, -1.3986883163452148, -1.1856098175048828, -0.9725311994552612, -0.7594526410102844, -0.5463740825653076, -0.33329546451568604, -0.120216965675354, 0.09286165237426758, 0.3059402108192444, 0.5190187692642212, 0.7320973873138428, 0.9451759457588196, 1.1582545042037964, 1.371333122253418, 1.58441162109375, 1.7974902391433716, 2.010568857192993, 2.223647356033325, 2.4367260932922363, 2.6498045921325684, 2.8628830909729004, 3.0759615898132324, 3.2890400886535645, 3.5021188259124756, 3.7151973247528076, 3.9282760620117188, 4.141354560852051, 4.354433059692383, 4.567511558532715, 4.780590057373047, 4.993668556213379, 5.206747531890869, 5.419826030731201, 5.632904529571533, 5.845983505249023, 6.0590620040893555, 6.2721405029296875, 6.4852190017700195, 6.698297500610352, 6.911375999450684]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 9.0, 5.0, 9.0, 20.0, 25.0, 47.0, 63.0, 105.0, 160.0, 259.0, 418.0, 613.0, 950.0, 1544.0, 2645.0, 4416.0, 7494.0, 13376.0, 24847.0, 48985.0, 95581.0, 175267.0, 238016.0, 196659.0, 112975.0, 57861.0, 29211.0, 15540.0, 8659.0, 4978.0, 2869.0, 1749.0, 1121.0, 713.0, 429.0, 292.0, 209.0, 144.0, 95.0, 56.0, 45.0, 28.0, 25.0, 13.0, 12.0, 4.0, 4.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.359375, -9.04345703125, -8.7275390625, -8.41162109375, -8.095703125, -7.77978515625, -7.4638671875, -7.14794921875, -6.83203125, -6.51611328125, -6.2001953125, -5.88427734375, -5.568359375, -5.25244140625, -4.9365234375, -4.62060546875, -4.3046875, -3.98876953125, -3.6728515625, -3.35693359375, -3.041015625, -2.72509765625, -2.4091796875, -2.09326171875, -1.77734375, -1.46142578125, -1.1455078125, -0.82958984375, -0.513671875, -0.19775390625, 0.1181640625, 0.43408203125, 0.75, 1.06591796875, 1.3818359375, 1.69775390625, 2.013671875, 2.32958984375, 2.6455078125, 2.96142578125, 3.27734375, 3.59326171875, 3.9091796875, 4.22509765625, 4.541015625, 4.85693359375, 5.1728515625, 5.48876953125, 5.8046875, 6.12060546875, 6.4365234375, 6.75244140625, 7.068359375, 7.38427734375, 7.7001953125, 8.01611328125, 8.33203125, 8.64794921875, 8.9638671875, 9.27978515625, 9.595703125, 9.91162109375, 10.2275390625, 10.54345703125, 10.859375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 16.0, 11.0, 16.0, 17.0, 18.0, 14.0, 27.0, 34.0, 30.0, 36.0, 43.0, 45.0, 50.0, 38.0, 36.0, 56.0, 57.0, 47.0, 45.0, 41.0, 39.0, 38.0, 37.0, 31.0, 25.0, 23.0, 24.0, 16.0, 16.0, 11.0, 11.0, 6.0, 6.0, 7.0, 7.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8203125, -6.5845947265625, -6.348876953125, -6.1131591796875, -5.87744140625, -5.6417236328125, -5.406005859375, -5.1702880859375, -4.9345703125, -4.6988525390625, -4.463134765625, -4.2274169921875, -3.99169921875, -3.7559814453125, -3.520263671875, -3.2845458984375, -3.048828125, -2.8131103515625, -2.577392578125, -2.3416748046875, -2.10595703125, -1.8702392578125, -1.634521484375, -1.3988037109375, -1.1630859375, -0.9273681640625, -0.691650390625, -0.4559326171875, -0.22021484375, 0.0155029296875, 0.251220703125, 0.4869384765625, 0.72265625, 0.9583740234375, 1.194091796875, 1.4298095703125, 1.66552734375, 1.9012451171875, 2.136962890625, 2.3726806640625, 2.6083984375, 2.8441162109375, 3.079833984375, 3.3155517578125, 3.55126953125, 3.7869873046875, 4.022705078125, 4.2584228515625, 4.494140625, 4.7298583984375, 4.965576171875, 5.2012939453125, 5.43701171875, 5.6727294921875, 5.908447265625, 6.1441650390625, 6.3798828125, 6.6156005859375, 6.851318359375, 7.0870361328125, 7.32275390625, 7.5584716796875, 7.794189453125, 8.0299072265625, 8.265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 9.0, 20.0, 22.0, 53.0, 61.0, 99.0, 154.0, 207.0, 335.0, 485.0, 749.0, 1109.0, 1661.0, 2514.0, 3804.0, 5674.0, 8725.0, 13943.0, 22326.0, 36246.0, 57952.0, 90350.0, 128863.0, 158955.0, 156415.0, 124464.0, 85814.0, 54835.0, 33727.0, 21348.0, 13269.0, 8412.0, 5307.0, 3587.0, 2340.0, 1629.0, 1005.0, 670.0, 455.0, 315.0, 218.0, 161.0, 89.0, 62.0, 37.0, 30.0, 17.0, 9.0, 12.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1171875, -6.89434814453125, -6.6715087890625, -6.44866943359375, -6.225830078125, -6.00299072265625, -5.7801513671875, -5.55731201171875, -5.33447265625, -5.11163330078125, -4.8887939453125, -4.66595458984375, -4.443115234375, -4.22027587890625, -3.9974365234375, -3.77459716796875, -3.5517578125, -3.32891845703125, -3.1060791015625, -2.88323974609375, -2.660400390625, -2.43756103515625, -2.2147216796875, -1.99188232421875, -1.76904296875, -1.54620361328125, -1.3233642578125, -1.10052490234375, -0.877685546875, -0.65484619140625, -0.4320068359375, -0.20916748046875, 0.013671875, 0.23651123046875, 0.4593505859375, 0.68218994140625, 0.905029296875, 1.12786865234375, 1.3507080078125, 1.57354736328125, 1.79638671875, 2.01922607421875, 2.2420654296875, 2.46490478515625, 2.687744140625, 2.91058349609375, 3.1334228515625, 3.35626220703125, 3.5791015625, 3.80194091796875, 4.0247802734375, 4.24761962890625, 4.470458984375, 4.69329833984375, 4.9161376953125, 5.13897705078125, 5.36181640625, 5.58465576171875, 5.8074951171875, 6.03033447265625, 6.253173828125, 6.47601318359375, 6.6988525390625, 6.92169189453125, 7.14453125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 8.0, 8.0, 10.0, 22.0, 19.0, 30.0, 27.0, 29.0, 24.0, 35.0, 33.0, 44.0, 48.0, 49.0, 44.0, 31.0, 50.0, 42.0, 39.0, 55.0, 28.0, 36.0, 26.0, 40.0, 38.0, 31.0, 23.0, 20.0, 20.0, 8.0, 10.0, 14.0, 9.0, 6.0, 6.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.28125, -4.14935302734375, -4.0174560546875, -3.88555908203125, -3.753662109375, -3.62176513671875, -3.4898681640625, -3.35797119140625, -3.22607421875, -3.09417724609375, -2.9622802734375, -2.83038330078125, -2.698486328125, -2.56658935546875, -2.4346923828125, -2.30279541015625, -2.1708984375, -2.03900146484375, -1.9071044921875, -1.77520751953125, -1.643310546875, -1.51141357421875, -1.3795166015625, -1.24761962890625, -1.11572265625, -0.98382568359375, -0.8519287109375, -0.72003173828125, -0.588134765625, -0.45623779296875, -0.3243408203125, -0.19244384765625, -0.060546875, 0.07135009765625, 0.2032470703125, 0.33514404296875, 0.467041015625, 0.59893798828125, 0.7308349609375, 0.86273193359375, 0.99462890625, 1.12652587890625, 1.2584228515625, 1.39031982421875, 1.522216796875, 1.65411376953125, 1.7860107421875, 1.91790771484375, 2.0498046875, 2.18170166015625, 2.3135986328125, 2.44549560546875, 2.577392578125, 2.70928955078125, 2.8411865234375, 2.97308349609375, 3.10498046875, 3.23687744140625, 3.3687744140625, 3.50067138671875, 3.632568359375, 3.76446533203125, 3.8963623046875, 4.02825927734375, 4.16015625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 11.0, 19.0, 26.0, 35.0, 70.0, 84.0, 108.0, 161.0, 252.0, 323.0, 465.0, 694.0, 1039.0, 1597.0, 2485.0, 3919.0, 6602.0, 11237.0, 20564.0, 41359.0, 90431.0, 201356.0, 301644.0, 190950.0, 85704.0, 39675.0, 19750.0, 10830.0, 6173.0, 3826.0, 2397.0, 1529.0, 1003.0, 655.0, 471.0, 327.0, 263.0, 166.0, 99.0, 69.0, 58.0, 37.0, 29.0, 20.0, 12.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.5234375, -7.2764892578125, -7.029541015625, -6.7825927734375, -6.53564453125, -6.2886962890625, -6.041748046875, -5.7947998046875, -5.5478515625, -5.3009033203125, -5.053955078125, -4.8070068359375, -4.56005859375, -4.3131103515625, -4.066162109375, -3.8192138671875, -3.572265625, -3.3253173828125, -3.078369140625, -2.8314208984375, -2.58447265625, -2.3375244140625, -2.090576171875, -1.8436279296875, -1.5966796875, -1.3497314453125, -1.102783203125, -0.8558349609375, -0.60888671875, -0.3619384765625, -0.114990234375, 0.1319580078125, 0.37890625, 0.6258544921875, 0.872802734375, 1.1197509765625, 1.36669921875, 1.6136474609375, 1.860595703125, 2.1075439453125, 2.3544921875, 2.6014404296875, 2.848388671875, 3.0953369140625, 3.34228515625, 3.5892333984375, 3.836181640625, 4.0831298828125, 4.330078125, 4.5770263671875, 4.823974609375, 5.0709228515625, 5.31787109375, 5.5648193359375, 5.811767578125, 6.0587158203125, 6.3056640625, 6.5526123046875, 6.799560546875, 7.0465087890625, 7.29345703125, 7.5404052734375, 7.787353515625, 8.0343017578125, 8.28125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 10.0, 10.0, 12.0, 15.0, 20.0, 26.0, 54.0, 69.0, 117.0, 138.0, 137.0, 122.0, 88.0, 53.0, 32.0, 17.0, 13.0, 14.0, 8.0, 12.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013942718505859375, -0.001353532075881958, -0.0013127923011779785, -0.001272052526473999, -0.0012313127517700195, -0.00119057297706604, -0.0011498332023620605, -0.001109093427658081, -0.0010683536529541016, -0.001027613878250122, -0.0009868741035461426, -0.0009461343288421631, -0.0009053945541381836, -0.0008646547794342041, -0.0008239150047302246, -0.0007831752300262451, -0.0007424354553222656, -0.0007016956806182861, -0.0006609559059143066, -0.0006202161312103271, -0.0005794763565063477, -0.0005387365818023682, -0.0004979968070983887, -0.0004572570323944092, -0.0004165172576904297, -0.0003757774829864502, -0.0003350377082824707, -0.0002942979335784912, -0.0002535581588745117, -0.00021281838417053223, -0.00017207860946655273, -0.00013133883476257324, -9.059906005859375e-05, -4.985928535461426e-05, -9.119510650634766e-06, 3.1620264053344727e-05, 7.236003875732422e-05, 0.00011309981346130371, 0.0001538395881652832, 0.0001945793628692627, 0.0002353191375732422, 0.0002760589122772217, 0.00031679868698120117, 0.00035753846168518066, 0.00039827823638916016, 0.00043901801109313965, 0.00047975778579711914, 0.0005204975605010986, 0.0005612373352050781, 0.0006019771099090576, 0.0006427168846130371, 0.0006834566593170166, 0.0007241964340209961, 0.0007649362087249756, 0.0008056759834289551, 0.0008464157581329346, 0.0008871555328369141, 0.0009278953075408936, 0.000968635082244873, 0.0010093748569488525, 0.001050114631652832, 0.0010908544063568115, 0.001131594181060791, 0.0011723339557647705, 0.00121307373046875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 9.0, 2.0, 10.0, 17.0, 17.0, 24.0, 25.0, 37.0, 67.0, 101.0, 154.0, 227.0, 386.0, 595.0, 954.0, 1620.0, 2782.0, 5165.0, 9888.0, 21391.0, 50834.0, 128822.0, 287580.0, 299007.0, 138326.0, 54282.0, 22941.0, 10597.0, 5360.0, 2893.0, 1746.0, 1001.0, 576.0, 367.0, 259.0, 176.0, 89.0, 67.0, 50.0, 29.0, 31.0, 16.0, 8.0, 9.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.62890625, -7.38311767578125, -7.1373291015625, -6.89154052734375, -6.645751953125, -6.39996337890625, -6.1541748046875, -5.90838623046875, -5.66259765625, -5.41680908203125, -5.1710205078125, -4.92523193359375, -4.679443359375, -4.43365478515625, -4.1878662109375, -3.94207763671875, -3.6962890625, -3.45050048828125, -3.2047119140625, -2.95892333984375, -2.713134765625, -2.46734619140625, -2.2215576171875, -1.97576904296875, -1.72998046875, -1.48419189453125, -1.2384033203125, -0.99261474609375, -0.746826171875, -0.50103759765625, -0.2552490234375, -0.00946044921875, 0.236328125, 0.48211669921875, 0.7279052734375, 0.97369384765625, 1.219482421875, 1.46527099609375, 1.7110595703125, 1.95684814453125, 2.20263671875, 2.44842529296875, 2.6942138671875, 2.94000244140625, 3.185791015625, 3.43157958984375, 3.6773681640625, 3.92315673828125, 4.1689453125, 4.41473388671875, 4.6605224609375, 4.90631103515625, 5.152099609375, 5.39788818359375, 5.6436767578125, 5.88946533203125, 6.13525390625, 6.38104248046875, 6.6268310546875, 6.87261962890625, 7.118408203125, 7.36419677734375, 7.6099853515625, 7.85577392578125, 8.1015625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 6.0, 15.0, 21.0, 22.0, 28.0, 48.0, 56.0, 61.0, 75.0, 76.0, 105.0, 95.0, 92.0, 72.0, 44.0, 29.0, 49.0, 28.0, 16.0, 13.0, 12.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7564849853515625, -1.695587158203125, -1.6346893310546875, -1.57379150390625, -1.5128936767578125, -1.451995849609375, -1.3910980224609375, -1.3302001953125, -1.2693023681640625, -1.208404541015625, -1.1475067138671875, -1.08660888671875, -1.0257110595703125, -0.964813232421875, -0.9039154052734375, -0.843017578125, -0.7821197509765625, -0.721221923828125, -0.6603240966796875, -0.59942626953125, -0.5385284423828125, -0.477630615234375, -0.4167327880859375, -0.3558349609375, -0.2949371337890625, -0.234039306640625, -0.1731414794921875, -0.11224365234375, -0.0513458251953125, 0.009552001953125, 0.0704498291015625, 0.13134765625, 0.1922454833984375, 0.253143310546875, 0.3140411376953125, 0.37493896484375, 0.4358367919921875, 0.496734619140625, 0.5576324462890625, 0.6185302734375, 0.6794281005859375, 0.740325927734375, 0.8012237548828125, 0.86212158203125, 0.9230194091796875, 0.983917236328125, 1.0448150634765625, 1.105712890625, 1.1666107177734375, 1.227508544921875, 1.2884063720703125, 1.34930419921875, 1.4102020263671875, 1.471099853515625, 1.5319976806640625, 1.5928955078125, 1.6537933349609375, 1.714691162109375, 1.7755889892578125, 1.83648681640625, 1.8973846435546875, 1.958282470703125, 2.0191802978515625, 2.080078125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 3.0, 6.0, 8.0, 9.0, 13.0, 20.0, 16.0, 16.0, 31.0, 34.0, 37.0, 47.0, 47.0, 64.0, 84.0, 76.0, 78.0, 71.0, 67.0, 46.0, 54.0, 23.0, 24.0, 18.0, 18.0, 14.0, 13.0, 6.0, 11.0, 5.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.410075187683105, -10.060137748718262, -9.710200309753418, -9.360262870788574, -9.010326385498047, -8.660388946533203, -8.31045150756836, -7.960514068603516, -7.610576629638672, -7.260639190673828, -6.910701751708984, -6.560764789581299, -6.210827350616455, -5.860889911651611, -5.510952949523926, -5.161015510559082, -4.811078071594238, -4.4611406326293945, -4.111203193664551, -3.7612662315368652, -3.4113287925720215, -3.0613913536071777, -2.711454153060913, -2.3615169525146484, -2.0115795135498047, -1.6616421937942505, -1.3117048740386963, -0.9617675542831421, -0.6118302345275879, -0.2618929147720337, 0.08804440498352051, 0.43798160552978516, 0.7879199981689453, 1.1378573179244995, 1.4877946376800537, 1.837731957435608, 2.187669277191162, 2.537606716156006, 2.8875439167022705, 3.237481117248535, 3.587418556213379, 3.9373559951782227, 4.287293434143066, 4.637230396270752, 4.987167835235596, 5.3371052742004395, 5.687042236328125, 6.036979675292969, 6.3869171142578125, 6.736854553222656, 7.0867919921875, 7.4367289543151855, 7.786666393280029, 8.136603355407715, 8.486540794372559, 8.836478233337402, 9.186415672302246, 9.53635311126709, 9.886290550231934, 10.236227989196777, 10.586164474487305, 10.936101913452148, 11.286039352416992, 11.635976791381836, 11.98591423034668]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 13.0, 11.0, 12.0, 22.0, 19.0, 24.0, 29.0, 27.0, 30.0, 38.0, 54.0, 43.0, 34.0, 43.0, 41.0, 34.0, 62.0, 43.0, 40.0, 55.0, 35.0, 35.0, 44.0, 25.0, 27.0, 21.0, 21.0, 18.0, 21.0, 8.0, 10.0, 15.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.289765357971191, -6.0647687911987305, -5.8397722244262695, -5.614776134490967, -5.389779567718506, -5.164783000946045, -4.939786434173584, -4.714790344238281, -4.48979377746582, -4.264797210693359, -4.039800643920898, -3.8148043155670166, -3.5898079872131348, -3.364811420440674, -3.139814853668213, -2.914818525314331, -2.68982195854187, -2.464825391769409, -2.2398290634155273, -2.0148324966430664, -1.7898361682891846, -1.5648396015167236, -1.3398431539535522, -1.1148467063903809, -0.8898502588272095, -0.6648538112640381, -0.4398573338985443, -0.21486085653305054, 0.01013559103012085, 0.235132098197937, 0.4601285457611084, 0.6851249933242798, 0.9101214408874512, 1.1351178884506226, 1.360114336013794, 1.5851109027862549, 1.8101072311401367, 2.0351037979125977, 2.2601003646850586, 2.4850966930389404, 2.7100930213928223, 2.935089588165283, 3.160085916519165, 3.385082483291626, 3.610078811645508, 3.8350753784179688, 4.06007194519043, 4.285068511962891, 4.510065078735352, 4.7350616455078125, 4.960058212280273, 5.185054302215576, 5.410050868988037, 5.635047435760498, 5.860044002532959, 6.085040092468262, 6.310036659240723, 6.535033226013184, 6.7600297927856445, 6.985025882720947, 7.210022449493408, 7.435019016265869, 7.66001558303833, 7.885011672973633, 8.110008239746094]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 12.0, 12.0, 16.0, 32.0, 29.0, 43.0, 62.0, 83.0, 115.0, 171.0, 243.0, 353.0, 512.0, 722.0, 1090.0, 1596.0, 2241.0, 3453.0, 5493.0, 8775.0, 15236.0, 28961.0, 66039.0, 193883.0, 691573.0, 1666464.0, 1043290.0, 287048.0, 89198.0, 36660.0, 18499.0, 10915.0, 6815.0, 4499.0, 3016.0, 2073.0, 1490.0, 994.0, 774.0, 527.0, 344.0, 293.0, 199.0, 137.0, 97.0, 57.0, 49.0, 39.0, 19.0, 11.0, 7.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-14.2890625, -13.837890625, -13.38671875, -12.935546875, -12.484375, -12.033203125, -11.58203125, -11.130859375, -10.6796875, -10.228515625, -9.77734375, -9.326171875, -8.875, -8.423828125, -7.97265625, -7.521484375, -7.0703125, -6.619140625, -6.16796875, -5.716796875, -5.265625, -4.814453125, -4.36328125, -3.912109375, -3.4609375, -3.009765625, -2.55859375, -2.107421875, -1.65625, -1.205078125, -0.75390625, -0.302734375, 0.1484375, 0.599609375, 1.05078125, 1.501953125, 1.953125, 2.404296875, 2.85546875, 3.306640625, 3.7578125, 4.208984375, 4.66015625, 5.111328125, 5.5625, 6.013671875, 6.46484375, 6.916015625, 7.3671875, 7.818359375, 8.26953125, 8.720703125, 9.171875, 9.623046875, 10.07421875, 10.525390625, 10.9765625, 11.427734375, 11.87890625, 12.330078125, 12.78125, 13.232421875, 13.68359375, 14.134765625, 14.5859375]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 15.0, 8.0, 12.0, 13.0, 17.0, 23.0, 22.0, 26.0, 25.0, 37.0, 38.0, 39.0, 40.0, 38.0, 42.0, 49.0, 50.0, 51.0, 46.0, 46.0, 47.0, 35.0, 33.0, 48.0, 26.0, 30.0, 22.0, 24.0, 18.0, 11.0, 18.0, 10.0, 9.0, 10.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.00390625, -4.824462890625, -4.64501953125, -4.465576171875, -4.2861328125, -4.106689453125, -3.92724609375, -3.747802734375, -3.568359375, -3.388916015625, -3.20947265625, -3.030029296875, -2.8505859375, -2.671142578125, -2.49169921875, -2.312255859375, -2.1328125, -1.953369140625, -1.77392578125, -1.594482421875, -1.4150390625, -1.235595703125, -1.05615234375, -0.876708984375, -0.697265625, -0.517822265625, -0.33837890625, -0.158935546875, 0.0205078125, 0.199951171875, 0.37939453125, 0.558837890625, 0.73828125, 0.917724609375, 1.09716796875, 1.276611328125, 1.4560546875, 1.635498046875, 1.81494140625, 1.994384765625, 2.173828125, 2.353271484375, 2.53271484375, 2.712158203125, 2.8916015625, 3.071044921875, 3.25048828125, 3.429931640625, 3.609375, 3.788818359375, 3.96826171875, 4.147705078125, 4.3271484375, 4.506591796875, 4.68603515625, 4.865478515625, 5.044921875, 5.224365234375, 5.40380859375, 5.583251953125, 5.7626953125, 5.942138671875, 6.12158203125, 6.301025390625, 6.48046875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 0.0, 6.0, 9.0, 12.0, 18.0, 39.0, 59.0, 73.0, 89.0, 150.0, 266.0, 346.0, 620.0, 960.0, 1448.0, 2484.0, 4003.0, 6581.0, 11436.0, 20966.0, 41287.0, 91338.0, 243095.0, 740936.0, 1553758.0, 945064.0, 311708.0, 112577.0, 48908.0, 24153.0, 12932.0, 7424.0, 4372.0, 2682.0, 1604.0, 1039.0, 623.0, 440.0, 270.0, 170.0, 113.0, 69.0, 50.0, 29.0, 22.0, 28.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.359375, -14.888427734375, -14.41748046875, -13.946533203125, -13.4755859375, -13.004638671875, -12.53369140625, -12.062744140625, -11.591796875, -11.120849609375, -10.64990234375, -10.178955078125, -9.7080078125, -9.237060546875, -8.76611328125, -8.295166015625, -7.82421875, -7.353271484375, -6.88232421875, -6.411376953125, -5.9404296875, -5.469482421875, -4.99853515625, -4.527587890625, -4.056640625, -3.585693359375, -3.11474609375, -2.643798828125, -2.1728515625, -1.701904296875, -1.23095703125, -0.760009765625, -0.2890625, 0.181884765625, 0.65283203125, 1.123779296875, 1.5947265625, 2.065673828125, 2.53662109375, 3.007568359375, 3.478515625, 3.949462890625, 4.42041015625, 4.891357421875, 5.3623046875, 5.833251953125, 6.30419921875, 6.775146484375, 7.24609375, 7.717041015625, 8.18798828125, 8.658935546875, 9.1298828125, 9.600830078125, 10.07177734375, 10.542724609375, 11.013671875, 11.484619140625, 11.95556640625, 12.426513671875, 12.8974609375, 13.368408203125, 13.83935546875, 14.310302734375, 14.78125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 11.0, 6.0, 4.0, 11.0, 11.0, 17.0, 20.0, 22.0, 38.0, 54.0, 47.0, 62.0, 93.0, 113.0, 156.0, 204.0, 278.0, 303.0, 326.0, 380.0, 346.0, 325.0, 250.0, 213.0, 188.0, 136.0, 118.0, 77.0, 61.0, 46.0, 44.0, 30.0, 15.0, 16.0, 14.0, 10.0, 9.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.046875, -3.930755615234375, -3.81463623046875, -3.698516845703125, -3.5823974609375, -3.466278076171875, -3.35015869140625, -3.234039306640625, -3.117919921875, -3.001800537109375, -2.88568115234375, -2.769561767578125, -2.6534423828125, -2.537322998046875, -2.42120361328125, -2.305084228515625, -2.18896484375, -2.072845458984375, -1.95672607421875, -1.840606689453125, -1.7244873046875, -1.608367919921875, -1.49224853515625, -1.376129150390625, -1.260009765625, -1.143890380859375, -1.02777099609375, -0.911651611328125, -0.7955322265625, -0.679412841796875, -0.56329345703125, -0.447174072265625, -0.3310546875, -0.214935302734375, -0.09881591796875, 0.017303466796875, 0.1334228515625, 0.249542236328125, 0.36566162109375, 0.481781005859375, 0.597900390625, 0.714019775390625, 0.83013916015625, 0.946258544921875, 1.0623779296875, 1.178497314453125, 1.29461669921875, 1.410736083984375, 1.52685546875, 1.642974853515625, 1.75909423828125, 1.875213623046875, 1.9913330078125, 2.107452392578125, 2.22357177734375, 2.339691162109375, 2.455810546875, 2.571929931640625, 2.68804931640625, 2.804168701171875, 2.9202880859375, 3.036407470703125, 3.15252685546875, 3.268646240234375, 3.384765625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 8.0, 12.0, 10.0, 12.0, 23.0, 29.0, 39.0, 42.0, 64.0, 84.0, 101.0, 108.0, 100.0, 100.0, 71.0, 48.0, 43.0, 27.0, 17.0, 6.0, 17.0, 5.0, 5.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.42683982849121, -19.897809982299805, -19.368778228759766, -18.83974838256836, -18.310718536376953, -17.781688690185547, -17.252656936645508, -16.7236270904541, -16.194595336914062, -15.66556453704834, -15.136534690856934, -14.607503890991211, -14.078474044799805, -13.549443244934082, -13.02041244506836, -12.491382598876953, -11.962352752685547, -11.433321952819824, -10.904292106628418, -10.375261306762695, -9.846231460571289, -9.317200660705566, -8.788169860839844, -8.259140014648438, -7.730109214782715, -7.20107889175415, -6.672048568725586, -6.143017768859863, -5.613987445831299, -5.084957122802734, -4.555926322937012, -4.026895999908447, -3.49786376953125, -2.9688334465026855, -2.439802885055542, -1.910772442817688, -1.381742000579834, -0.8527116775512695, -0.323681116104126, 0.20534944534301758, 0.734379768371582, 1.263410210609436, 1.79244065284729, 2.3214712142944336, 2.850501537322998, 3.3795318603515625, 3.908562421798706, 4.43759298324585, 4.966623306274414, 5.4956536293029785, 6.024683952331543, 6.553714752197266, 7.08274507522583, 7.6117753982543945, 8.140806198120117, 8.669836044311523, 9.198866844177246, 9.727897644042969, 10.256927490234375, 10.785958290100098, 11.31498908996582, 11.844018936157227, 12.37304973602295, 12.902080535888672, 13.431110382080078]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 10.0, 12.0, 8.0, 20.0, 15.0, 19.0, 22.0, 37.0, 36.0, 33.0, 38.0, 45.0, 40.0, 36.0, 42.0, 54.0, 38.0, 50.0, 46.0, 39.0, 45.0, 45.0, 42.0, 27.0, 25.0, 30.0, 21.0, 26.0, 6.0, 20.0, 10.0, 8.0, 14.0, 6.0, 8.0, 7.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.962804794311523, -5.730165481567383, -5.497525691986084, -5.264886379241943, -5.0322465896606445, -4.799607276916504, -4.566967487335205, -4.3343281745910645, -4.101688385009766, -3.869048833847046, -3.636409282684326, -3.4037697315216064, -3.1711301803588867, -2.938490867614746, -2.7058510780334473, -2.4732117652893066, -2.240572214126587, -2.007932662963867, -1.7752931118011475, -1.5426535606384277, -1.310014009475708, -1.0773745775222778, -0.8447350263595581, -0.6120954751968384, -0.37945592403411865, -0.14681638777256012, 0.08582314848899841, 0.31846266984939575, 0.5511022210121155, 0.7837417125701904, 1.0163812637329102, 1.2490208148956299, 1.4816603660583496, 1.7142999172210693, 1.946939468383789, 2.179579019546509, 2.4122185707092285, 2.644857883453369, 2.877497673034668, 3.1101369857788086, 3.3427767753601074, 3.575416326522827, 3.808055877685547, 4.0406951904296875, 4.273334980010986, 4.505974292755127, 4.738614082336426, 4.971253395080566, 5.203892707824707, 5.436532020568848, 5.6691718101501465, 5.901811122894287, 6.134450912475586, 6.367090225219727, 6.599730014801025, 6.832369327545166, 7.065009117126465, 7.2976484298706055, 7.530288219451904, 7.762927532196045, 7.995567321777344, 8.228206634521484, 8.460845947265625, 8.693486213684082, 8.926125526428223]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 11.0, 11.0, 13.0, 32.0, 49.0, 60.0, 101.0, 142.0, 217.0, 333.0, 510.0, 718.0, 1127.0, 1817.0, 2907.0, 4524.0, 7105.0, 11868.0, 18701.0, 30847.0, 51283.0, 85739.0, 133781.0, 176830.0, 175829.0, 131316.0, 83177.0, 50188.0, 30137.0, 18538.0, 11145.0, 7025.0, 4472.0, 2889.0, 1760.0, 1157.0, 711.0, 501.0, 310.0, 217.0, 141.0, 101.0, 74.0, 49.0, 31.0, 25.0, 17.0, 6.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.79296875, -2.699798583984375, -2.60662841796875, -2.513458251953125, -2.4202880859375, -2.327117919921875, -2.23394775390625, -2.140777587890625, -2.047607421875, -1.954437255859375, -1.86126708984375, -1.768096923828125, -1.6749267578125, -1.581756591796875, -1.48858642578125, -1.395416259765625, -1.30224609375, -1.209075927734375, -1.11590576171875, -1.022735595703125, -0.9295654296875, -0.836395263671875, -0.74322509765625, -0.650054931640625, -0.556884765625, -0.463714599609375, -0.37054443359375, -0.277374267578125, -0.1842041015625, -0.091033935546875, 0.00213623046875, 0.095306396484375, 0.1884765625, 0.281646728515625, 0.37481689453125, 0.467987060546875, 0.5611572265625, 0.654327392578125, 0.74749755859375, 0.840667724609375, 0.933837890625, 1.027008056640625, 1.12017822265625, 1.213348388671875, 1.3065185546875, 1.399688720703125, 1.49285888671875, 1.586029052734375, 1.67919921875, 1.772369384765625, 1.86553955078125, 1.958709716796875, 2.0518798828125, 2.145050048828125, 2.23822021484375, 2.331390380859375, 2.424560546875, 2.517730712890625, 2.61090087890625, 2.704071044921875, 2.7972412109375, 2.890411376953125, 2.98358154296875, 3.076751708984375, 3.169921875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 0.0, 2.0, 8.0, 10.0, 13.0, 17.0, 12.0, 21.0, 23.0, 15.0, 26.0, 43.0, 40.0, 38.0, 64.0, 45.0, 31.0, 49.0, 43.0, 45.0, 37.0, 63.0, 53.0, 38.0, 28.0, 37.0, 38.0, 29.0, 22.0, 14.0, 26.0, 11.0, 13.0, 11.0, 10.0, 7.0, 9.0, 3.0, 4.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.640869140625, -6.37548828125, -6.110107421875, -5.8447265625, -5.579345703125, -5.31396484375, -5.048583984375, -4.783203125, -4.517822265625, -4.25244140625, -3.987060546875, -3.7216796875, -3.456298828125, -3.19091796875, -2.925537109375, -2.66015625, -2.394775390625, -2.12939453125, -1.864013671875, -1.5986328125, -1.333251953125, -1.06787109375, -0.802490234375, -0.537109375, -0.271728515625, -0.00634765625, 0.259033203125, 0.5244140625, 0.789794921875, 1.05517578125, 1.320556640625, 1.5859375, 1.851318359375, 2.11669921875, 2.382080078125, 2.6474609375, 2.912841796875, 3.17822265625, 3.443603515625, 3.708984375, 3.974365234375, 4.23974609375, 4.505126953125, 4.7705078125, 5.035888671875, 5.30126953125, 5.566650390625, 5.83203125, 6.097412109375, 6.36279296875, 6.628173828125, 6.8935546875, 7.158935546875, 7.42431640625, 7.689697265625, 7.955078125, 8.220458984375, 8.48583984375, 8.751220703125, 9.0166015625, 9.281982421875, 9.54736328125, 9.812744140625, 10.078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 5.0, 8.0, 17.0, 25.0, 31.0, 32.0, 86.0, 98.0, 181.0, 266.0, 343.0, 495.0, 769.0, 1325.0, 2093.0, 3425.0, 5755.0, 9812.0, 17097.0, 30585.0, 56433.0, 100837.0, 170518.0, 222068.0, 179706.0, 108664.0, 60297.0, 33052.0, 18355.0, 10467.0, 6004.0, 3542.0, 2223.0, 1391.0, 875.0, 575.0, 389.0, 227.0, 146.0, 119.0, 56.0, 53.0, 35.0, 22.0, 18.0, 14.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.59375, -3.476165771484375, -3.35858154296875, -3.240997314453125, -3.1234130859375, -3.005828857421875, -2.88824462890625, -2.770660400390625, -2.653076171875, -2.535491943359375, -2.41790771484375, -2.300323486328125, -2.1827392578125, -2.065155029296875, -1.94757080078125, -1.829986572265625, -1.71240234375, -1.594818115234375, -1.47723388671875, -1.359649658203125, -1.2420654296875, -1.124481201171875, -1.00689697265625, -0.889312744140625, -0.771728515625, -0.654144287109375, -0.53656005859375, -0.418975830078125, -0.3013916015625, -0.183807373046875, -0.06622314453125, 0.051361083984375, 0.1689453125, 0.286529541015625, 0.40411376953125, 0.521697998046875, 0.6392822265625, 0.756866455078125, 0.87445068359375, 0.992034912109375, 1.109619140625, 1.227203369140625, 1.34478759765625, 1.462371826171875, 1.5799560546875, 1.697540283203125, 1.81512451171875, 1.932708740234375, 2.05029296875, 2.167877197265625, 2.28546142578125, 2.403045654296875, 2.5206298828125, 2.638214111328125, 2.75579833984375, 2.873382568359375, 2.990966796875, 3.108551025390625, 3.22613525390625, 3.343719482421875, 3.4613037109375, 3.578887939453125, 3.69647216796875, 3.814056396484375, 3.931640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 4.0, 8.0, 12.0, 11.0, 9.0, 24.0, 17.0, 21.0, 26.0, 27.0, 28.0, 34.0, 46.0, 30.0, 30.0, 40.0, 27.0, 33.0, 37.0, 40.0, 43.0, 39.0, 32.0, 40.0, 36.0, 40.0, 26.0, 26.0, 29.0, 22.0, 21.0, 22.0, 22.0, 21.0, 12.0, 12.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.125, -4.000030517578125, -3.87506103515625, -3.750091552734375, -3.6251220703125, -3.500152587890625, -3.37518310546875, -3.250213623046875, -3.125244140625, -3.000274658203125, -2.87530517578125, -2.750335693359375, -2.6253662109375, -2.500396728515625, -2.37542724609375, -2.250457763671875, -2.12548828125, -2.000518798828125, -1.87554931640625, -1.750579833984375, -1.6256103515625, -1.500640869140625, -1.37567138671875, -1.250701904296875, -1.125732421875, -1.000762939453125, -0.87579345703125, -0.750823974609375, -0.6258544921875, -0.500885009765625, -0.37591552734375, -0.250946044921875, -0.1259765625, -0.001007080078125, 0.12396240234375, 0.248931884765625, 0.3739013671875, 0.498870849609375, 0.62384033203125, 0.748809814453125, 0.873779296875, 0.998748779296875, 1.12371826171875, 1.248687744140625, 1.3736572265625, 1.498626708984375, 1.62359619140625, 1.748565673828125, 1.87353515625, 1.998504638671875, 2.12347412109375, 2.248443603515625, 2.3734130859375, 2.498382568359375, 2.62335205078125, 2.748321533203125, 2.873291015625, 2.998260498046875, 3.12322998046875, 3.248199462890625, 3.3731689453125, 3.498138427734375, 3.62310791015625, 3.748077392578125, 3.873046875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 16.0, 15.0, 21.0, 28.0, 39.0, 65.0, 106.0, 141.0, 232.0, 440.0, 677.0, 1243.0, 2459.0, 4913.0, 10542.0, 24434.0, 62917.0, 172843.0, 368186.0, 246789.0, 90876.0, 34456.0, 13956.0, 6364.0, 3054.0, 1564.0, 911.0, 448.0, 304.0, 159.0, 119.0, 71.0, 47.0, 39.0, 23.0, 16.0, 11.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.671539306640625, -2.58721923828125, -2.502899169921875, -2.4185791015625, -2.334259033203125, -2.24993896484375, -2.165618896484375, -2.081298828125, -1.996978759765625, -1.91265869140625, -1.828338623046875, -1.7440185546875, -1.659698486328125, -1.57537841796875, -1.491058349609375, -1.40673828125, -1.322418212890625, -1.23809814453125, -1.153778076171875, -1.0694580078125, -0.985137939453125, -0.90081787109375, -0.816497802734375, -0.732177734375, -0.647857666015625, -0.56353759765625, -0.479217529296875, -0.3948974609375, -0.310577392578125, -0.22625732421875, -0.141937255859375, -0.0576171875, 0.026702880859375, 0.11102294921875, 0.195343017578125, 0.2796630859375, 0.363983154296875, 0.44830322265625, 0.532623291015625, 0.616943359375, 0.701263427734375, 0.78558349609375, 0.869903564453125, 0.9542236328125, 1.038543701171875, 1.12286376953125, 1.207183837890625, 1.29150390625, 1.375823974609375, 1.46014404296875, 1.544464111328125, 1.6287841796875, 1.713104248046875, 1.79742431640625, 1.881744384765625, 1.966064453125, 2.050384521484375, 2.13470458984375, 2.219024658203125, 2.3033447265625, 2.387664794921875, 2.47198486328125, 2.556304931640625, 2.640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 6.0, 5.0, 6.0, 4.0, 13.0, 13.0, 9.0, 13.0, 25.0, 36.0, 58.0, 49.0, 72.0, 60.0, 75.0, 71.0, 79.0, 80.0, 69.0, 46.0, 48.0, 42.0, 34.0, 21.0, 13.0, 13.0, 11.0, 6.0, 10.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.00012099742889404297, -0.00011779461055994034, -0.00011459179222583771, -0.00011138897389173508, -0.00010818615555763245, -0.00010498333722352982, -0.00010178051888942719, -9.857770055532455e-05, -9.537488222122192e-05, -9.217206388711929e-05, -8.896924555301666e-05, -8.576642721891403e-05, -8.25636088848114e-05, -7.936079055070877e-05, -7.615797221660614e-05, -7.295515388250351e-05, -6.975233554840088e-05, -6.654951721429825e-05, -6.334669888019562e-05, -6.014388054609299e-05, -5.6941062211990356e-05, -5.3738243877887726e-05, -5.0535425543785095e-05, -4.7332607209682465e-05, -4.4129788875579834e-05, -4.09269705414772e-05, -3.772415220737457e-05, -3.452133387327194e-05, -3.131851553916931e-05, -2.811569720506668e-05, -2.491287887096405e-05, -2.171006053686142e-05, -1.850724220275879e-05, -1.530442386865616e-05, -1.2101605534553528e-05, -8.898787200450897e-06, -5.695968866348267e-06, -2.493150532245636e-06, 7.096678018569946e-07, 3.912486135959625e-06, 7.115304470062256e-06, 1.0318122804164886e-05, 1.3520941138267517e-05, 1.6723759472370148e-05, 1.992657780647278e-05, 2.312939614057541e-05, 2.633221447467804e-05, 2.953503280878067e-05, 3.27378511428833e-05, 3.594066947698593e-05, 3.914348781108856e-05, 4.234630614519119e-05, 4.554912447929382e-05, 4.8751942813396454e-05, 5.1954761147499084e-05, 5.5157579481601715e-05, 5.8360397815704346e-05, 6.156321614980698e-05, 6.476603448390961e-05, 6.796885281801224e-05, 7.117167115211487e-05, 7.43744894862175e-05, 7.757730782032013e-05, 8.078012615442276e-05, 8.398294448852539e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 15.0, 17.0, 24.0, 26.0, 38.0, 79.0, 85.0, 139.0, 241.0, 342.0, 579.0, 986.0, 1545.0, 2673.0, 4802.0, 8759.0, 17015.0, 35431.0, 79728.0, 178788.0, 290031.0, 226368.0, 107185.0, 46923.0, 21704.0, 11047.0, 5784.0, 3258.0, 1892.0, 1099.0, 684.0, 436.0, 290.0, 170.0, 108.0, 78.0, 52.0, 46.0, 19.0, 12.0, 11.0, 14.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.29296875, -2.2205810546875, -2.148193359375, -2.0758056640625, -2.00341796875, -1.9310302734375, -1.858642578125, -1.7862548828125, -1.7138671875, -1.6414794921875, -1.569091796875, -1.4967041015625, -1.42431640625, -1.3519287109375, -1.279541015625, -1.2071533203125, -1.134765625, -1.0623779296875, -0.989990234375, -0.9176025390625, -0.84521484375, -0.7728271484375, -0.700439453125, -0.6280517578125, -0.5556640625, -0.4832763671875, -0.410888671875, -0.3385009765625, -0.26611328125, -0.1937255859375, -0.121337890625, -0.0489501953125, 0.0234375, 0.0958251953125, 0.168212890625, 0.2406005859375, 0.31298828125, 0.3853759765625, 0.457763671875, 0.5301513671875, 0.6025390625, 0.6749267578125, 0.747314453125, 0.8197021484375, 0.89208984375, 0.9644775390625, 1.036865234375, 1.1092529296875, 1.181640625, 1.2540283203125, 1.326416015625, 1.3988037109375, 1.47119140625, 1.5435791015625, 1.615966796875, 1.6883544921875, 1.7607421875, 1.8331298828125, 1.905517578125, 1.9779052734375, 2.05029296875, 2.1226806640625, 2.195068359375, 2.2674560546875, 2.33984375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 6.0, 8.0, 13.0, 17.0, 14.0, 23.0, 25.0, 37.0, 51.0, 58.0, 58.0, 65.0, 70.0, 67.0, 54.0, 58.0, 80.0, 47.0, 49.0, 43.0, 32.0, 27.0, 25.0, 12.0, 10.0, 11.0, 6.0, 8.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5410079956054688, -0.5229339599609375, -0.5048599243164062, -0.486785888671875, -0.46871185302734375, -0.4506378173828125, -0.43256378173828125, -0.41448974609375, -0.39641571044921875, -0.3783416748046875, -0.36026763916015625, -0.342193603515625, -0.32411956787109375, -0.3060455322265625, -0.28797149658203125, -0.2698974609375, -0.25182342529296875, -0.2337493896484375, -0.21567535400390625, -0.197601318359375, -0.17952728271484375, -0.1614532470703125, -0.14337921142578125, -0.12530517578125, -0.10723114013671875, -0.0891571044921875, -0.07108306884765625, -0.053009033203125, -0.03493499755859375, -0.0168609619140625, 0.00121307373046875, 0.019287109375, 0.03736114501953125, 0.0554351806640625, 0.07350921630859375, 0.091583251953125, 0.10965728759765625, 0.1277313232421875, 0.14580535888671875, 0.16387939453125, 0.18195343017578125, 0.2000274658203125, 0.21810150146484375, 0.236175537109375, 0.25424957275390625, 0.2723236083984375, 0.29039764404296875, 0.3084716796875, 0.32654571533203125, 0.3446197509765625, 0.36269378662109375, 0.380767822265625, 0.39884185791015625, 0.4169158935546875, 0.43498992919921875, 0.45306396484375, 0.47113800048828125, 0.4892120361328125, 0.5072860717773438, 0.525360107421875, 0.5434341430664062, 0.5615081787109375, 0.5795822143554688, 0.59765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 2.0, 7.0, 13.0, 10.0, 16.0, 22.0, 33.0, 37.0, 44.0, 68.0, 104.0, 98.0, 95.0, 114.0, 81.0, 68.0, 52.0, 34.0, 30.0, 11.0, 14.0, 8.0, 6.0, 9.0, 6.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.80108070373535, -20.27338981628418, -19.745698928833008, -19.218008041381836, -18.690317153930664, -18.162626266479492, -17.63493537902832, -17.10724449157715, -16.579553604125977, -16.051862716674805, -15.524171829223633, -14.996480941772461, -14.468790054321289, -13.941099166870117, -13.413408279418945, -12.885717391967773, -12.358026504516602, -11.83033561706543, -11.302644729614258, -10.774953842163086, -10.247262954711914, -9.719572067260742, -9.19188117980957, -8.664190292358398, -8.136499404907227, -7.608808517456055, -7.081117630004883, -6.553426742553711, -6.025735855102539, -5.498044967651367, -4.970354080200195, -4.442663192749023, -3.9149703979492188, -3.387279510498047, -2.859588623046875, -2.331897735595703, -1.8042068481445312, -1.2765159606933594, -0.7488250732421875, -0.22113418579101562, 0.30655670166015625, 0.8342475891113281, 1.3619384765625, 1.8896293640136719, 2.4173202514648438, 2.9450111389160156, 3.4727020263671875, 4.000392913818359, 4.528083801269531, 5.055774688720703, 5.583465576171875, 6.111156463623047, 6.638847351074219, 7.166538238525391, 7.6942291259765625, 8.221920013427734, 8.749610900878906, 9.277301788330078, 9.80499267578125, 10.332683563232422, 10.860374450683594, 11.388065338134766, 11.915756225585938, 12.44344711303711, 12.971138000488281]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 5.0, 9.0, 11.0, 9.0, 21.0, 17.0, 16.0, 22.0, 33.0, 39.0, 38.0, 39.0, 45.0, 35.0, 35.0, 55.0, 47.0, 40.0, 51.0, 43.0, 39.0, 45.0, 52.0, 34.0, 27.0, 27.0, 31.0, 18.0, 25.0, 7.0, 16.0, 13.0, 5.0, 16.0, 6.0, 10.0, 5.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.937016487121582, -5.702924728393555, -5.4688334465026855, -5.234741687774658, -5.000649929046631, -4.766558647155762, -4.532466888427734, -4.298375129699707, -4.06428337097168, -3.8301918506622314, -3.596100091934204, -3.362008571624756, -3.1279168128967285, -2.8938252925872803, -2.659733772277832, -2.4256420135498047, -2.1915504932403564, -1.9574588537216187, -1.7233672142028809, -1.4892756938934326, -1.2551839351654053, -1.021092414855957, -0.7870007753372192, -0.5529091358184814, -0.31881749629974365, -0.08472587168216705, 0.14936575293540955, 0.38345736265182495, 0.6175490021705627, 0.8516405820846558, 1.0857322216033936, 1.3198238611221313, 1.5539155006408691, 1.788007140159607, 2.0220987796783447, 2.256190299987793, 2.4902820587158203, 2.7243735790252686, 2.958465099334717, 3.192556858062744, 3.4266486167907715, 3.6607401371002197, 3.894831895828247, 4.128923416137695, 4.363015174865723, 4.59710693359375, 4.831198215484619, 5.0652899742126465, 5.299381256103516, 5.533473014831543, 5.767564296722412, 6.0016560554504395, 6.235747814178467, 6.469839096069336, 6.703930854797363, 6.938022613525391, 7.172114372253418, 7.406206130981445, 7.6402974128723145, 7.874389171600342, 8.108480453491211, 8.342572212219238, 8.576663970947266, 8.810755729675293, 9.04484748840332]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 11.0, 9.0, 10.0, 17.0, 27.0, 24.0, 45.0, 54.0, 87.0, 108.0, 133.0, 235.0, 357.0, 611.0, 1064.0, 1774.0, 3252.0, 6268.0, 12952.0, 28631.0, 70927.0, 179953.0, 324307.0, 242316.0, 100625.0, 39511.0, 17310.0, 8217.0, 4194.0, 2222.0, 1195.0, 704.0, 435.0, 292.0, 199.0, 130.0, 107.0, 66.0, 43.0, 37.0, 22.0, 16.0, 12.0, 11.0, 14.0, 9.0, 6.0, 2.0, 0.0, 5.0], "bins": [-17.859375, -17.37255859375, -16.8857421875, -16.39892578125, -15.912109375, -15.42529296875, -14.9384765625, -14.45166015625, -13.96484375, -13.47802734375, -12.9912109375, -12.50439453125, -12.017578125, -11.53076171875, -11.0439453125, -10.55712890625, -10.0703125, -9.58349609375, -9.0966796875, -8.60986328125, -8.123046875, -7.63623046875, -7.1494140625, -6.66259765625, -6.17578125, -5.68896484375, -5.2021484375, -4.71533203125, -4.228515625, -3.74169921875, -3.2548828125, -2.76806640625, -2.28125, -1.79443359375, -1.3076171875, -0.82080078125, -0.333984375, 0.15283203125, 0.6396484375, 1.12646484375, 1.61328125, 2.10009765625, 2.5869140625, 3.07373046875, 3.560546875, 4.04736328125, 4.5341796875, 5.02099609375, 5.5078125, 5.99462890625, 6.4814453125, 6.96826171875, 7.455078125, 7.94189453125, 8.4287109375, 8.91552734375, 9.40234375, 9.88916015625, 10.3759765625, 10.86279296875, 11.349609375, 11.83642578125, 12.3232421875, 12.81005859375, 13.296875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 5.0, 14.0, 13.0, 18.0, 19.0, 20.0, 22.0, 25.0, 32.0, 30.0, 42.0, 50.0, 49.0, 48.0, 46.0, 45.0, 49.0, 43.0, 44.0, 54.0, 45.0, 38.0, 34.0, 43.0, 32.0, 14.0, 15.0, 21.0, 22.0, 6.0, 11.0, 7.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.21771240234375, -5.9627685546875, -5.70782470703125, -5.452880859375, -5.19793701171875, -4.9429931640625, -4.68804931640625, -4.43310546875, -4.17816162109375, -3.9232177734375, -3.66827392578125, -3.413330078125, -3.15838623046875, -2.9034423828125, -2.64849853515625, -2.3935546875, -2.13861083984375, -1.8836669921875, -1.62872314453125, -1.373779296875, -1.11883544921875, -0.8638916015625, -0.60894775390625, -0.35400390625, -0.09906005859375, 0.1558837890625, 0.41082763671875, 0.665771484375, 0.92071533203125, 1.1756591796875, 1.43060302734375, 1.685546875, 1.94049072265625, 2.1954345703125, 2.45037841796875, 2.705322265625, 2.96026611328125, 3.2152099609375, 3.47015380859375, 3.72509765625, 3.98004150390625, 4.2349853515625, 4.48992919921875, 4.744873046875, 4.99981689453125, 5.2547607421875, 5.50970458984375, 5.7646484375, 6.01959228515625, 6.2745361328125, 6.52947998046875, 6.784423828125, 7.03936767578125, 7.2943115234375, 7.54925537109375, 7.80419921875, 8.05914306640625, 8.3140869140625, 8.56903076171875, 8.823974609375, 9.07891845703125, 9.3338623046875, 9.58880615234375, 9.84375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 13.0, 7.0, 13.0, 16.0, 38.0, 44.0, 52.0, 101.0, 145.0, 191.0, 246.0, 398.0, 534.0, 847.0, 1236.0, 1869.0, 2918.0, 4530.0, 6966.0, 11375.0, 18580.0, 31009.0, 52711.0, 87498.0, 134230.0, 176699.0, 174099.0, 130215.0, 83749.0, 50162.0, 29933.0, 17881.0, 10906.0, 6772.0, 4290.0, 2778.0, 1832.0, 1209.0, 776.0, 525.0, 350.0, 258.0, 184.0, 120.0, 65.0, 50.0, 40.0, 34.0, 21.0, 12.0, 12.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.81640625, -7.55548095703125, -7.2945556640625, -7.03363037109375, -6.772705078125, -6.51177978515625, -6.2508544921875, -5.98992919921875, -5.72900390625, -5.46807861328125, -5.2071533203125, -4.94622802734375, -4.685302734375, -4.42437744140625, -4.1634521484375, -3.90252685546875, -3.6416015625, -3.38067626953125, -3.1197509765625, -2.85882568359375, -2.597900390625, -2.33697509765625, -2.0760498046875, -1.81512451171875, -1.55419921875, -1.29327392578125, -1.0323486328125, -0.77142333984375, -0.510498046875, -0.24957275390625, 0.0113525390625, 0.27227783203125, 0.533203125, 0.79412841796875, 1.0550537109375, 1.31597900390625, 1.576904296875, 1.83782958984375, 2.0987548828125, 2.35968017578125, 2.62060546875, 2.88153076171875, 3.1424560546875, 3.40338134765625, 3.664306640625, 3.92523193359375, 4.1861572265625, 4.44708251953125, 4.7080078125, 4.96893310546875, 5.2298583984375, 5.49078369140625, 5.751708984375, 6.01263427734375, 6.2735595703125, 6.53448486328125, 6.79541015625, 7.05633544921875, 7.3172607421875, 7.57818603515625, 7.839111328125, 8.10003662109375, 8.3609619140625, 8.62188720703125, 8.8828125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 6.0, 8.0, 13.0, 16.0, 16.0, 16.0, 22.0, 20.0, 28.0, 23.0, 31.0, 48.0, 47.0, 38.0, 43.0, 45.0, 46.0, 38.0, 51.0, 42.0, 42.0, 35.0, 37.0, 33.0, 33.0, 37.0, 24.0, 19.0, 20.0, 22.0, 16.0, 17.0, 20.0, 7.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4765625, -4.335205078125, -4.19384765625, -4.052490234375, -3.9111328125, -3.769775390625, -3.62841796875, -3.487060546875, -3.345703125, -3.204345703125, -3.06298828125, -2.921630859375, -2.7802734375, -2.638916015625, -2.49755859375, -2.356201171875, -2.21484375, -2.073486328125, -1.93212890625, -1.790771484375, -1.6494140625, -1.508056640625, -1.36669921875, -1.225341796875, -1.083984375, -0.942626953125, -0.80126953125, -0.659912109375, -0.5185546875, -0.377197265625, -0.23583984375, -0.094482421875, 0.046875, 0.188232421875, 0.32958984375, 0.470947265625, 0.6123046875, 0.753662109375, 0.89501953125, 1.036376953125, 1.177734375, 1.319091796875, 1.46044921875, 1.601806640625, 1.7431640625, 1.884521484375, 2.02587890625, 2.167236328125, 2.30859375, 2.449951171875, 2.59130859375, 2.732666015625, 2.8740234375, 3.015380859375, 3.15673828125, 3.298095703125, 3.439453125, 3.580810546875, 3.72216796875, 3.863525390625, 4.0048828125, 4.146240234375, 4.28759765625, 4.428955078125, 4.5703125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 10.0, 9.0, 16.0, 18.0, 35.0, 44.0, 51.0, 73.0, 83.0, 114.0, 178.0, 261.0, 342.0, 515.0, 769.0, 1211.0, 1914.0, 3216.0, 5829.0, 11494.0, 24379.0, 58145.0, 153820.0, 338384.0, 265839.0, 103274.0, 40149.0, 17780.0, 8681.0, 4575.0, 2567.0, 1579.0, 985.0, 643.0, 445.0, 315.0, 234.0, 153.0, 126.0, 94.0, 51.0, 45.0, 36.0, 17.0, 16.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-8.6015625, -8.322265625, -8.04296875, -7.763671875, -7.484375, -7.205078125, -6.92578125, -6.646484375, -6.3671875, -6.087890625, -5.80859375, -5.529296875, -5.25, -4.970703125, -4.69140625, -4.412109375, -4.1328125, -3.853515625, -3.57421875, -3.294921875, -3.015625, -2.736328125, -2.45703125, -2.177734375, -1.8984375, -1.619140625, -1.33984375, -1.060546875, -0.78125, -0.501953125, -0.22265625, 0.056640625, 0.3359375, 0.615234375, 0.89453125, 1.173828125, 1.453125, 1.732421875, 2.01171875, 2.291015625, 2.5703125, 2.849609375, 3.12890625, 3.408203125, 3.6875, 3.966796875, 4.24609375, 4.525390625, 4.8046875, 5.083984375, 5.36328125, 5.642578125, 5.921875, 6.201171875, 6.48046875, 6.759765625, 7.0390625, 7.318359375, 7.59765625, 7.876953125, 8.15625, 8.435546875, 8.71484375, 8.994140625, 9.2734375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 7.0, 10.0, 27.0, 30.0, 40.0, 60.0, 80.0, 106.0, 134.0, 133.0, 126.0, 73.0, 54.0, 25.0, 27.0, 27.0, 12.0, 9.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005993843078613281, -0.0005640164017677307, -0.0005286484956741333, -0.0004932805895805359, -0.0004579126834869385, -0.00042254477739334106, -0.00038717687129974365, -0.00035180896520614624, -0.00031644105911254883, -0.0002810731530189514, -0.000245705246925354, -0.0002103373408317566, -0.00017496943473815918, -0.00013960152864456177, -0.00010423362255096436, -6.886571645736694e-05, -3.349781036376953e-05, 1.8700957298278809e-06, 3.723800182342529e-05, 7.26059079170227e-05, 0.00010797381401062012, 0.00014334172010421753, 0.00017870962619781494, 0.00021407753229141235, 0.00024944543838500977, 0.0002848133444786072, 0.0003201812505722046, 0.000355549156665802, 0.0003909170627593994, 0.0004262849688529968, 0.00046165287494659424, 0.0004970207810401917, 0.0005323886871337891, 0.0005677565932273865, 0.0006031244993209839, 0.0006384924054145813, 0.0006738603115081787, 0.0007092282176017761, 0.0007445961236953735, 0.000779964029788971, 0.0008153319358825684, 0.0008506998419761658, 0.0008860677480697632, 0.0009214356541633606, 0.000956803560256958, 0.0009921714663505554, 0.0010275393724441528, 0.0010629072785377502, 0.0010982751846313477, 0.001133643090724945, 0.0011690109968185425, 0.00120437890291214, 0.0012397468090057373, 0.0012751147150993347, 0.0013104826211929321, 0.0013458505272865295, 0.001381218433380127, 0.0014165863394737244, 0.0014519542455673218, 0.0014873221516609192, 0.0015226900577545166, 0.001558057963848114, 0.0015934258699417114, 0.0016287937760353088, 0.0016641616821289062]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 7.0, 10.0, 9.0, 12.0, 13.0, 25.0, 27.0, 58.0, 66.0, 71.0, 118.0, 132.0, 190.0, 328.0, 435.0, 548.0, 859.0, 1370.0, 2410.0, 4476.0, 9733.0, 27191.0, 96521.0, 359731.0, 385439.0, 107186.0, 29529.0, 10495.0, 4585.0, 2469.0, 1477.0, 944.0, 619.0, 398.0, 322.0, 182.0, 165.0, 136.0, 64.0, 48.0, 40.0, 29.0, 31.0, 19.0, 9.0, 8.0, 10.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.8203125, -11.4625244140625, -11.104736328125, -10.7469482421875, -10.38916015625, -10.0313720703125, -9.673583984375, -9.3157958984375, -8.9580078125, -8.6002197265625, -8.242431640625, -7.8846435546875, -7.52685546875, -7.1690673828125, -6.811279296875, -6.4534912109375, -6.095703125, -5.7379150390625, -5.380126953125, -5.0223388671875, -4.66455078125, -4.3067626953125, -3.948974609375, -3.5911865234375, -3.2333984375, -2.8756103515625, -2.517822265625, -2.1600341796875, -1.80224609375, -1.4444580078125, -1.086669921875, -0.7288818359375, -0.37109375, -0.0133056640625, 0.344482421875, 0.7022705078125, 1.06005859375, 1.4178466796875, 1.775634765625, 2.1334228515625, 2.4912109375, 2.8489990234375, 3.206787109375, 3.5645751953125, 3.92236328125, 4.2801513671875, 4.637939453125, 4.9957275390625, 5.353515625, 5.7113037109375, 6.069091796875, 6.4268798828125, 6.78466796875, 7.1424560546875, 7.500244140625, 7.8580322265625, 8.2158203125, 8.5736083984375, 8.931396484375, 9.2891845703125, 9.64697265625, 10.0047607421875, 10.362548828125, 10.7203369140625, 11.078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 16.0, 14.0, 22.0, 40.0, 43.0, 77.0, 69.0, 88.0, 89.0, 93.0, 100.0, 65.0, 51.0, 53.0, 30.0, 31.0, 20.0, 14.0, 16.0, 7.0, 8.0, 8.0, 1.0, 0.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.109375, -2.045440673828125, -1.98150634765625, -1.917572021484375, -1.8536376953125, -1.789703369140625, -1.72576904296875, -1.661834716796875, -1.597900390625, -1.533966064453125, -1.47003173828125, -1.406097412109375, -1.3421630859375, -1.278228759765625, -1.21429443359375, -1.150360107421875, -1.08642578125, -1.022491455078125, -0.95855712890625, -0.894622802734375, -0.8306884765625, -0.766754150390625, -0.70281982421875, -0.638885498046875, -0.574951171875, -0.511016845703125, -0.44708251953125, -0.383148193359375, -0.3192138671875, -0.255279541015625, -0.19134521484375, -0.127410888671875, -0.0634765625, 0.000457763671875, 0.06439208984375, 0.128326416015625, 0.1922607421875, 0.256195068359375, 0.32012939453125, 0.384063720703125, 0.447998046875, 0.511932373046875, 0.57586669921875, 0.639801025390625, 0.7037353515625, 0.767669677734375, 0.83160400390625, 0.895538330078125, 0.95947265625, 1.023406982421875, 1.08734130859375, 1.151275634765625, 1.2152099609375, 1.279144287109375, 1.34307861328125, 1.407012939453125, 1.470947265625, 1.534881591796875, 1.59881591796875, 1.662750244140625, 1.7266845703125, 1.790618896484375, 1.85455322265625, 1.918487548828125, 1.982421875]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 5.0, 6.0, 11.0, 7.0, 17.0, 22.0, 21.0, 31.0, 41.0, 61.0, 71.0, 72.0, 95.0, 100.0, 83.0, 83.0, 59.0, 59.0, 32.0, 31.0, 18.0, 14.0, 8.0, 6.0, 4.0, 3.0, 8.0, 7.0, 5.0, 2.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.568994522094727, -17.1079158782959, -16.646839141845703, -16.185760498046875, -15.724681854248047, -15.263603210449219, -14.802525520324707, -14.341447830200195, -13.880369186401367, -13.419290542602539, -12.958212852478027, -12.497135162353516, -12.036056518554688, -11.57497787475586, -11.113900184631348, -10.652822494506836, -10.191743850708008, -9.73066520690918, -9.269587516784668, -8.808509826660156, -8.347431182861328, -7.886353015899658, -7.425274848937988, -6.964196681976318, -6.503118515014648, -6.0420403480529785, -5.580962181091309, -5.119884014129639, -4.658805847167969, -4.197727680206299, -3.736649513244629, -3.275571346282959, -2.8144941329956055, -2.3534159660339355, -1.8923377990722656, -1.4312596321105957, -0.9701814651489258, -0.5091032981872559, -0.04802513122558594, 0.413053035736084, 0.8741312026977539, 1.3352093696594238, 1.7962875366210938, 2.2573657035827637, 2.7184438705444336, 3.1795220375061035, 3.6406002044677734, 4.101678371429443, 4.562756538391113, 5.023834705352783, 5.484912872314453, 5.945991039276123, 6.407069206237793, 6.868147373199463, 7.329225540161133, 7.790303707122803, 8.251381874084473, 8.712459564208984, 9.173538208007812, 9.63461685180664, 10.095694541931152, 10.556772232055664, 11.017850875854492, 11.47892951965332, 11.940007209777832]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 4.0, 7.0, 8.0, 12.0, 14.0, 9.0, 15.0, 19.0, 13.0, 26.0, 30.0, 24.0, 22.0, 37.0, 37.0, 34.0, 34.0, 47.0, 42.0, 42.0, 51.0, 25.0, 40.0, 43.0, 38.0, 42.0, 34.0, 31.0, 25.0, 29.0, 26.0, 28.0, 14.0, 11.0, 19.0, 14.0, 13.0, 8.0, 8.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.356032371520996, -6.140588760375977, -5.925145149230957, -5.7097015380859375, -5.494257926940918, -5.278814315795898, -5.063370227813721, -4.847926616668701, -4.632483005523682, -4.417039394378662, -4.201595783233643, -3.986151933670044, -3.7707083225250244, -3.555264711380005, -3.3398208618164062, -3.1243772506713867, -2.908933639526367, -2.6934900283813477, -2.478046417236328, -2.2626025676727295, -2.04715895652771, -1.8317153453826904, -1.6162716150283813, -1.4008278846740723, -1.1853842735290527, -0.9699406027793884, -0.7544969320297241, -0.5390532612800598, -0.3236095905303955, -0.10816597938537598, 0.1072777509689331, 0.3227214813232422, 0.5381655693054199, 0.7536092400550842, 0.9690529108047485, 1.1844966411590576, 1.3999402523040771, 1.6153838634490967, 1.8308275938034058, 2.046271324157715, 2.2617149353027344, 2.477158546447754, 2.6926021575927734, 2.908046007156372, 3.1234896183013916, 3.338933229446411, 3.5543770790100098, 3.7698206901550293, 3.985264301300049, 4.200707912445068, 4.416151523590088, 4.631595134735107, 4.847039222717285, 5.062482833862305, 5.277926445007324, 5.493370056152344, 5.708813667297363, 5.924257278442383, 6.139700889587402, 6.355144500732422, 6.570588111877441, 6.786031723022461, 7.001475811004639, 7.216919422149658, 7.432363033294678]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 7.0, 6.0, 11.0, 13.0, 28.0, 35.0, 45.0, 70.0, 95.0, 143.0, 191.0, 232.0, 366.0, 552.0, 837.0, 1153.0, 1767.0, 2827.0, 4471.0, 7926.0, 14437.0, 30283.0, 76994.0, 238904.0, 818973.0, 1646066.0, 922064.0, 267452.0, 85237.0, 33872.0, 16212.0, 8609.0, 5099.0, 3151.0, 2025.0, 1311.0, 940.0, 597.0, 357.0, 266.0, 203.0, 124.0, 104.0, 75.0, 48.0, 36.0, 31.0, 17.0, 10.0, 7.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.3984375, -13.9112548828125, -13.424072265625, -12.9368896484375, -12.44970703125, -11.9625244140625, -11.475341796875, -10.9881591796875, -10.5009765625, -10.0137939453125, -9.526611328125, -9.0394287109375, -8.55224609375, -8.0650634765625, -7.577880859375, -7.0906982421875, -6.603515625, -6.1163330078125, -5.629150390625, -5.1419677734375, -4.65478515625, -4.1676025390625, -3.680419921875, -3.1932373046875, -2.7060546875, -2.2188720703125, -1.731689453125, -1.2445068359375, -0.75732421875, -0.2701416015625, 0.217041015625, 0.7042236328125, 1.19140625, 1.6785888671875, 2.165771484375, 2.6529541015625, 3.14013671875, 3.6273193359375, 4.114501953125, 4.6016845703125, 5.0888671875, 5.5760498046875, 6.063232421875, 6.5504150390625, 7.03759765625, 7.5247802734375, 8.011962890625, 8.4991455078125, 8.986328125, 9.4735107421875, 9.960693359375, 10.4478759765625, 10.93505859375, 11.4222412109375, 11.909423828125, 12.3966064453125, 12.8837890625, 13.3709716796875, 13.858154296875, 14.3453369140625, 14.83251953125, 15.3197021484375, 15.806884765625, 16.2940673828125, 16.78125]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 4.0, 3.0, 5.0, 10.0, 10.0, 12.0, 10.0, 14.0, 18.0, 24.0, 28.0, 20.0, 20.0, 21.0, 32.0, 37.0, 43.0, 37.0, 50.0, 36.0, 40.0, 51.0, 37.0, 39.0, 50.0, 32.0, 35.0, 45.0, 31.0, 20.0, 34.0, 25.0, 18.0, 17.0, 14.0, 14.0, 19.0, 11.0, 10.0, 5.0, 8.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.33203125, -5.16217041015625, -4.9923095703125, -4.82244873046875, -4.652587890625, -4.48272705078125, -4.3128662109375, -4.14300537109375, -3.97314453125, -3.80328369140625, -3.6334228515625, -3.46356201171875, -3.293701171875, -3.12384033203125, -2.9539794921875, -2.78411865234375, -2.6142578125, -2.44439697265625, -2.2745361328125, -2.10467529296875, -1.934814453125, -1.76495361328125, -1.5950927734375, -1.42523193359375, -1.25537109375, -1.08551025390625, -0.9156494140625, -0.74578857421875, -0.575927734375, -0.40606689453125, -0.2362060546875, -0.06634521484375, 0.103515625, 0.27337646484375, 0.4432373046875, 0.61309814453125, 0.782958984375, 0.95281982421875, 1.1226806640625, 1.29254150390625, 1.46240234375, 1.63226318359375, 1.8021240234375, 1.97198486328125, 2.141845703125, 2.31170654296875, 2.4815673828125, 2.65142822265625, 2.8212890625, 2.99114990234375, 3.1610107421875, 3.33087158203125, 3.500732421875, 3.67059326171875, 3.8404541015625, 4.01031494140625, 4.18017578125, 4.35003662109375, 4.5198974609375, 4.68975830078125, 4.859619140625, 5.02947998046875, 5.1993408203125, 5.36920166015625, 5.5390625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 6.0, 9.0, 13.0, 17.0, 26.0, 38.0, 57.0, 78.0, 117.0, 186.0, 292.0, 388.0, 537.0, 794.0, 1145.0, 1669.0, 2507.0, 3722.0, 5647.0, 8855.0, 13888.0, 23814.0, 42211.0, 80304.0, 165807.0, 368606.0, 783440.0, 1133589.0, 806814.0, 383455.0, 173822.0, 83359.0, 43570.0, 24479.0, 14548.0, 8907.0, 5788.0, 3878.0, 2553.0, 1695.0, 1147.0, 767.0, 536.0, 365.0, 261.0, 163.0, 130.0, 99.0, 57.0, 47.0, 34.0, 15.0, 13.0, 11.0, 6.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0], "bins": [-11.3203125, -10.949462890625, -10.57861328125, -10.207763671875, -9.8369140625, -9.466064453125, -9.09521484375, -8.724365234375, -8.353515625, -7.982666015625, -7.61181640625, -7.240966796875, -6.8701171875, -6.499267578125, -6.12841796875, -5.757568359375, -5.38671875, -5.015869140625, -4.64501953125, -4.274169921875, -3.9033203125, -3.532470703125, -3.16162109375, -2.790771484375, -2.419921875, -2.049072265625, -1.67822265625, -1.307373046875, -0.9365234375, -0.565673828125, -0.19482421875, 0.176025390625, 0.546875, 0.917724609375, 1.28857421875, 1.659423828125, 2.0302734375, 2.401123046875, 2.77197265625, 3.142822265625, 3.513671875, 3.884521484375, 4.25537109375, 4.626220703125, 4.9970703125, 5.367919921875, 5.73876953125, 6.109619140625, 6.48046875, 6.851318359375, 7.22216796875, 7.593017578125, 7.9638671875, 8.334716796875, 8.70556640625, 9.076416015625, 9.447265625, 9.818115234375, 10.18896484375, 10.559814453125, 10.9306640625, 11.301513671875, 11.67236328125, 12.043212890625, 12.4140625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 5.0, 7.0, 16.0, 13.0, 18.0, 26.0, 35.0, 35.0, 51.0, 60.0, 79.0, 101.0, 117.0, 175.0, 254.0, 257.0, 315.0, 337.0, 357.0, 308.0, 250.0, 268.0, 244.0, 157.0, 152.0, 100.0, 76.0, 61.0, 48.0, 30.0, 30.0, 18.0, 19.0, 17.0, 6.0, 11.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.11328125, -3.991424560546875, -3.86956787109375, -3.747711181640625, -3.6258544921875, -3.503997802734375, -3.38214111328125, -3.260284423828125, -3.138427734375, -3.016571044921875, -2.89471435546875, -2.772857666015625, -2.6510009765625, -2.529144287109375, -2.40728759765625, -2.285430908203125, -2.16357421875, -2.041717529296875, -1.91986083984375, -1.798004150390625, -1.6761474609375, -1.554290771484375, -1.43243408203125, -1.310577392578125, -1.188720703125, -1.066864013671875, -0.94500732421875, -0.823150634765625, -0.7012939453125, -0.579437255859375, -0.45758056640625, -0.335723876953125, -0.2138671875, -0.092010498046875, 0.02984619140625, 0.151702880859375, 0.2735595703125, 0.395416259765625, 0.51727294921875, 0.639129638671875, 0.760986328125, 0.882843017578125, 1.00469970703125, 1.126556396484375, 1.2484130859375, 1.370269775390625, 1.49212646484375, 1.613983154296875, 1.73583984375, 1.857696533203125, 1.97955322265625, 2.101409912109375, 2.2232666015625, 2.345123291015625, 2.46697998046875, 2.588836669921875, 2.710693359375, 2.832550048828125, 2.95440673828125, 3.076263427734375, 3.1981201171875, 3.319976806640625, 3.44183349609375, 3.563690185546875, 3.685546875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 9.0, 11.0, 24.0, 29.0, 34.0, 47.0, 58.0, 69.0, 93.0, 83.0, 111.0, 75.0, 77.0, 60.0, 48.0, 33.0, 21.0, 20.0, 18.0, 7.0, 7.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.337761878967285, -11.842564582824707, -11.347367286682129, -10.85216999053955, -10.356972694396973, -9.861775398254395, -9.3665771484375, -8.871379852294922, -8.376182556152344, -7.880985260009766, -7.3857879638671875, -6.890590667724609, -6.395393371582031, -5.900196075439453, -5.404998302459717, -4.909801006317139, -4.414604187011719, -3.9194068908691406, -3.4242095947265625, -2.9290120601654053, -2.433814764022827, -1.938617467880249, -1.4434199333190918, -0.9482226371765137, -0.45302534103393555, 0.042172014713287354, 0.5373693704605103, 1.032566785812378, 1.527764081954956, 2.022961378097534, 2.5181589126586914, 3.0133562088012695, 3.5085525512695312, 4.003749847412109, 4.4989471435546875, 4.994144439697266, 5.489341735839844, 5.984539031982422, 6.479736804962158, 6.974934101104736, 7.4701313972473145, 7.965328693389893, 8.460526466369629, 8.955723762512207, 9.450921058654785, 9.946118354797363, 10.441315650939941, 10.93651294708252, 11.431710243225098, 11.926907539367676, 12.422104835510254, 12.917302131652832, 13.41249942779541, 13.907696723937988, 14.402894973754883, 14.898092269897461, 15.393289566040039, 15.888486862182617, 16.383684158325195, 16.878881454467773, 17.37407875061035, 17.86927604675293, 18.364473342895508, 18.859670639038086, 19.354867935180664]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 11.0, 8.0, 9.0, 10.0, 13.0, 13.0, 18.0, 12.0, 25.0, 20.0, 22.0, 29.0, 33.0, 31.0, 23.0, 34.0, 37.0, 40.0, 48.0, 39.0, 29.0, 39.0, 41.0, 45.0, 38.0, 31.0, 35.0, 26.0, 36.0, 31.0, 27.0, 25.0, 21.0, 21.0, 15.0, 11.0, 6.0, 11.0, 7.0, 7.0, 4.0, 3.0, 5.0, 3.0, 4.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.325138568878174, -7.107594966888428, -6.89005184173584, -6.672508239746094, -6.454965114593506, -6.23742151260376, -6.019878387451172, -5.802334785461426, -5.58479118347168, -5.367247581481934, -5.149704456329346, -4.9321608543396, -4.714617729187012, -4.497074127197266, -4.2795305252075195, -4.061987400054932, -3.8444442749023438, -3.6269009113311768, -3.4093575477600098, -3.1918139457702637, -2.974270820617676, -2.7567272186279297, -2.5391838550567627, -2.3216404914855957, -2.1040971279144287, -1.8865537643432617, -1.6690104007720947, -1.4514669179916382, -1.2339235544204712, -1.0163801908493042, -0.7988367080688477, -0.5812933444976807, -0.3637504577636719, -0.1462070643901825, 0.07133632898330688, 0.28887975215911865, 0.5064231157302856, 0.7239664793014526, 0.9415099620819092, 1.1590533256530762, 1.3765966892242432, 1.5941400527954102, 1.8116834163665771, 2.029226779937744, 2.2467703819274902, 2.464313507080078, 2.681857109069824, 2.899400472640991, 3.116943836212158, 3.334487199783325, 3.552030563354492, 3.7695741653442383, 3.987117290496826, 4.204660892486572, 4.42220401763916, 4.639747619628906, 4.857291221618652, 5.074834823608398, 5.292377948760986, 5.509921550750732, 5.72746467590332, 5.945008277893066, 6.1625518798828125, 6.3800950050354, 6.597638130187988]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 10.0, 14.0, 15.0, 21.0, 30.0, 49.0, 65.0, 89.0, 137.0, 223.0, 346.0, 476.0, 756.0, 1170.0, 1992.0, 3540.0, 6200.0, 11504.0, 23589.0, 48340.0, 102757.0, 200967.0, 269399.0, 189706.0, 95300.0, 44866.0, 21579.0, 11053.0, 5980.0, 3262.0, 1935.0, 1181.0, 700.0, 413.0, 250.0, 205.0, 111.0, 104.0, 67.0, 39.0, 34.0, 23.0, 17.0, 10.0, 10.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.59765625, -5.413818359375, -5.22998046875, -5.046142578125, -4.8623046875, -4.678466796875, -4.49462890625, -4.310791015625, -4.126953125, -3.943115234375, -3.75927734375, -3.575439453125, -3.3916015625, -3.207763671875, -3.02392578125, -2.840087890625, -2.65625, -2.472412109375, -2.28857421875, -2.104736328125, -1.9208984375, -1.737060546875, -1.55322265625, -1.369384765625, -1.185546875, -1.001708984375, -0.81787109375, -0.634033203125, -0.4501953125, -0.266357421875, -0.08251953125, 0.101318359375, 0.28515625, 0.468994140625, 0.65283203125, 0.836669921875, 1.0205078125, 1.204345703125, 1.38818359375, 1.572021484375, 1.755859375, 1.939697265625, 2.12353515625, 2.307373046875, 2.4912109375, 2.675048828125, 2.85888671875, 3.042724609375, 3.2265625, 3.410400390625, 3.59423828125, 3.778076171875, 3.9619140625, 4.145751953125, 4.32958984375, 4.513427734375, 4.697265625, 4.881103515625, 5.06494140625, 5.248779296875, 5.4326171875, 5.616455078125, 5.80029296875, 5.984130859375, 6.16796875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 7.0, 9.0, 9.0, 12.0, 13.0, 11.0, 17.0, 22.0, 22.0, 20.0, 15.0, 34.0, 24.0, 31.0, 34.0, 39.0, 34.0, 32.0, 31.0, 47.0, 29.0, 37.0, 33.0, 39.0, 40.0, 35.0, 50.0, 34.0, 25.0, 27.0, 24.0, 22.0, 25.0, 16.0, 11.0, 18.0, 11.0, 8.0, 7.0, 10.0, 4.0, 4.0, 6.0, 1.0, 6.0, 2.0, 3.0, 3.0, 3.0], "bins": [-8.046875, -7.8193359375, -7.591796875, -7.3642578125, -7.13671875, -6.9091796875, -6.681640625, -6.4541015625, -6.2265625, -5.9990234375, -5.771484375, -5.5439453125, -5.31640625, -5.0888671875, -4.861328125, -4.6337890625, -4.40625, -4.1787109375, -3.951171875, -3.7236328125, -3.49609375, -3.2685546875, -3.041015625, -2.8134765625, -2.5859375, -2.3583984375, -2.130859375, -1.9033203125, -1.67578125, -1.4482421875, -1.220703125, -0.9931640625, -0.765625, -0.5380859375, -0.310546875, -0.0830078125, 0.14453125, 0.3720703125, 0.599609375, 0.8271484375, 1.0546875, 1.2822265625, 1.509765625, 1.7373046875, 1.96484375, 2.1923828125, 2.419921875, 2.6474609375, 2.875, 3.1025390625, 3.330078125, 3.5576171875, 3.78515625, 4.0126953125, 4.240234375, 4.4677734375, 4.6953125, 4.9228515625, 5.150390625, 5.3779296875, 5.60546875, 5.8330078125, 6.060546875, 6.2880859375, 6.515625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 9.0, 4.0, 14.0, 16.0, 22.0, 23.0, 29.0, 56.0, 62.0, 94.0, 116.0, 176.0, 271.0, 437.0, 659.0, 1182.0, 2117.0, 4111.0, 8571.0, 19977.0, 53458.0, 162739.0, 391602.0, 261443.0, 86192.0, 30653.0, 12241.0, 5484.0, 2765.0, 1523.0, 905.0, 486.0, 348.0, 236.0, 146.0, 109.0, 72.0, 56.0, 41.0, 24.0, 24.0, 13.0, 12.0, 9.0, 11.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.7901611328125, -8.494384765625, -8.1986083984375, -7.90283203125, -7.6070556640625, -7.311279296875, -7.0155029296875, -6.7197265625, -6.4239501953125, -6.128173828125, -5.8323974609375, -5.53662109375, -5.2408447265625, -4.945068359375, -4.6492919921875, -4.353515625, -4.0577392578125, -3.761962890625, -3.4661865234375, -3.17041015625, -2.8746337890625, -2.578857421875, -2.2830810546875, -1.9873046875, -1.6915283203125, -1.395751953125, -1.0999755859375, -0.80419921875, -0.5084228515625, -0.212646484375, 0.0831298828125, 0.37890625, 0.6746826171875, 0.970458984375, 1.2662353515625, 1.56201171875, 1.8577880859375, 2.153564453125, 2.4493408203125, 2.7451171875, 3.0408935546875, 3.336669921875, 3.6324462890625, 3.92822265625, 4.2239990234375, 4.519775390625, 4.8155517578125, 5.111328125, 5.4071044921875, 5.702880859375, 5.9986572265625, 6.29443359375, 6.5902099609375, 6.885986328125, 7.1817626953125, 7.4775390625, 7.7733154296875, 8.069091796875, 8.3648681640625, 8.66064453125, 8.9564208984375, 9.252197265625, 9.5479736328125, 9.84375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 13.0, 13.0, 8.0, 16.0, 18.0, 15.0, 16.0, 30.0, 34.0, 31.0, 33.0, 35.0, 44.0, 46.0, 61.0, 34.0, 53.0, 38.0, 53.0, 46.0, 34.0, 36.0, 33.0, 33.0, 32.0, 27.0, 25.0, 19.0, 24.0, 22.0, 14.0, 9.0, 12.0, 8.0, 2.0, 7.0, 2.0, 4.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.32147216796875, -4.1663818359375, -4.01129150390625, -3.856201171875, -3.70111083984375, -3.5460205078125, -3.39093017578125, -3.23583984375, -3.08074951171875, -2.9256591796875, -2.77056884765625, -2.615478515625, -2.46038818359375, -2.3052978515625, -2.15020751953125, -1.9951171875, -1.84002685546875, -1.6849365234375, -1.52984619140625, -1.374755859375, -1.21966552734375, -1.0645751953125, -0.90948486328125, -0.75439453125, -0.59930419921875, -0.4442138671875, -0.28912353515625, -0.134033203125, 0.02105712890625, 0.1761474609375, 0.33123779296875, 0.486328125, 0.64141845703125, 0.7965087890625, 0.95159912109375, 1.106689453125, 1.26177978515625, 1.4168701171875, 1.57196044921875, 1.72705078125, 1.88214111328125, 2.0372314453125, 2.19232177734375, 2.347412109375, 2.50250244140625, 2.6575927734375, 2.81268310546875, 2.9677734375, 3.12286376953125, 3.2779541015625, 3.43304443359375, 3.588134765625, 3.74322509765625, 3.8983154296875, 4.05340576171875, 4.20849609375, 4.36358642578125, 4.5186767578125, 4.67376708984375, 4.828857421875, 4.98394775390625, 5.1390380859375, 5.29412841796875, 5.44921875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 16.0, 32.0, 39.0, 48.0, 80.0, 109.0, 210.0, 304.0, 469.0, 728.0, 1270.0, 2039.0, 3728.0, 6515.0, 12807.0, 26260.0, 58624.0, 141844.0, 299858.0, 273765.0, 121231.0, 50602.0, 22876.0, 11092.0, 5891.0, 3202.0, 1830.0, 1099.0, 721.0, 451.0, 286.0, 182.0, 124.0, 78.0, 37.0, 30.0, 22.0, 13.0, 6.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.126953125, -3.037384033203125, -2.94781494140625, -2.858245849609375, -2.7686767578125, -2.679107666015625, -2.58953857421875, -2.499969482421875, -2.410400390625, -2.320831298828125, -2.23126220703125, -2.141693115234375, -2.0521240234375, -1.962554931640625, -1.87298583984375, -1.783416748046875, -1.69384765625, -1.604278564453125, -1.51470947265625, -1.425140380859375, -1.3355712890625, -1.246002197265625, -1.15643310546875, -1.066864013671875, -0.977294921875, -0.887725830078125, -0.79815673828125, -0.708587646484375, -0.6190185546875, -0.529449462890625, -0.43988037109375, -0.350311279296875, -0.2607421875, -0.171173095703125, -0.08160400390625, 0.007965087890625, 0.0975341796875, 0.187103271484375, 0.27667236328125, 0.366241455078125, 0.455810546875, 0.545379638671875, 0.63494873046875, 0.724517822265625, 0.8140869140625, 0.903656005859375, 0.99322509765625, 1.082794189453125, 1.17236328125, 1.261932373046875, 1.35150146484375, 1.441070556640625, 1.5306396484375, 1.620208740234375, 1.70977783203125, 1.799346923828125, 1.888916015625, 1.978485107421875, 2.06805419921875, 2.157623291015625, 2.2471923828125, 2.336761474609375, 2.42633056640625, 2.515899658203125, 2.60546875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 0.0, 6.0, 4.0, 13.0, 7.0, 25.0, 38.0, 77.0, 92.0, 139.0, 143.0, 130.0, 112.0, 68.0, 40.0, 31.0, 12.0, 14.0, 15.0, 11.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002231597900390625, -0.0002144351601600647, -0.0002057105302810669, -0.0001969859004020691, -0.0001882612705230713, -0.00017953664064407349, -0.00017081201076507568, -0.00016208738088607788, -0.00015336275100708008, -0.00014463812112808228, -0.00013591349124908447, -0.00012718886137008667, -0.00011846423149108887, -0.00010973960161209106, -0.00010101497173309326, -9.229034185409546e-05, -8.356571197509766e-05, -7.484108209609985e-05, -6.611645221710205e-05, -5.739182233810425e-05, -4.8667192459106445e-05, -3.994256258010864e-05, -3.121793270111084e-05, -2.2493302822113037e-05, -1.3768672943115234e-05, -5.044043064117432e-06, 3.680586814880371e-06, 1.2405216693878174e-05, 2.1129846572875977e-05, 2.985447645187378e-05, 3.857910633087158e-05, 4.7303736209869385e-05, 5.602836608886719e-05, 6.475299596786499e-05, 7.347762584686279e-05, 8.22022557258606e-05, 9.09268856048584e-05, 9.96515154838562e-05, 0.000108376145362854, 0.0001171007752418518, 0.0001258254051208496, 0.0001345500349998474, 0.00014327466487884521, 0.00015199929475784302, 0.00016072392463684082, 0.00016944855451583862, 0.00017817318439483643, 0.00018689781427383423, 0.00019562244415283203, 0.00020434707403182983, 0.00021307170391082764, 0.00022179633378982544, 0.00023052096366882324, 0.00023924559354782104, 0.00024797022342681885, 0.00025669485330581665, 0.00026541948318481445, 0.00027414411306381226, 0.00028286874294281006, 0.00029159337282180786, 0.00030031800270080566, 0.00030904263257980347, 0.00031776726245880127, 0.00032649189233779907, 0.0003352165222167969]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 8.0, 8.0, 7.0, 16.0, 19.0, 21.0, 34.0, 49.0, 49.0, 93.0, 156.0, 203.0, 281.0, 405.0, 582.0, 868.0, 1271.0, 1982.0, 2995.0, 4643.0, 7778.0, 13684.0, 24056.0, 43770.0, 82959.0, 151859.0, 224579.0, 205959.0, 126473.0, 67746.0, 35906.0, 20039.0, 11276.0, 6732.0, 4094.0, 2728.0, 1700.0, 1113.0, 690.0, 513.0, 364.0, 250.0, 161.0, 142.0, 78.0, 58.0, 44.0, 41.0, 31.0, 12.0, 16.0, 5.0, 9.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.00848388671875, -1.9388427734375, -1.86920166015625, -1.799560546875, -1.72991943359375, -1.6602783203125, -1.59063720703125, -1.52099609375, -1.45135498046875, -1.3817138671875, -1.31207275390625, -1.242431640625, -1.17279052734375, -1.1031494140625, -1.03350830078125, -0.9638671875, -0.89422607421875, -0.8245849609375, -0.75494384765625, -0.685302734375, -0.61566162109375, -0.5460205078125, -0.47637939453125, -0.40673828125, -0.33709716796875, -0.2674560546875, -0.19781494140625, -0.128173828125, -0.05853271484375, 0.0111083984375, 0.08074951171875, 0.150390625, 0.22003173828125, 0.2896728515625, 0.35931396484375, 0.428955078125, 0.49859619140625, 0.5682373046875, 0.63787841796875, 0.70751953125, 0.77716064453125, 0.8468017578125, 0.91644287109375, 0.986083984375, 1.05572509765625, 1.1253662109375, 1.19500732421875, 1.2646484375, 1.33428955078125, 1.4039306640625, 1.47357177734375, 1.543212890625, 1.61285400390625, 1.6824951171875, 1.75213623046875, 1.82177734375, 1.89141845703125, 1.9610595703125, 2.03070068359375, 2.100341796875, 2.16998291015625, 2.2396240234375, 2.30926513671875, 2.37890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 10.0, 10.0, 13.0, 20.0, 14.0, 22.0, 18.0, 22.0, 34.0, 44.0, 56.0, 56.0, 73.0, 78.0, 78.0, 79.0, 79.0, 65.0, 44.0, 39.0, 34.0, 26.0, 21.0, 15.0, 9.0, 9.0, 6.0, 5.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.669921875, -0.6461105346679688, -0.6222991943359375, -0.5984878540039062, -0.574676513671875, -0.5508651733398438, -0.5270538330078125, -0.5032424926757812, -0.47943115234375, -0.45561981201171875, -0.4318084716796875, -0.40799713134765625, -0.384185791015625, -0.36037445068359375, -0.3365631103515625, -0.31275177001953125, -0.2889404296875, -0.26512908935546875, -0.2413177490234375, -0.21750640869140625, -0.193695068359375, -0.16988372802734375, -0.1460723876953125, -0.12226104736328125, -0.09844970703125, -0.07463836669921875, -0.0508270263671875, -0.02701568603515625, -0.003204345703125, 0.02060699462890625, 0.0444183349609375, 0.06822967529296875, 0.092041015625, 0.11585235595703125, 0.1396636962890625, 0.16347503662109375, 0.187286376953125, 0.21109771728515625, 0.2349090576171875, 0.25872039794921875, 0.28253173828125, 0.30634307861328125, 0.3301544189453125, 0.35396575927734375, 0.377777099609375, 0.40158843994140625, 0.4253997802734375, 0.44921112060546875, 0.4730224609375, 0.49683380126953125, 0.5206451416015625, 0.5444564819335938, 0.568267822265625, 0.5920791625976562, 0.6158905029296875, 0.6397018432617188, 0.66351318359375, 0.6873245239257812, 0.7111358642578125, 0.7349472045898438, 0.758758544921875, 0.7825698852539062, 0.8063812255859375, 0.8301925659179688, 0.85400390625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 5.0, 10.0, 6.0, 11.0, 14.0, 20.0, 29.0, 33.0, 40.0, 50.0, 64.0, 87.0, 82.0, 107.0, 88.0, 67.0, 64.0, 51.0, 43.0, 22.0, 20.0, 21.0, 10.0, 8.0, 8.0, 8.0, 12.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.04301643371582, -12.565839767456055, -12.088663101196289, -11.611486434936523, -11.134309768676758, -10.657133102416992, -10.179956436157227, -9.702778816223145, -9.225602149963379, -8.748425483703613, -8.271248817443848, -7.794072151184082, -7.316895008087158, -6.839718341827393, -6.362541675567627, -5.885364532470703, -5.408188343048096, -4.93101167678833, -4.4538350105285645, -3.9766581058502197, -3.499481201171875, -3.0223045349121094, -2.5451278686523438, -2.067950963973999, -1.5907742977142334, -1.1135975122451782, -0.6364207863807678, -0.15924406051635742, 0.31793272495269775, 0.7951095104217529, 1.2722861766815186, 1.7494630813598633, 2.226639747619629, 2.7038164138793945, 3.1809933185577393, 3.658169984817505, 4.13534688949585, 4.612523555755615, 5.089700222015381, 5.566877365112305, 6.04405403137207, 6.521230697631836, 6.998407363891602, 7.475584030151367, 7.952761173248291, 8.429937362670898, 8.907114028930664, 9.384291648864746, 9.861467361450195, 10.338644027709961, 10.815820693969727, 11.292997360229492, 11.770174026489258, 12.247350692749023, 12.724527359008789, 13.201704978942871, 13.678881645202637, 14.156058311462402, 14.633234977722168, 15.110411643981934, 15.5875883102417, 16.06476593017578, 16.541942596435547, 17.019119262695312, 17.496295928955078]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 10.0, 8.0, 8.0, 7.0, 17.0, 12.0, 15.0, 17.0, 19.0, 25.0, 19.0, 29.0, 37.0, 27.0, 26.0, 29.0, 45.0, 33.0, 44.0, 46.0, 33.0, 36.0, 44.0, 43.0, 43.0, 35.0, 23.0, 35.0, 28.0, 29.0, 31.0, 31.0, 25.0, 15.0, 14.0, 11.0, 5.0, 12.0, 5.0, 7.0, 3.0, 2.0, 8.0, 2.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.166965484619141, -6.947599411010742, -6.728233337402344, -6.508867263793945, -6.289501190185547, -6.070135116577148, -5.85076904296875, -5.631402969360352, -5.412036895751953, -5.192670822143555, -4.973304748535156, -4.753938674926758, -4.534572601318359, -4.315206527709961, -4.0958404541015625, -3.876474618911743, -3.657108783721924, -3.4377427101135254, -3.218376636505127, -2.9990105628967285, -2.77964448928833, -2.5602784156799316, -2.3409125804901123, -2.121546506881714, -1.9021804332733154, -1.682814359664917, -1.4634482860565186, -1.2440823316574097, -1.0247162580490112, -0.8053501844406128, -0.5859842300415039, -0.36661815643310547, -0.14725255966186523, 0.07211348414421082, 0.29147952795028687, 0.5108455419540405, 0.730211615562439, 0.9495776891708374, 1.1689436435699463, 1.3883097171783447, 1.6076757907867432, 1.8270418643951416, 2.04640793800354, 2.2657737731933594, 2.485139846801758, 2.7045059204101562, 2.9238719940185547, 3.143238067626953, 3.3626041412353516, 3.58197021484375, 3.8013362884521484, 4.020702362060547, 4.240068435668945, 4.459434509277344, 4.678800582885742, 4.898166656494141, 5.117532730102539, 5.3368988037109375, 5.556264877319336, 5.775630950927734, 5.994997024536133, 6.214363098144531, 6.43372917175293, 6.653095245361328, 6.872460842132568]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 13.0, 17.0, 22.0, 37.0, 52.0, 67.0, 130.0, 166.0, 302.0, 396.0, 604.0, 929.0, 1500.0, 2328.0, 3647.0, 5674.0, 9153.0, 14856.0, 24964.0, 42198.0, 70673.0, 112718.0, 158122.0, 177387.0, 152491.0, 105922.0, 65256.0, 38650.0, 22903.0, 13878.0, 8547.0, 5293.0, 3365.0, 2163.0, 1440.0, 937.0, 628.0, 399.0, 253.0, 156.0, 94.0, 70.0, 56.0, 31.0, 17.0, 16.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0], "bins": [-8.2109375, -7.972412109375, -7.73388671875, -7.495361328125, -7.2568359375, -7.018310546875, -6.77978515625, -6.541259765625, -6.302734375, -6.064208984375, -5.82568359375, -5.587158203125, -5.3486328125, -5.110107421875, -4.87158203125, -4.633056640625, -4.39453125, -4.156005859375, -3.91748046875, -3.678955078125, -3.4404296875, -3.201904296875, -2.96337890625, -2.724853515625, -2.486328125, -2.247802734375, -2.00927734375, -1.770751953125, -1.5322265625, -1.293701171875, -1.05517578125, -0.816650390625, -0.578125, -0.339599609375, -0.10107421875, 0.137451171875, 0.3759765625, 0.614501953125, 0.85302734375, 1.091552734375, 1.330078125, 1.568603515625, 1.80712890625, 2.045654296875, 2.2841796875, 2.522705078125, 2.76123046875, 2.999755859375, 3.23828125, 3.476806640625, 3.71533203125, 3.953857421875, 4.1923828125, 4.430908203125, 4.66943359375, 4.907958984375, 5.146484375, 5.385009765625, 5.62353515625, 5.862060546875, 6.1005859375, 6.339111328125, 6.57763671875, 6.816162109375, 7.0546875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 4.0, 9.0, 14.0, 10.0, 14.0, 16.0, 18.0, 19.0, 22.0, 24.0, 24.0, 31.0, 29.0, 35.0, 36.0, 36.0, 42.0, 43.0, 44.0, 43.0, 36.0, 37.0, 54.0, 38.0, 28.0, 27.0, 36.0, 35.0, 38.0, 23.0, 25.0, 21.0, 16.0, 11.0, 11.0, 7.0, 6.0, 7.0, 10.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.26513671875, -7.0263671875, -6.78759765625, -6.548828125, -6.31005859375, -6.0712890625, -5.83251953125, -5.59375, -5.35498046875, -5.1162109375, -4.87744140625, -4.638671875, -4.39990234375, -4.1611328125, -3.92236328125, -3.68359375, -3.44482421875, -3.2060546875, -2.96728515625, -2.728515625, -2.48974609375, -2.2509765625, -2.01220703125, -1.7734375, -1.53466796875, -1.2958984375, -1.05712890625, -0.818359375, -0.57958984375, -0.3408203125, -0.10205078125, 0.13671875, 0.37548828125, 0.6142578125, 0.85302734375, 1.091796875, 1.33056640625, 1.5693359375, 1.80810546875, 2.046875, 2.28564453125, 2.5244140625, 2.76318359375, 3.001953125, 3.24072265625, 3.4794921875, 3.71826171875, 3.95703125, 4.19580078125, 4.4345703125, 4.67333984375, 4.912109375, 5.15087890625, 5.3896484375, 5.62841796875, 5.8671875, 6.10595703125, 6.3447265625, 6.58349609375, 6.822265625, 7.06103515625, 7.2998046875, 7.53857421875, 7.77734375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 10.0, 7.0, 6.0, 12.0, 14.0, 22.0, 53.0, 68.0, 86.0, 122.0, 193.0, 313.0, 436.0, 640.0, 975.0, 1481.0, 2269.0, 3398.0, 5251.0, 7976.0, 12539.0, 19412.0, 30493.0, 46615.0, 69563.0, 98329.0, 127017.0, 141299.0, 134556.0, 109491.0, 79912.0, 54763.0, 35909.0, 22964.0, 14646.0, 9716.0, 6079.0, 4021.0, 2602.0, 1790.0, 1187.0, 755.0, 516.0, 368.0, 229.0, 145.0, 101.0, 70.0, 57.0, 37.0, 21.0, 15.0, 6.0, 10.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5, -5.31475830078125, -5.1295166015625, -4.94427490234375, -4.759033203125, -4.57379150390625, -4.3885498046875, -4.20330810546875, -4.01806640625, -3.83282470703125, -3.6475830078125, -3.46234130859375, -3.277099609375, -3.09185791015625, -2.9066162109375, -2.72137451171875, -2.5361328125, -2.35089111328125, -2.1656494140625, -1.98040771484375, -1.795166015625, -1.60992431640625, -1.4246826171875, -1.23944091796875, -1.05419921875, -0.86895751953125, -0.6837158203125, -0.49847412109375, -0.313232421875, -0.12799072265625, 0.0572509765625, 0.24249267578125, 0.427734375, 0.61297607421875, 0.7982177734375, 0.98345947265625, 1.168701171875, 1.35394287109375, 1.5391845703125, 1.72442626953125, 1.90966796875, 2.09490966796875, 2.2801513671875, 2.46539306640625, 2.650634765625, 2.83587646484375, 3.0211181640625, 3.20635986328125, 3.3916015625, 3.57684326171875, 3.7620849609375, 3.94732666015625, 4.132568359375, 4.31781005859375, 4.5030517578125, 4.68829345703125, 4.87353515625, 5.05877685546875, 5.2440185546875, 5.42926025390625, 5.614501953125, 5.79974365234375, 5.9849853515625, 6.17022705078125, 6.35546875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 9.0, 4.0, 5.0, 8.0, 10.0, 10.0, 10.0, 21.0, 21.0, 13.0, 15.0, 21.0, 27.0, 26.0, 35.0, 41.0, 30.0, 28.0, 39.0, 39.0, 46.0, 33.0, 33.0, 40.0, 46.0, 39.0, 30.0, 38.0, 31.0, 35.0, 33.0, 28.0, 27.0, 23.0, 27.0, 17.0, 9.0, 6.0, 7.0, 10.0, 3.0, 4.0, 7.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.48828125, -4.3525390625, -4.216796875, -4.0810546875, -3.9453125, -3.8095703125, -3.673828125, -3.5380859375, -3.40234375, -3.2666015625, -3.130859375, -2.9951171875, -2.859375, -2.7236328125, -2.587890625, -2.4521484375, -2.31640625, -2.1806640625, -2.044921875, -1.9091796875, -1.7734375, -1.6376953125, -1.501953125, -1.3662109375, -1.23046875, -1.0947265625, -0.958984375, -0.8232421875, -0.6875, -0.5517578125, -0.416015625, -0.2802734375, -0.14453125, -0.0087890625, 0.126953125, 0.2626953125, 0.3984375, 0.5341796875, 0.669921875, 0.8056640625, 0.94140625, 1.0771484375, 1.212890625, 1.3486328125, 1.484375, 1.6201171875, 1.755859375, 1.8916015625, 2.02734375, 2.1630859375, 2.298828125, 2.4345703125, 2.5703125, 2.7060546875, 2.841796875, 2.9775390625, 3.11328125, 3.2490234375, 3.384765625, 3.5205078125, 3.65625, 3.7919921875, 3.927734375, 4.0634765625, 4.19921875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 18.0, 24.0, 35.0, 50.0, 60.0, 88.0, 135.0, 192.0, 264.0, 414.0, 575.0, 921.0, 1285.0, 1954.0, 3071.0, 4746.0, 7884.0, 12971.0, 22389.0, 38754.0, 69762.0, 117746.0, 174639.0, 196186.0, 157243.0, 99712.0, 57185.0, 32347.0, 18451.0, 10903.0, 6559.0, 4105.0, 2598.0, 1710.0, 1099.0, 803.0, 534.0, 358.0, 237.0, 164.0, 114.0, 69.0, 53.0, 44.0, 36.0, 20.0, 15.0, 10.0, 2.0, 6.0, 3.0, 1.0, 3.0], "bins": [-4.74609375, -4.60784912109375, -4.4696044921875, -4.33135986328125, -4.193115234375, -4.05487060546875, -3.9166259765625, -3.77838134765625, -3.64013671875, -3.50189208984375, -3.3636474609375, -3.22540283203125, -3.087158203125, -2.94891357421875, -2.8106689453125, -2.67242431640625, -2.5341796875, -2.39593505859375, -2.2576904296875, -2.11944580078125, -1.981201171875, -1.84295654296875, -1.7047119140625, -1.56646728515625, -1.42822265625, -1.28997802734375, -1.1517333984375, -1.01348876953125, -0.875244140625, -0.73699951171875, -0.5987548828125, -0.46051025390625, -0.322265625, -0.18402099609375, -0.0457763671875, 0.09246826171875, 0.230712890625, 0.36895751953125, 0.5072021484375, 0.64544677734375, 0.78369140625, 0.92193603515625, 1.0601806640625, 1.19842529296875, 1.336669921875, 1.47491455078125, 1.6131591796875, 1.75140380859375, 1.8896484375, 2.02789306640625, 2.1661376953125, 2.30438232421875, 2.442626953125, 2.58087158203125, 2.7191162109375, 2.85736083984375, 2.99560546875, 3.13385009765625, 3.2720947265625, 3.41033935546875, 3.548583984375, 3.68682861328125, 3.8250732421875, 3.96331787109375, 4.1015625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 6.0, 9.0, 8.0, 10.0, 14.0, 23.0, 29.0, 37.0, 44.0, 54.0, 65.0, 101.0, 82.0, 93.0, 87.0, 64.0, 62.0, 36.0, 31.0, 32.0, 27.0, 23.0, 16.0, 9.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0006494522094726562, -0.0006327927112579346, -0.0006161332130432129, -0.0005994737148284912, -0.0005828142166137695, -0.0005661547183990479, -0.0005494952201843262, -0.0005328357219696045, -0.0005161762237548828, -0.0004995167255401611, -0.00048285722732543945, -0.0004661977291107178, -0.0004495382308959961, -0.0004328787326812744, -0.00041621923446655273, -0.00039955973625183105, -0.0003829002380371094, -0.0003662407398223877, -0.000349581241607666, -0.00033292174339294434, -0.00031626224517822266, -0.000299602746963501, -0.0002829432487487793, -0.0002662837505340576, -0.00024962425231933594, -0.00023296475410461426, -0.00021630525588989258, -0.0001996457576751709, -0.00018298625946044922, -0.00016632676124572754, -0.00014966726303100586, -0.00013300776481628418, -0.0001163482666015625, -9.968876838684082e-05, -8.302927017211914e-05, -6.636977195739746e-05, -4.971027374267578e-05, -3.30507755279541e-05, -1.6391277313232422e-05, 2.682209014892578e-07, 1.6927719116210938e-05, 3.358721733093262e-05, 5.02467155456543e-05, 6.690621376037598e-05, 8.356571197509766e-05, 0.00010022521018981934, 0.00011688470840454102, 0.0001335442066192627, 0.00015020370483398438, 0.00016686320304870605, 0.00018352270126342773, 0.00020018219947814941, 0.0002168416976928711, 0.00023350119590759277, 0.00025016069412231445, 0.00026682019233703613, 0.0002834796905517578, 0.0003001391887664795, 0.00031679868698120117, 0.00033345818519592285, 0.00035011768341064453, 0.0003667771816253662, 0.0003834366798400879, 0.00040009617805480957, 0.00041675567626953125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 7.0, 9.0, 17.0, 40.0, 43.0, 77.0, 101.0, 132.0, 220.0, 320.0, 465.0, 720.0, 1113.0, 1628.0, 2511.0, 3972.0, 6169.0, 10087.0, 16978.0, 28581.0, 50143.0, 85862.0, 139064.0, 187445.0, 183319.0, 132643.0, 81110.0, 46249.0, 27046.0, 16224.0, 9631.0, 5847.0, 3747.0, 2382.0, 1571.0, 1034.0, 691.0, 425.0, 295.0, 205.0, 120.0, 89.0, 66.0, 50.0, 32.0, 26.0, 17.0, 7.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.3125, -4.177490234375, -4.04248046875, -3.907470703125, -3.7724609375, -3.637451171875, -3.50244140625, -3.367431640625, -3.232421875, -3.097412109375, -2.96240234375, -2.827392578125, -2.6923828125, -2.557373046875, -2.42236328125, -2.287353515625, -2.15234375, -2.017333984375, -1.88232421875, -1.747314453125, -1.6123046875, -1.477294921875, -1.34228515625, -1.207275390625, -1.072265625, -0.937255859375, -0.80224609375, -0.667236328125, -0.5322265625, -0.397216796875, -0.26220703125, -0.127197265625, 0.0078125, 0.142822265625, 0.27783203125, 0.412841796875, 0.5478515625, 0.682861328125, 0.81787109375, 0.952880859375, 1.087890625, 1.222900390625, 1.35791015625, 1.492919921875, 1.6279296875, 1.762939453125, 1.89794921875, 2.032958984375, 2.16796875, 2.302978515625, 2.43798828125, 2.572998046875, 2.7080078125, 2.843017578125, 2.97802734375, 3.113037109375, 3.248046875, 3.383056640625, 3.51806640625, 3.653076171875, 3.7880859375, 3.923095703125, 4.05810546875, 4.193115234375, 4.328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 8.0, 1.0, 8.0, 8.0, 14.0, 11.0, 16.0, 16.0, 24.0, 23.0, 26.0, 40.0, 35.0, 36.0, 42.0, 53.0, 39.0, 45.0, 65.0, 48.0, 49.0, 62.0, 46.0, 39.0, 36.0, 29.0, 23.0, 30.0, 27.0, 19.0, 13.0, 17.0, 6.0, 12.0, 7.0, 9.0, 7.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.837890625, -0.8059234619140625, -0.773956298828125, -0.7419891357421875, -0.71002197265625, -0.6780548095703125, -0.646087646484375, -0.6141204833984375, -0.5821533203125, -0.5501861572265625, -0.518218994140625, -0.4862518310546875, -0.45428466796875, -0.4223175048828125, -0.390350341796875, -0.3583831787109375, -0.326416015625, -0.2944488525390625, -0.262481689453125, -0.2305145263671875, -0.19854736328125, -0.1665802001953125, -0.134613037109375, -0.1026458740234375, -0.0706787109375, -0.0387115478515625, -0.006744384765625, 0.0252227783203125, 0.05718994140625, 0.0891571044921875, 0.121124267578125, 0.1530914306640625, 0.18505859375, 0.2170257568359375, 0.248992919921875, 0.2809600830078125, 0.31292724609375, 0.3448944091796875, 0.376861572265625, 0.4088287353515625, 0.4407958984375, 0.4727630615234375, 0.504730224609375, 0.5366973876953125, 0.56866455078125, 0.6006317138671875, 0.632598876953125, 0.6645660400390625, 0.696533203125, 0.7285003662109375, 0.760467529296875, 0.7924346923828125, 0.82440185546875, 0.8563690185546875, 0.888336181640625, 0.9203033447265625, 0.9522705078125, 0.9842376708984375, 1.016204833984375, 1.0481719970703125, 1.08013916015625, 1.1121063232421875, 1.144073486328125, 1.1760406494140625, 1.2080078125]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 2.0, 7.0, 5.0, 5.0, 7.0, 12.0, 8.0, 20.0, 26.0, 27.0, 30.0, 47.0, 57.0, 75.0, 90.0, 97.0, 79.0, 80.0, 65.0, 62.0, 52.0, 21.0, 30.0, 15.0, 22.0, 11.0, 12.0, 9.0, 8.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.518157958984375, -12.053613662719727, -11.589069366455078, -11.124526023864746, -10.659981727600098, -10.19543743133545, -9.730894088745117, -9.266349792480469, -8.80180549621582, -8.337261199951172, -7.872717380523682, -7.408173561096191, -6.943629264831543, -6.4790849685668945, -6.014541149139404, -5.549997329711914, -5.085453033447266, -4.620908737182617, -4.156364917755127, -3.6918208599090576, -3.2272768020629883, -2.762732744216919, -2.2981886863708496, -1.8336446285247803, -1.369100570678711, -0.9045565128326416, -0.44001245498657227, 0.02453160285949707, 0.4890756607055664, 0.9536197185516357, 1.418163776397705, 1.8827078342437744, 2.3472518920898438, 2.811795949935913, 3.2763400077819824, 3.7408840656280518, 4.205428123474121, 4.6699724197387695, 5.13451623916626, 5.59906005859375, 6.063604354858398, 6.528148651123047, 6.992692470550537, 7.457236289978027, 7.921780586242676, 8.386324882507324, 8.850868225097656, 9.315412521362305, 9.779956817626953, 10.244501113891602, 10.70904541015625, 11.173588752746582, 11.63813304901123, 12.102677345275879, 12.567220687866211, 13.03176498413086, 13.496309280395508, 13.960853576660156, 14.425397872924805, 14.889941215515137, 15.354485511779785, 15.819029808044434, 16.283573150634766, 16.748117446899414, 17.212661743164062]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 6.0, 7.0, 13.0, 12.0, 11.0, 16.0, 12.0, 20.0, 16.0, 17.0, 14.0, 15.0, 26.0, 23.0, 34.0, 23.0, 32.0, 37.0, 31.0, 38.0, 30.0, 36.0, 28.0, 37.0, 33.0, 34.0, 41.0, 22.0, 40.0, 25.0, 18.0, 27.0, 26.0, 22.0, 20.0, 17.0, 15.0, 19.0, 14.0, 12.0, 12.0, 9.0, 11.0, 7.0, 4.0, 2.0, 6.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0], "bins": [-6.223653316497803, -6.032013893127441, -5.84037446975708, -5.648735046386719, -5.457096099853516, -5.265456676483154, -5.073817253112793, -4.882177829742432, -4.69053840637207, -4.498898983001709, -4.307259559631348, -4.1156206130981445, -3.923981189727783, -3.732341766357422, -3.5407023429870605, -3.349062919616699, -3.157423973083496, -2.9657845497131348, -2.7741453647613525, -2.582505941390991, -2.390866756439209, -2.1992273330688477, -2.0075879096984863, -1.8159486055374146, -1.6243093013763428, -1.432669997215271, -1.2410306930541992, -1.049391269683838, -0.8577519655227661, -0.6661126613616943, -0.474473237991333, -0.28283393383026123, -0.09119510650634766, 0.10044422745704651, 0.2920835614204407, 0.4837229251861572, 0.675362229347229, 0.8670015335083008, 1.058640956878662, 1.2502802610397339, 1.4419195652008057, 1.6335588693618774, 1.8251981735229492, 2.0168375968933105, 2.208477020263672, 2.400116205215454, 2.5917556285858154, 2.7833948135375977, 2.975034236907959, 3.1666736602783203, 3.3583128452301025, 3.549952268600464, 3.741591453552246, 3.9332308769226074, 4.124870300292969, 4.31650972366333, 4.508149147033691, 4.699788570404053, 4.891427993774414, 5.083066940307617, 5.2747063636779785, 5.46634578704834, 5.657985210418701, 5.8496246337890625, 6.041263580322266]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 12.0, 10.0, 30.0, 38.0, 66.0, 92.0, 125.0, 176.0, 282.0, 402.0, 679.0, 1031.0, 1716.0, 2699.0, 4745.0, 8258.0, 15533.0, 32158.0, 79999.0, 249575.0, 884544.0, 1681002.0, 854376.0, 233409.0, 75306.0, 31496.0, 15335.0, 8434.0, 4926.0, 2912.0, 1834.0, 1167.0, 703.0, 453.0, 277.0, 186.0, 103.0, 66.0, 43.0, 28.0, 16.0, 6.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.140625, -19.572998046875, -19.00537109375, -18.437744140625, -17.8701171875, -17.302490234375, -16.73486328125, -16.167236328125, -15.599609375, -15.031982421875, -14.46435546875, -13.896728515625, -13.3291015625, -12.761474609375, -12.19384765625, -11.626220703125, -11.05859375, -10.490966796875, -9.92333984375, -9.355712890625, -8.7880859375, -8.220458984375, -7.65283203125, -7.085205078125, -6.517578125, -5.949951171875, -5.38232421875, -4.814697265625, -4.2470703125, -3.679443359375, -3.11181640625, -2.544189453125, -1.9765625, -1.408935546875, -0.84130859375, -0.273681640625, 0.2939453125, 0.861572265625, 1.42919921875, 1.996826171875, 2.564453125, 3.132080078125, 3.69970703125, 4.267333984375, 4.8349609375, 5.402587890625, 5.97021484375, 6.537841796875, 7.10546875, 7.673095703125, 8.24072265625, 8.808349609375, 9.3759765625, 9.943603515625, 10.51123046875, 11.078857421875, 11.646484375, 12.214111328125, 12.78173828125, 13.349365234375, 13.9169921875, 14.484619140625, 15.05224609375, 15.619873046875, 16.1875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 4.0, 4.0, 6.0, 5.0, 14.0, 8.0, 11.0, 11.0, 19.0, 19.0, 16.0, 20.0, 21.0, 22.0, 31.0, 30.0, 37.0, 35.0, 28.0, 42.0, 33.0, 38.0, 37.0, 44.0, 43.0, 38.0, 38.0, 38.0, 37.0, 20.0, 33.0, 25.0, 25.0, 12.0, 27.0, 20.0, 15.0, 13.0, 8.0, 11.0, 11.0, 11.0, 4.0, 11.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.7578125, -5.5872802734375, -5.416748046875, -5.2462158203125, -5.07568359375, -4.9051513671875, -4.734619140625, -4.5640869140625, -4.3935546875, -4.2230224609375, -4.052490234375, -3.8819580078125, -3.71142578125, -3.5408935546875, -3.370361328125, -3.1998291015625, -3.029296875, -2.8587646484375, -2.688232421875, -2.5177001953125, -2.34716796875, -2.1766357421875, -2.006103515625, -1.8355712890625, -1.6650390625, -1.4945068359375, -1.323974609375, -1.1534423828125, -0.98291015625, -0.8123779296875, -0.641845703125, -0.4713134765625, -0.30078125, -0.1302490234375, 0.040283203125, 0.2108154296875, 0.38134765625, 0.5518798828125, 0.722412109375, 0.8929443359375, 1.0634765625, 1.2340087890625, 1.404541015625, 1.5750732421875, 1.74560546875, 1.9161376953125, 2.086669921875, 2.2572021484375, 2.427734375, 2.5982666015625, 2.768798828125, 2.9393310546875, 3.10986328125, 3.2803955078125, 3.450927734375, 3.6214599609375, 3.7919921875, 3.9625244140625, 4.133056640625, 4.3035888671875, 4.47412109375, 4.6446533203125, 4.815185546875, 4.9857177734375, 5.15625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 11.0, 12.0, 16.0, 20.0, 27.0, 42.0, 54.0, 91.0, 142.0, 197.0, 296.0, 503.0, 748.0, 1164.0, 1820.0, 3046.0, 5046.0, 8678.0, 15543.0, 30315.0, 63791.0, 150907.0, 408227.0, 1041186.0, 1349849.0, 675755.0, 246873.0, 96245.0, 43402.0, 21573.0, 11624.0, 6639.0, 3960.0, 2321.0, 1535.0, 891.0, 585.0, 395.0, 250.0, 175.0, 102.0, 77.0, 59.0, 28.0, 21.0, 11.0, 11.0, 11.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.533447265625, -16.00439453125, -15.475341796875, -14.9462890625, -14.417236328125, -13.88818359375, -13.359130859375, -12.830078125, -12.301025390625, -11.77197265625, -11.242919921875, -10.7138671875, -10.184814453125, -9.65576171875, -9.126708984375, -8.59765625, -8.068603515625, -7.53955078125, -7.010498046875, -6.4814453125, -5.952392578125, -5.42333984375, -4.894287109375, -4.365234375, -3.836181640625, -3.30712890625, -2.778076171875, -2.2490234375, -1.719970703125, -1.19091796875, -0.661865234375, -0.1328125, 0.396240234375, 0.92529296875, 1.454345703125, 1.9833984375, 2.512451171875, 3.04150390625, 3.570556640625, 4.099609375, 4.628662109375, 5.15771484375, 5.686767578125, 6.2158203125, 6.744873046875, 7.27392578125, 7.802978515625, 8.33203125, 8.861083984375, 9.39013671875, 9.919189453125, 10.4482421875, 10.977294921875, 11.50634765625, 12.035400390625, 12.564453125, 13.093505859375, 13.62255859375, 14.151611328125, 14.6806640625, 15.209716796875, 15.73876953125, 16.267822265625, 16.796875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 22.0, 19.0, 25.0, 37.0, 43.0, 74.0, 94.0, 119.0, 149.0, 218.0, 241.0, 324.0, 328.0, 364.0, 386.0, 341.0, 321.0, 233.0, 186.0, 131.0, 105.0, 65.0, 64.0, 50.0, 30.0, 27.0, 16.0, 9.0, 7.0, 12.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.29400634765625, -5.1387939453125, -4.98358154296875, -4.828369140625, -4.67315673828125, -4.5179443359375, -4.36273193359375, -4.20751953125, -4.05230712890625, -3.8970947265625, -3.74188232421875, -3.586669921875, -3.43145751953125, -3.2762451171875, -3.12103271484375, -2.9658203125, -2.81060791015625, -2.6553955078125, -2.50018310546875, -2.344970703125, -2.18975830078125, -2.0345458984375, -1.87933349609375, -1.72412109375, -1.56890869140625, -1.4136962890625, -1.25848388671875, -1.103271484375, -0.94805908203125, -0.7928466796875, -0.63763427734375, -0.482421875, -0.32720947265625, -0.1719970703125, -0.01678466796875, 0.138427734375, 0.29364013671875, 0.4488525390625, 0.60406494140625, 0.75927734375, 0.91448974609375, 1.0697021484375, 1.22491455078125, 1.380126953125, 1.53533935546875, 1.6905517578125, 1.84576416015625, 2.0009765625, 2.15618896484375, 2.3114013671875, 2.46661376953125, 2.621826171875, 2.77703857421875, 2.9322509765625, 3.08746337890625, 3.24267578125, 3.39788818359375, 3.5531005859375, 3.70831298828125, 3.863525390625, 4.01873779296875, 4.1739501953125, 4.32916259765625, 4.484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 12.0, 13.0, 15.0, 18.0, 28.0, 27.0, 51.0, 56.0, 58.0, 94.0, 101.0, 100.0, 78.0, 76.0, 75.0, 41.0, 38.0, 27.0, 17.0, 17.0, 12.0, 6.0, 9.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.99970817565918, -13.444025039672852, -12.888341903686523, -12.332657814025879, -11.77697467803955, -11.221291542053223, -10.665607452392578, -10.10992431640625, -9.554241180419922, -8.998558044433594, -8.442874908447266, -7.887190818786621, -7.331507682800293, -6.775824546813965, -6.2201409339904785, -5.664457321166992, -5.108774185180664, -4.553091049194336, -3.9974074363708496, -3.4417240619659424, -2.886040687561035, -2.330357313156128, -1.7746739387512207, -1.2189905643463135, -0.6633071899414062, -0.10762381553649902, 0.4480595588684082, 1.0037429332733154, 1.5594263076782227, 2.11510968208313, 2.670793056488037, 3.2264764308929443, 3.7821617126464844, 4.3378448486328125, 4.893528461456299, 5.449212074279785, 6.004895210266113, 6.560578346252441, 7.116261959075928, 7.671945571899414, 8.227628707885742, 8.78331184387207, 9.338994979858398, 9.894679069519043, 10.450362205505371, 11.0060453414917, 11.561729431152344, 12.117412567138672, 12.673095703125, 13.228778839111328, 13.784461975097656, 14.3401460647583, 14.895829200744629, 15.451512336730957, 16.0071964263916, 16.56287956237793, 17.118562698364258, 17.674245834350586, 18.229928970336914, 18.785612106323242, 19.341297149658203, 19.89698028564453, 20.45266342163086, 21.008346557617188, 21.564029693603516]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 7.0, 8.0, 6.0, 1.0, 10.0, 10.0, 21.0, 14.0, 22.0, 26.0, 20.0, 15.0, 22.0, 18.0, 27.0, 43.0, 35.0, 35.0, 30.0, 40.0, 46.0, 39.0, 37.0, 33.0, 27.0, 28.0, 30.0, 30.0, 22.0, 37.0, 26.0, 37.0, 28.0, 26.0, 26.0, 24.0, 14.0, 17.0, 11.0, 11.0, 10.0, 10.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.00267219543457, -6.778745174407959, -6.5548176765441895, -6.330890655517578, -6.106963157653809, -5.883036136627197, -5.659109115600586, -5.435181617736816, -5.211254596710205, -4.987327575683594, -4.763400077819824, -4.539473056793213, -4.315546035766602, -4.091618537902832, -3.8676915168762207, -3.6437642574310303, -3.41983699798584, -3.1959097385406494, -2.971982479095459, -2.7480554580688477, -2.5241281986236572, -2.300200939178467, -2.0762739181518555, -1.852346658706665, -1.6284193992614746, -1.4044921398162842, -1.1805649995803833, -0.9566377997398376, -0.732710599899292, -0.5087833404541016, -0.2848562002182007, -0.060929059982299805, 0.16299772262573242, 0.3869249224662781, 0.6108521223068237, 0.8347793221473694, 1.058706521987915, 1.2826337814331055, 1.5065609216690063, 1.7304880619049072, 1.9544153213500977, 2.178342580795288, 2.4022698402404785, 2.62619686126709, 2.8501241207122803, 3.0740513801574707, 3.297978401184082, 3.5219056606292725, 3.745832920074463, 3.9697601795196533, 4.193687438964844, 4.417614459991455, 4.641541481018066, 4.865468978881836, 5.089395999908447, 5.313323020935059, 5.537250518798828, 5.7611775398254395, 5.985105037689209, 6.20903205871582, 6.43295955657959, 6.656886577606201, 6.8808135986328125, 7.104741096496582, 7.328668117523193]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 13.0, 24.0, 27.0, 40.0, 50.0, 94.0, 134.0, 211.0, 304.0, 483.0, 633.0, 1085.0, 1528.0, 2461.0, 3856.0, 6266.0, 10090.0, 16443.0, 27064.0, 44481.0, 71741.0, 110563.0, 152164.0, 171005.0, 146896.0, 104760.0, 67893.0, 41705.0, 25459.0, 15387.0, 9314.0, 5934.0, 3640.0, 2379.0, 1528.0, 1002.0, 617.0, 432.0, 257.0, 196.0, 118.0, 98.0, 66.0, 36.0, 24.0, 18.0, 12.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.533203125, -3.420806884765625, -3.30841064453125, -3.196014404296875, -3.0836181640625, -2.971221923828125, -2.85882568359375, -2.746429443359375, -2.634033203125, -2.521636962890625, -2.40924072265625, -2.296844482421875, -2.1844482421875, -2.072052001953125, -1.95965576171875, -1.847259521484375, -1.73486328125, -1.622467041015625, -1.51007080078125, -1.397674560546875, -1.2852783203125, -1.172882080078125, -1.06048583984375, -0.948089599609375, -0.835693359375, -0.723297119140625, -0.61090087890625, -0.498504638671875, -0.3861083984375, -0.273712158203125, -0.16131591796875, -0.048919677734375, 0.0634765625, 0.175872802734375, 0.28826904296875, 0.400665283203125, 0.5130615234375, 0.625457763671875, 0.73785400390625, 0.850250244140625, 0.962646484375, 1.075042724609375, 1.18743896484375, 1.299835205078125, 1.4122314453125, 1.524627685546875, 1.63702392578125, 1.749420166015625, 1.86181640625, 1.974212646484375, 2.08660888671875, 2.199005126953125, 2.3114013671875, 2.423797607421875, 2.53619384765625, 2.648590087890625, 2.760986328125, 2.873382568359375, 2.98577880859375, 3.098175048828125, 3.2105712890625, 3.322967529296875, 3.43536376953125, 3.547760009765625, 3.66015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 7.0, 11.0, 10.0, 16.0, 15.0, 19.0, 16.0, 20.0, 17.0, 32.0, 24.0, 22.0, 35.0, 30.0, 48.0, 31.0, 33.0, 43.0, 39.0, 39.0, 28.0, 39.0, 34.0, 33.0, 32.0, 30.0, 29.0, 34.0, 24.0, 33.0, 28.0, 30.0, 25.0, 10.0, 14.0, 10.0, 8.0, 12.0, 6.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.7421875, -7.4892578125, -7.236328125, -6.9833984375, -6.73046875, -6.4775390625, -6.224609375, -5.9716796875, -5.71875, -5.4658203125, -5.212890625, -4.9599609375, -4.70703125, -4.4541015625, -4.201171875, -3.9482421875, -3.6953125, -3.4423828125, -3.189453125, -2.9365234375, -2.68359375, -2.4306640625, -2.177734375, -1.9248046875, -1.671875, -1.4189453125, -1.166015625, -0.9130859375, -0.66015625, -0.4072265625, -0.154296875, 0.0986328125, 0.3515625, 0.6044921875, 0.857421875, 1.1103515625, 1.36328125, 1.6162109375, 1.869140625, 2.1220703125, 2.375, 2.6279296875, 2.880859375, 3.1337890625, 3.38671875, 3.6396484375, 3.892578125, 4.1455078125, 4.3984375, 4.6513671875, 4.904296875, 5.1572265625, 5.41015625, 5.6630859375, 5.916015625, 6.1689453125, 6.421875, 6.6748046875, 6.927734375, 7.1806640625, 7.43359375, 7.6865234375, 7.939453125, 8.1923828125, 8.4453125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 8.0, 3.0, 6.0, 15.0, 18.0, 27.0, 36.0, 37.0, 71.0, 115.0, 118.0, 205.0, 309.0, 459.0, 675.0, 1057.0, 1515.0, 2489.0, 4063.0, 6585.0, 11127.0, 19161.0, 33962.0, 60920.0, 108180.0, 176007.0, 216019.0, 168164.0, 101960.0, 57368.0, 31846.0, 18369.0, 10617.0, 6351.0, 3836.0, 2304.0, 1554.0, 1009.0, 665.0, 470.0, 248.0, 197.0, 112.0, 84.0, 63.0, 46.0, 30.0, 21.0, 27.0, 9.0, 7.0, 8.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.2237548828125, -4.080322265625, -3.9368896484375, -3.79345703125, -3.6500244140625, -3.506591796875, -3.3631591796875, -3.2197265625, -3.0762939453125, -2.932861328125, -2.7894287109375, -2.64599609375, -2.5025634765625, -2.359130859375, -2.2156982421875, -2.072265625, -1.9288330078125, -1.785400390625, -1.6419677734375, -1.49853515625, -1.3551025390625, -1.211669921875, -1.0682373046875, -0.9248046875, -0.7813720703125, -0.637939453125, -0.4945068359375, -0.35107421875, -0.2076416015625, -0.064208984375, 0.0792236328125, 0.22265625, 0.3660888671875, 0.509521484375, 0.6529541015625, 0.79638671875, 0.9398193359375, 1.083251953125, 1.2266845703125, 1.3701171875, 1.5135498046875, 1.656982421875, 1.8004150390625, 1.94384765625, 2.0872802734375, 2.230712890625, 2.3741455078125, 2.517578125, 2.6610107421875, 2.804443359375, 2.9478759765625, 3.09130859375, 3.2347412109375, 3.378173828125, 3.5216064453125, 3.6650390625, 3.8084716796875, 3.951904296875, 4.0953369140625, 4.23876953125, 4.3822021484375, 4.525634765625, 4.6690673828125, 4.8125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 10.0, 11.0, 14.0, 6.0, 26.0, 22.0, 22.0, 23.0, 26.0, 29.0, 41.0, 36.0, 32.0, 31.0, 39.0, 27.0, 30.0, 49.0, 39.0, 49.0, 37.0, 34.0, 31.0, 35.0, 41.0, 24.0, 41.0, 24.0, 32.0, 24.0, 25.0, 20.0, 17.0, 12.0, 8.0, 9.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.9429931640625, -4.784423828125, -4.6258544921875, -4.46728515625, -4.3087158203125, -4.150146484375, -3.9915771484375, -3.8330078125, -3.6744384765625, -3.515869140625, -3.3572998046875, -3.19873046875, -3.0401611328125, -2.881591796875, -2.7230224609375, -2.564453125, -2.4058837890625, -2.247314453125, -2.0887451171875, -1.93017578125, -1.7716064453125, -1.613037109375, -1.4544677734375, -1.2958984375, -1.1373291015625, -0.978759765625, -0.8201904296875, -0.66162109375, -0.5030517578125, -0.344482421875, -0.1859130859375, -0.02734375, 0.1312255859375, 0.289794921875, 0.4483642578125, 0.60693359375, 0.7655029296875, 0.924072265625, 1.0826416015625, 1.2412109375, 1.3997802734375, 1.558349609375, 1.7169189453125, 1.87548828125, 2.0340576171875, 2.192626953125, 2.3511962890625, 2.509765625, 2.6683349609375, 2.826904296875, 2.9854736328125, 3.14404296875, 3.3026123046875, 3.461181640625, 3.6197509765625, 3.7783203125, 3.9368896484375, 4.095458984375, 4.2540283203125, 4.41259765625, 4.5711669921875, 4.729736328125, 4.8883056640625, 5.046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 15.0, 10.0, 16.0, 12.0, 44.0, 51.0, 97.0, 121.0, 181.0, 330.0, 490.0, 717.0, 1167.0, 1932.0, 3115.0, 5172.0, 8824.0, 15503.0, 28344.0, 53572.0, 106871.0, 204494.0, 265835.0, 168488.0, 85204.0, 42861.0, 23222.0, 12854.0, 7463.0, 4267.0, 2693.0, 1649.0, 1067.0, 687.0, 414.0, 283.0, 155.0, 115.0, 66.0, 48.0, 35.0, 18.0, 17.0, 12.0, 10.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.625, -2.548553466796875, -2.47210693359375, -2.395660400390625, -2.3192138671875, -2.242767333984375, -2.16632080078125, -2.089874267578125, -2.013427734375, -1.936981201171875, -1.86053466796875, -1.784088134765625, -1.7076416015625, -1.631195068359375, -1.55474853515625, -1.478302001953125, -1.40185546875, -1.325408935546875, -1.24896240234375, -1.172515869140625, -1.0960693359375, -1.019622802734375, -0.94317626953125, -0.866729736328125, -0.790283203125, -0.713836669921875, -0.63739013671875, -0.560943603515625, -0.4844970703125, -0.408050537109375, -0.33160400390625, -0.255157470703125, -0.1787109375, -0.102264404296875, -0.02581787109375, 0.050628662109375, 0.1270751953125, 0.203521728515625, 0.27996826171875, 0.356414794921875, 0.432861328125, 0.509307861328125, 0.58575439453125, 0.662200927734375, 0.7386474609375, 0.815093994140625, 0.89154052734375, 0.967987060546875, 1.04443359375, 1.120880126953125, 1.19732666015625, 1.273773193359375, 1.3502197265625, 1.426666259765625, 1.50311279296875, 1.579559326171875, 1.656005859375, 1.732452392578125, 1.80889892578125, 1.885345458984375, 1.9617919921875, 2.038238525390625, 2.11468505859375, 2.191131591796875, 2.267578125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 2.0, 10.0, 17.0, 24.0, 25.0, 27.0, 52.0, 69.0, 77.0, 108.0, 95.0, 89.0, 113.0, 91.0, 53.0, 39.0, 29.0, 26.0, 14.0, 8.0, 11.0, 8.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002205371856689453, -0.00021470710635185242, -0.00020887702703475952, -0.00020304694771766663, -0.00019721686840057373, -0.00019138678908348083, -0.00018555670976638794, -0.00017972663044929504, -0.00017389655113220215, -0.00016806647181510925, -0.00016223639249801636, -0.00015640631318092346, -0.00015057623386383057, -0.00014474615454673767, -0.00013891607522964478, -0.00013308599591255188, -0.00012725591659545898, -0.00012142583727836609, -0.0001155957579612732, -0.0001097656786441803, -0.0001039355993270874, -9.810552000999451e-05, -9.227544069290161e-05, -8.644536137580872e-05, -8.061528205871582e-05, -7.478520274162292e-05, -6.895512342453003e-05, -6.312504410743713e-05, -5.729496479034424e-05, -5.146488547325134e-05, -4.563480615615845e-05, -3.980472683906555e-05, -3.3974647521972656e-05, -2.814456820487976e-05, -2.2314488887786865e-05, -1.648440957069397e-05, -1.0654330253601074e-05, -4.824250936508179e-06, 1.0058283805847168e-06, 6.835907697677612e-06, 1.2665987014770508e-05, 1.8496066331863403e-05, 2.43261456489563e-05, 3.0156224966049194e-05, 3.598630428314209e-05, 4.1816383600234985e-05, 4.764646291732788e-05, 5.3476542234420776e-05, 5.930662155151367e-05, 6.513670086860657e-05, 7.096678018569946e-05, 7.679685950279236e-05, 8.262693881988525e-05, 8.845701813697815e-05, 9.428709745407104e-05, 0.00010011717677116394, 0.00010594725608825684, 0.00011177733540534973, 0.00011760741472244263, 0.00012343749403953552, 0.00012926757335662842, 0.0001350976526737213, 0.0001409277319908142, 0.0001467578113079071, 0.000152587890625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 11.0, 15.0, 17.0, 39.0, 42.0, 67.0, 96.0, 160.0, 241.0, 342.0, 526.0, 782.0, 1306.0, 2039.0, 3511.0, 6081.0, 10868.0, 20102.0, 37840.0, 72028.0, 133232.0, 209218.0, 222573.0, 149670.0, 82328.0, 43155.0, 22720.0, 12326.0, 7015.0, 3846.0, 2350.0, 1448.0, 888.0, 556.0, 373.0, 222.0, 167.0, 112.0, 80.0, 39.0, 37.0, 18.0, 12.0, 16.0, 6.0, 12.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.51171875, -2.43096923828125, -2.3502197265625, -2.26947021484375, -2.188720703125, -2.10797119140625, -2.0272216796875, -1.94647216796875, -1.86572265625, -1.78497314453125, -1.7042236328125, -1.62347412109375, -1.542724609375, -1.46197509765625, -1.3812255859375, -1.30047607421875, -1.2197265625, -1.13897705078125, -1.0582275390625, -0.97747802734375, -0.896728515625, -0.81597900390625, -0.7352294921875, -0.65447998046875, -0.57373046875, -0.49298095703125, -0.4122314453125, -0.33148193359375, -0.250732421875, -0.16998291015625, -0.0892333984375, -0.00848388671875, 0.072265625, 0.15301513671875, 0.2337646484375, 0.31451416015625, 0.395263671875, 0.47601318359375, 0.5567626953125, 0.63751220703125, 0.71826171875, 0.79901123046875, 0.8797607421875, 0.96051025390625, 1.041259765625, 1.12200927734375, 1.2027587890625, 1.28350830078125, 1.3642578125, 1.44500732421875, 1.5257568359375, 1.60650634765625, 1.687255859375, 1.76800537109375, 1.8487548828125, 1.92950439453125, 2.01025390625, 2.09100341796875, 2.1717529296875, 2.25250244140625, 2.333251953125, 2.41400146484375, 2.4947509765625, 2.57550048828125, 2.65625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 9.0, 3.0, 5.0, 10.0, 15.0, 4.0, 13.0, 21.0, 13.0, 19.0, 17.0, 28.0, 30.0, 24.0, 38.0, 43.0, 49.0, 48.0, 47.0, 53.0, 43.0, 36.0, 44.0, 44.0, 31.0, 36.0, 30.0, 38.0, 23.0, 30.0, 13.0, 23.0, 21.0, 12.0, 16.0, 13.0, 6.0, 8.0, 11.0, 4.0, 5.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5947265625, -0.5768814086914062, -0.5590362548828125, -0.5411911010742188, -0.523345947265625, -0.5055007934570312, -0.4876556396484375, -0.46981048583984375, -0.45196533203125, -0.43412017822265625, -0.4162750244140625, -0.39842987060546875, -0.380584716796875, -0.36273956298828125, -0.3448944091796875, -0.32704925537109375, -0.3092041015625, -0.29135894775390625, -0.2735137939453125, -0.25566864013671875, -0.237823486328125, -0.21997833251953125, -0.2021331787109375, -0.18428802490234375, -0.16644287109375, -0.14859771728515625, -0.1307525634765625, -0.11290740966796875, -0.095062255859375, -0.07721710205078125, -0.0593719482421875, -0.04152679443359375, -0.023681640625, -0.00583648681640625, 0.0120086669921875, 0.02985382080078125, 0.047698974609375, 0.06554412841796875, 0.0833892822265625, 0.10123443603515625, 0.11907958984375, 0.13692474365234375, 0.1547698974609375, 0.17261505126953125, 0.190460205078125, 0.20830535888671875, 0.2261505126953125, 0.24399566650390625, 0.2618408203125, 0.27968597412109375, 0.2975311279296875, 0.31537628173828125, 0.333221435546875, 0.35106658935546875, 0.3689117431640625, 0.38675689697265625, 0.40460205078125, 0.42244720458984375, 0.4402923583984375, 0.45813751220703125, 0.475982666015625, 0.49382781982421875, 0.5116729736328125, 0.5295181274414062, 0.54736328125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 10.0, 19.0, 18.0, 20.0, 34.0, 49.0, 59.0, 56.0, 118.0, 93.0, 94.0, 80.0, 76.0, 73.0, 38.0, 37.0, 29.0, 21.0, 10.0, 10.0, 10.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.265263557434082, -13.69668197631836, -13.128101348876953, -12.55951976776123, -11.990938186645508, -11.422357559204102, -10.853775978088379, -10.285194396972656, -9.71661376953125, -9.148032188415527, -8.579451560974121, -8.010869979858398, -7.442288398742676, -6.873707294464111, -6.305126190185547, -5.736544609069824, -5.167963027954102, -4.599381923675537, -4.0308003425598145, -3.46221923828125, -2.8936378955841064, -2.325056552886963, -1.7564754486083984, -1.1878941059112549, -0.6193127632141113, -0.05073148012161255, 0.5178498029708862, 1.0864310264587402, 1.6550123691558838, 2.2235937118530273, 2.792174816131592, 3.3607561588287354, 3.9293365478515625, 4.497917652130127, 5.06649923324585, 5.635080337524414, 6.203661918640137, 6.772243022918701, 7.340824127197266, 7.909405708312988, 8.477987289428711, 9.046568870544434, 9.61514949798584, 10.183731079101562, 10.752312660217285, 11.320894241333008, 11.889474868774414, 12.458056449890137, 13.026637077331543, 13.595218658447266, 14.163799285888672, 14.732380867004395, 15.300962448120117, 15.869543075561523, 16.438125610351562, 17.00670623779297, 17.575286865234375, 18.14386749267578, 18.71245002746582, 19.281030654907227, 19.849611282348633, 20.418193817138672, 20.986774444580078, 21.555355072021484, 22.123937606811523]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 3.0, 4.0, 14.0, 10.0, 22.0, 18.0, 19.0, 24.0, 18.0, 16.0, 23.0, 23.0, 36.0, 39.0, 30.0, 29.0, 42.0, 39.0, 39.0, 43.0, 35.0, 27.0, 31.0, 31.0, 31.0, 22.0, 33.0, 31.0, 26.0, 35.0, 23.0, 31.0, 29.0, 17.0, 13.0, 15.0, 12.0, 6.0, 9.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.914292335510254, -6.692164421081543, -6.47003698348999, -6.247909069061279, -6.025781154632568, -5.803653717041016, -5.581525802612305, -5.359397888183594, -5.137270450592041, -4.91514253616333, -4.693015098571777, -4.470887184143066, -4.2487592697143555, -4.026631832122803, -3.804503917694092, -3.58237624168396, -3.360248327255249, -3.138120651245117, -2.9159927368164062, -2.6938650608062744, -2.4717373847961426, -2.2496094703674316, -2.0274817943573, -1.805354118347168, -1.5832263231277466, -1.3610985279083252, -1.1389708518981934, -0.916843056678772, -0.6947153210639954, -0.47258758544921875, -0.25045979022979736, -0.028332114219665527, 0.19379568099975586, 0.41592341661453247, 0.6380511522293091, 0.8601789474487305, 1.0823066234588623, 1.3044344186782837, 1.526562213897705, 1.748689889907837, 1.9708176851272583, 2.1929454803466797, 2.4150731563568115, 2.6372008323669434, 2.8593287467956543, 3.081456422805786, 3.303584098815918, 3.525712013244629, 3.7478396892547607, 3.9699673652648926, 4.1920952796936035, 4.414222717285156, 4.636350631713867, 4.858478546142578, 5.080606460571289, 5.302733898162842, 5.524861812591553, 5.746989727020264, 5.969117164611816, 6.191245079040527, 6.413372993469238, 6.635500431060791, 6.857628345489502, 7.079755783081055, 7.301883697509766]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 7.0, 4.0, 11.0, 24.0, 39.0, 48.0, 83.0, 121.0, 172.0, 263.0, 397.0, 618.0, 900.0, 1406.0, 2162.0, 3369.0, 5262.0, 7985.0, 12610.0, 19956.0, 31070.0, 47728.0, 71502.0, 101396.0, 130316.0, 144954.0, 135323.0, 107886.0, 77142.0, 51766.0, 33956.0, 21673.0, 13725.0, 8723.0, 5544.0, 3664.0, 2368.0, 1492.0, 1012.0, 654.0, 453.0, 267.0, 155.0, 115.0, 68.0, 61.0, 36.0, 32.0, 12.0, 13.0, 9.0, 3.0, 2.0, 5.0, 3.0], "bins": [-7.0546875, -6.85076904296875, -6.6468505859375, -6.44293212890625, -6.239013671875, -6.03509521484375, -5.8311767578125, -5.62725830078125, -5.42333984375, -5.21942138671875, -5.0155029296875, -4.81158447265625, -4.607666015625, -4.40374755859375, -4.1998291015625, -3.99591064453125, -3.7919921875, -3.58807373046875, -3.3841552734375, -3.18023681640625, -2.976318359375, -2.77239990234375, -2.5684814453125, -2.36456298828125, -2.16064453125, -1.95672607421875, -1.7528076171875, -1.54888916015625, -1.344970703125, -1.14105224609375, -0.9371337890625, -0.73321533203125, -0.529296875, -0.32537841796875, -0.1214599609375, 0.08245849609375, 0.286376953125, 0.49029541015625, 0.6942138671875, 0.89813232421875, 1.10205078125, 1.30596923828125, 1.5098876953125, 1.71380615234375, 1.917724609375, 2.12164306640625, 2.3255615234375, 2.52947998046875, 2.7333984375, 2.93731689453125, 3.1412353515625, 3.34515380859375, 3.549072265625, 3.75299072265625, 3.9569091796875, 4.16082763671875, 4.36474609375, 4.56866455078125, 4.7725830078125, 4.97650146484375, 5.180419921875, 5.38433837890625, 5.5882568359375, 5.79217529296875, 5.99609375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 7.0, 6.0, 5.0, 10.0, 8.0, 17.0, 19.0, 18.0, 19.0, 21.0, 22.0, 24.0, 43.0, 42.0, 25.0, 36.0, 27.0, 32.0, 37.0, 44.0, 29.0, 39.0, 27.0, 45.0, 39.0, 34.0, 38.0, 39.0, 28.0, 35.0, 27.0, 24.0, 21.0, 17.0, 19.0, 13.0, 13.0, 9.0, 10.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.125, -7.8763427734375, -7.627685546875, -7.3790283203125, -7.13037109375, -6.8817138671875, -6.633056640625, -6.3843994140625, -6.1357421875, -5.8870849609375, -5.638427734375, -5.3897705078125, -5.14111328125, -4.8924560546875, -4.643798828125, -4.3951416015625, -4.146484375, -3.8978271484375, -3.649169921875, -3.4005126953125, -3.15185546875, -2.9031982421875, -2.654541015625, -2.4058837890625, -2.1572265625, -1.9085693359375, -1.659912109375, -1.4112548828125, -1.16259765625, -0.9139404296875, -0.665283203125, -0.4166259765625, -0.16796875, 0.0806884765625, 0.329345703125, 0.5780029296875, 0.82666015625, 1.0753173828125, 1.323974609375, 1.5726318359375, 1.8212890625, 2.0699462890625, 2.318603515625, 2.5672607421875, 2.81591796875, 3.0645751953125, 3.313232421875, 3.5618896484375, 3.810546875, 4.0592041015625, 4.307861328125, 4.5565185546875, 4.80517578125, 5.0538330078125, 5.302490234375, 5.5511474609375, 5.7998046875, 6.0484619140625, 6.297119140625, 6.5457763671875, 6.79443359375, 7.0430908203125, 7.291748046875, 7.5404052734375, 7.7890625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 3.0, 6.0, 3.0, 5.0, 6.0, 10.0, 11.0, 20.0, 25.0, 45.0, 76.0, 100.0, 158.0, 312.0, 498.0, 850.0, 1423.0, 2376.0, 4002.0, 6592.0, 11356.0, 19442.0, 33374.0, 57303.0, 93505.0, 138567.0, 171662.0, 167150.0, 129783.0, 86150.0, 51531.0, 29797.0, 17519.0, 10075.0, 5896.0, 3551.0, 2153.0, 1291.0, 753.0, 434.0, 257.0, 171.0, 111.0, 87.0, 39.0, 28.0, 14.0, 9.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.31640625, -7.07171630859375, -6.8270263671875, -6.58233642578125, -6.337646484375, -6.09295654296875, -5.8482666015625, -5.60357666015625, -5.35888671875, -5.11419677734375, -4.8695068359375, -4.62481689453125, -4.380126953125, -4.13543701171875, -3.8907470703125, -3.64605712890625, -3.4013671875, -3.15667724609375, -2.9119873046875, -2.66729736328125, -2.422607421875, -2.17791748046875, -1.9332275390625, -1.68853759765625, -1.44384765625, -1.19915771484375, -0.9544677734375, -0.70977783203125, -0.465087890625, -0.22039794921875, 0.0242919921875, 0.26898193359375, 0.513671875, 0.75836181640625, 1.0030517578125, 1.24774169921875, 1.492431640625, 1.73712158203125, 1.9818115234375, 2.22650146484375, 2.47119140625, 2.71588134765625, 2.9605712890625, 3.20526123046875, 3.449951171875, 3.69464111328125, 3.9393310546875, 4.18402099609375, 4.4287109375, 4.67340087890625, 4.9180908203125, 5.16278076171875, 5.407470703125, 5.65216064453125, 5.8968505859375, 6.14154052734375, 6.38623046875, 6.63092041015625, 6.8756103515625, 7.12030029296875, 7.364990234375, 7.60968017578125, 7.8543701171875, 8.09906005859375, 8.34375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 5.0, 7.0, 9.0, 9.0, 8.0, 15.0, 19.0, 14.0, 21.0, 28.0, 32.0, 36.0, 38.0, 44.0, 34.0, 39.0, 39.0, 42.0, 45.0, 56.0, 45.0, 54.0, 46.0, 44.0, 33.0, 34.0, 32.0, 31.0, 22.0, 29.0, 18.0, 25.0, 9.0, 13.0, 7.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.00390625, -6.8275146484375, -6.651123046875, -6.4747314453125, -6.29833984375, -6.1219482421875, -5.945556640625, -5.7691650390625, -5.5927734375, -5.4163818359375, -5.239990234375, -5.0635986328125, -4.88720703125, -4.7108154296875, -4.534423828125, -4.3580322265625, -4.181640625, -4.0052490234375, -3.828857421875, -3.6524658203125, -3.47607421875, -3.2996826171875, -3.123291015625, -2.9468994140625, -2.7705078125, -2.5941162109375, -2.417724609375, -2.2413330078125, -2.06494140625, -1.8885498046875, -1.712158203125, -1.5357666015625, -1.359375, -1.1829833984375, -1.006591796875, -0.8302001953125, -0.65380859375, -0.4774169921875, -0.301025390625, -0.1246337890625, 0.0517578125, 0.2281494140625, 0.404541015625, 0.5809326171875, 0.75732421875, 0.9337158203125, 1.110107421875, 1.2864990234375, 1.462890625, 1.6392822265625, 1.815673828125, 1.9920654296875, 2.16845703125, 2.3448486328125, 2.521240234375, 2.6976318359375, 2.8740234375, 3.0504150390625, 3.226806640625, 3.4031982421875, 3.57958984375, 3.7559814453125, 3.932373046875, 4.1087646484375, 4.28515625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 16.0, 17.0, 34.0, 57.0, 73.0, 109.0, 182.0, 283.0, 473.0, 707.0, 1141.0, 1825.0, 3007.0, 4851.0, 8031.0, 13734.0, 23796.0, 41459.0, 72097.0, 118588.0, 168852.0, 186131.0, 154593.0, 103138.0, 61170.0, 35004.0, 20076.0, 11374.0, 6864.0, 4154.0, 2548.0, 1558.0, 926.0, 579.0, 430.0, 233.0, 175.0, 87.0, 67.0, 36.0, 25.0, 19.0, 11.0, 9.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.1171875, -3.99371337890625, -3.8702392578125, -3.74676513671875, -3.623291015625, -3.49981689453125, -3.3763427734375, -3.25286865234375, -3.12939453125, -3.00592041015625, -2.8824462890625, -2.75897216796875, -2.635498046875, -2.51202392578125, -2.3885498046875, -2.26507568359375, -2.1416015625, -2.01812744140625, -1.8946533203125, -1.77117919921875, -1.647705078125, -1.52423095703125, -1.4007568359375, -1.27728271484375, -1.15380859375, -1.03033447265625, -0.9068603515625, -0.78338623046875, -0.659912109375, -0.53643798828125, -0.4129638671875, -0.28948974609375, -0.166015625, -0.04254150390625, 0.0809326171875, 0.20440673828125, 0.327880859375, 0.45135498046875, 0.5748291015625, 0.69830322265625, 0.82177734375, 0.94525146484375, 1.0687255859375, 1.19219970703125, 1.315673828125, 1.43914794921875, 1.5626220703125, 1.68609619140625, 1.8095703125, 1.93304443359375, 2.0565185546875, 2.17999267578125, 2.303466796875, 2.42694091796875, 2.5504150390625, 2.67388916015625, 2.79736328125, 2.92083740234375, 3.0443115234375, 3.16778564453125, 3.291259765625, 3.41473388671875, 3.5382080078125, 3.66168212890625, 3.78515625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 0.0, 3.0, 9.0, 6.0, 6.0, 15.0, 8.0, 11.0, 21.0, 22.0, 26.0, 32.0, 36.0, 45.0, 54.0, 68.0, 61.0, 64.0, 78.0, 72.0, 68.0, 59.0, 50.0, 31.0, 42.0, 24.0, 27.0, 13.0, 19.0, 7.0, 9.0, 3.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002620220184326172, -0.000249471515417099, -0.0002369210124015808, -0.00022437050938606262, -0.00021182000637054443, -0.00019926950335502625, -0.00018671900033950806, -0.00017416849732398987, -0.00016161799430847168, -0.0001490674912929535, -0.0001365169882774353, -0.00012396648526191711, -0.00011141598224639893, -9.886547923088074e-05, -8.631497621536255e-05, -7.376447319984436e-05, -6.121397018432617e-05, -4.8663467168807983e-05, -3.6112964153289795e-05, -2.3562461137771606e-05, -1.1011958122253418e-05, 1.5385448932647705e-06, 1.4089047908782959e-05, 2.6639550924301147e-05, 3.9190053939819336e-05, 5.1740556955337524e-05, 6.429105997085571e-05, 7.68415629863739e-05, 8.939206600189209e-05, 0.00010194256901741028, 0.00011449307203292847, 0.00012704357504844666, 0.00013959407806396484, 0.00015214458107948303, 0.00016469508409500122, 0.0001772455871105194, 0.0001897960901260376, 0.00020234659314155579, 0.00021489709615707397, 0.00022744759917259216, 0.00023999810218811035, 0.00025254860520362854, 0.00026509910821914673, 0.0002776496112346649, 0.0002902001142501831, 0.0003027506172657013, 0.0003153011202812195, 0.00032785162329673767, 0.00034040212631225586, 0.00035295262932777405, 0.00036550313234329224, 0.0003780536353588104, 0.0003906041383743286, 0.0004031546413898468, 0.000415705144405365, 0.0004282556474208832, 0.00044080615043640137, 0.00045335665345191956, 0.00046590715646743774, 0.00047845765948295593, 0.0004910081624984741, 0.0005035586655139923, 0.0005161091685295105, 0.0005286596715450287, 0.0005412101745605469]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 9.0, 11.0, 9.0, 13.0, 32.0, 46.0, 63.0, 95.0, 156.0, 237.0, 351.0, 552.0, 801.0, 1293.0, 2100.0, 3428.0, 5694.0, 9482.0, 16445.0, 28935.0, 50792.0, 87574.0, 141971.0, 186588.0, 181975.0, 134386.0, 83063.0, 47134.0, 26816.0, 15616.0, 8993.0, 5236.0, 3146.0, 2013.0, 1234.0, 776.0, 464.0, 317.0, 236.0, 147.0, 98.0, 66.0, 54.0, 44.0, 25.0, 16.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.05078125, -3.9239501953125, -3.797119140625, -3.6702880859375, -3.54345703125, -3.4166259765625, -3.289794921875, -3.1629638671875, -3.0361328125, -2.9093017578125, -2.782470703125, -2.6556396484375, -2.52880859375, -2.4019775390625, -2.275146484375, -2.1483154296875, -2.021484375, -1.8946533203125, -1.767822265625, -1.6409912109375, -1.51416015625, -1.3873291015625, -1.260498046875, -1.1336669921875, -1.0068359375, -0.8800048828125, -0.753173828125, -0.6263427734375, -0.49951171875, -0.3726806640625, -0.245849609375, -0.1190185546875, 0.0078125, 0.1346435546875, 0.261474609375, 0.3883056640625, 0.51513671875, 0.6419677734375, 0.768798828125, 0.8956298828125, 1.0224609375, 1.1492919921875, 1.276123046875, 1.4029541015625, 1.52978515625, 1.6566162109375, 1.783447265625, 1.9102783203125, 2.037109375, 2.1639404296875, 2.290771484375, 2.4176025390625, 2.54443359375, 2.6712646484375, 2.798095703125, 2.9249267578125, 3.0517578125, 3.1785888671875, 3.305419921875, 3.4322509765625, 3.55908203125, 3.6859130859375, 3.812744140625, 3.9395751953125, 4.06640625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 7.0, 10.0, 18.0, 15.0, 23.0, 20.0, 28.0, 34.0, 41.0, 51.0, 37.0, 51.0, 54.0, 53.0, 59.0, 48.0, 53.0, 59.0, 48.0, 43.0, 38.0, 30.0, 32.0, 29.0, 22.0, 20.0, 15.0, 7.0, 8.0, 7.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3046875, -1.2688369750976562, -1.2329864501953125, -1.1971359252929688, -1.161285400390625, -1.1254348754882812, -1.0895843505859375, -1.0537338256835938, -1.01788330078125, -0.9820327758789062, -0.9461822509765625, -0.9103317260742188, -0.874481201171875, -0.8386306762695312, -0.8027801513671875, -0.7669296264648438, -0.7310791015625, -0.6952285766601562, -0.6593780517578125, -0.6235275268554688, -0.587677001953125, -0.5518264770507812, -0.5159759521484375, -0.48012542724609375, -0.44427490234375, -0.40842437744140625, -0.3725738525390625, -0.33672332763671875, -0.300872802734375, -0.26502227783203125, -0.2291717529296875, -0.19332122802734375, -0.157470703125, -0.12162017822265625, -0.0857696533203125, -0.04991912841796875, -0.014068603515625, 0.02178192138671875, 0.0576324462890625, 0.09348297119140625, 0.12933349609375, 0.16518402099609375, 0.2010345458984375, 0.23688507080078125, 0.272735595703125, 0.30858612060546875, 0.3444366455078125, 0.38028717041015625, 0.4161376953125, 0.45198822021484375, 0.4878387451171875, 0.5236892700195312, 0.559539794921875, 0.5953903198242188, 0.6312408447265625, 0.6670913696289062, 0.70294189453125, 0.7387924194335938, 0.7746429443359375, 0.8104934692382812, 0.846343994140625, 0.8821945190429688, 0.9180450439453125, 0.9538955688476562, 0.98974609375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 9.0, 11.0, 4.0, 11.0, 16.0, 19.0, 25.0, 34.0, 53.0, 57.0, 73.0, 80.0, 88.0, 105.0, 82.0, 85.0, 55.0, 50.0, 37.0, 23.0, 24.0, 17.0, 6.0, 9.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.371761322021484, -12.816137313842773, -12.260513305664062, -11.704889297485352, -11.14926528930664, -10.59364128112793, -10.038016319274902, -9.482392311096191, -8.92676830291748, -8.37114429473877, -7.815520286560059, -7.2598958015441895, -6.7042717933654785, -6.148647785186768, -5.593023300170898, -5.0373992919921875, -4.481775283813477, -3.9261512756347656, -3.3705270290374756, -2.8149027824401855, -2.2592787742614746, -1.7036547660827637, -1.1480305194854736, -0.5924062728881836, -0.036782264709472656, 0.5188418626785278, 1.0744659900665283, 1.6300901174545288, 2.1857142448425293, 2.7413382530212402, 3.2969624996185303, 3.8525867462158203, 4.408210754394531, 4.963834762573242, 5.519458770751953, 6.075083255767822, 6.630707263946533, 7.186331272125244, 7.741955757141113, 8.297579765319824, 8.853203773498535, 9.408827781677246, 9.964451789855957, 10.520075798034668, 11.075700759887695, 11.631324768066406, 12.186948776245117, 12.742572784423828, 13.298196792602539, 13.85382080078125, 14.409444808959961, 14.965068817138672, 15.520692825317383, 16.076316833496094, 16.631940841674805, 17.187564849853516, 17.74319076538086, 18.29881477355957, 18.85443878173828, 19.410062789916992, 19.965686798095703, 20.521310806274414, 21.076934814453125, 21.63256072998047, 22.188182830810547]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 6.0, 3.0, 7.0, 7.0, 10.0, 7.0, 10.0, 13.0, 14.0, 15.0, 22.0, 15.0, 16.0, 27.0, 21.0, 26.0, 40.0, 30.0, 35.0, 32.0, 38.0, 30.0, 31.0, 43.0, 37.0, 51.0, 43.0, 38.0, 30.0, 29.0, 27.0, 24.0, 28.0, 26.0, 30.0, 23.0, 23.0, 17.0, 16.0, 10.0, 12.0, 13.0, 6.0, 6.0, 6.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-7.199282646179199, -6.966243743896484, -6.7332048416137695, -6.500165939331055, -6.26712703704834, -6.034088134765625, -5.801049709320068, -5.5680108070373535, -5.334971904754639, -5.101933002471924, -4.868894100189209, -4.635855197906494, -4.4028167724609375, -4.169777870178223, -3.936738967895508, -3.703700065612793, -3.470661163330078, -3.2376222610473633, -3.0045833587646484, -2.7715446949005127, -2.538505792617798, -2.305466890335083, -2.0724282264709473, -1.8393893241882324, -1.6063504219055176, -1.3733115196228027, -1.1402727365493774, -0.9072338938713074, -0.6741950511932373, -0.44115614891052246, -0.20811736583709717, 0.024921417236328125, 0.25796079635620117, 0.49099963903427124, 0.7240384817123413, 0.9570773243904114, 1.1901161670684814, 1.4231550693511963, 1.6561938524246216, 1.8892326354980469, 2.1222715377807617, 2.3553104400634766, 2.5883493423461914, 2.821388006210327, 3.054426908493042, 3.287465810775757, 3.5205044746398926, 3.7535433769226074, 3.9865822792053223, 4.219621181488037, 4.452660083770752, 4.685698986053467, 4.918737411499023, 5.151776313781738, 5.384815216064453, 5.617854118347168, 5.850893020629883, 6.083931922912598, 6.3169708251953125, 6.550009727478027, 6.783048629760742, 7.016087532043457, 7.249125957489014, 7.4821648597717285, 7.715203762054443]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 3.0, 9.0, 20.0, 19.0, 32.0, 44.0, 77.0, 109.0, 153.0, 232.0, 307.0, 482.0, 685.0, 1083.0, 1659.0, 2515.0, 3973.0, 6543.0, 11398.0, 21077.0, 44569.0, 110162.0, 323393.0, 920679.0, 1447071.0, 826367.0, 283672.0, 98966.0, 40716.0, 19850.0, 11023.0, 6452.0, 3907.0, 2473.0, 1566.0, 1013.0, 679.0, 460.0, 295.0, 172.0, 147.0, 86.0, 52.0, 34.0, 21.0, 10.0, 9.0, 7.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.625, -17.064453125, -16.50390625, -15.943359375, -15.3828125, -14.822265625, -14.26171875, -13.701171875, -13.140625, -12.580078125, -12.01953125, -11.458984375, -10.8984375, -10.337890625, -9.77734375, -9.216796875, -8.65625, -8.095703125, -7.53515625, -6.974609375, -6.4140625, -5.853515625, -5.29296875, -4.732421875, -4.171875, -3.611328125, -3.05078125, -2.490234375, -1.9296875, -1.369140625, -0.80859375, -0.248046875, 0.3125, 0.873046875, 1.43359375, 1.994140625, 2.5546875, 3.115234375, 3.67578125, 4.236328125, 4.796875, 5.357421875, 5.91796875, 6.478515625, 7.0390625, 7.599609375, 8.16015625, 8.720703125, 9.28125, 9.841796875, 10.40234375, 10.962890625, 11.5234375, 12.083984375, 12.64453125, 13.205078125, 13.765625, 14.326171875, 14.88671875, 15.447265625, 16.0078125, 16.568359375, 17.12890625, 17.689453125, 18.25]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 0.0, 8.0, 9.0, 9.0, 16.0, 28.0, 17.0, 26.0, 25.0, 20.0, 30.0, 32.0, 40.0, 38.0, 41.0, 32.0, 46.0, 52.0, 40.0, 37.0, 50.0, 47.0, 43.0, 44.0, 41.0, 36.0, 21.0, 28.0, 30.0, 24.0, 13.0, 15.0, 10.0, 14.0, 9.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.96875, -6.74566650390625, -6.5225830078125, -6.29949951171875, -6.076416015625, -5.85333251953125, -5.6302490234375, -5.40716552734375, -5.18408203125, -4.96099853515625, -4.7379150390625, -4.51483154296875, -4.291748046875, -4.06866455078125, -3.8455810546875, -3.62249755859375, -3.3994140625, -3.17633056640625, -2.9532470703125, -2.73016357421875, -2.507080078125, -2.28399658203125, -2.0609130859375, -1.83782958984375, -1.61474609375, -1.39166259765625, -1.1685791015625, -0.94549560546875, -0.722412109375, -0.49932861328125, -0.2762451171875, -0.05316162109375, 0.169921875, 0.39300537109375, 0.6160888671875, 0.83917236328125, 1.062255859375, 1.28533935546875, 1.5084228515625, 1.73150634765625, 1.95458984375, 2.17767333984375, 2.4007568359375, 2.62384033203125, 2.846923828125, 3.07000732421875, 3.2930908203125, 3.51617431640625, 3.7392578125, 3.96234130859375, 4.1854248046875, 4.40850830078125, 4.631591796875, 4.85467529296875, 5.0777587890625, 5.30084228515625, 5.52392578125, 5.74700927734375, 5.9700927734375, 6.19317626953125, 6.416259765625, 6.63934326171875, 6.8624267578125, 7.08551025390625, 7.30859375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 11.0, 23.0, 33.0, 42.0, 59.0, 80.0, 121.0, 180.0, 241.0, 435.0, 608.0, 929.0, 1432.0, 2306.0, 3708.0, 6371.0, 10787.0, 20271.0, 39550.0, 85802.0, 202852.0, 502566.0, 1054377.0, 1171566.0, 626973.0, 254277.0, 105829.0, 48092.0, 23749.0, 12544.0, 7074.0, 4201.0, 2608.0, 1602.0, 981.0, 644.0, 427.0, 274.0, 206.0, 134.0, 94.0, 57.0, 50.0, 38.0, 19.0, 19.0, 10.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0], "bins": [-18.84375, -18.27490234375, -17.7060546875, -17.13720703125, -16.568359375, -15.99951171875, -15.4306640625, -14.86181640625, -14.29296875, -13.72412109375, -13.1552734375, -12.58642578125, -12.017578125, -11.44873046875, -10.8798828125, -10.31103515625, -9.7421875, -9.17333984375, -8.6044921875, -8.03564453125, -7.466796875, -6.89794921875, -6.3291015625, -5.76025390625, -5.19140625, -4.62255859375, -4.0537109375, -3.48486328125, -2.916015625, -2.34716796875, -1.7783203125, -1.20947265625, -0.640625, -0.07177734375, 0.4970703125, 1.06591796875, 1.634765625, 2.20361328125, 2.7724609375, 3.34130859375, 3.91015625, 4.47900390625, 5.0478515625, 5.61669921875, 6.185546875, 6.75439453125, 7.3232421875, 7.89208984375, 8.4609375, 9.02978515625, 9.5986328125, 10.16748046875, 10.736328125, 11.30517578125, 11.8740234375, 12.44287109375, 13.01171875, 13.58056640625, 14.1494140625, 14.71826171875, 15.287109375, 15.85595703125, 16.4248046875, 16.99365234375, 17.5625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 7.0, 8.0, 8.0, 12.0, 23.0, 17.0, 42.0, 32.0, 47.0, 63.0, 89.0, 90.0, 131.0, 158.0, 199.0, 238.0, 261.0, 320.0, 313.0, 300.0, 281.0, 289.0, 239.0, 195.0, 164.0, 144.0, 89.0, 78.0, 62.0, 45.0, 21.0, 28.0, 20.0, 11.0, 9.0, 10.0, 12.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0234375, -3.8699951171875, -3.716552734375, -3.5631103515625, -3.40966796875, -3.2562255859375, -3.102783203125, -2.9493408203125, -2.7958984375, -2.6424560546875, -2.489013671875, -2.3355712890625, -2.18212890625, -2.0286865234375, -1.875244140625, -1.7218017578125, -1.568359375, -1.4149169921875, -1.261474609375, -1.1080322265625, -0.95458984375, -0.8011474609375, -0.647705078125, -0.4942626953125, -0.3408203125, -0.1873779296875, -0.033935546875, 0.1195068359375, 0.27294921875, 0.4263916015625, 0.579833984375, 0.7332763671875, 0.88671875, 1.0401611328125, 1.193603515625, 1.3470458984375, 1.50048828125, 1.6539306640625, 1.807373046875, 1.9608154296875, 2.1142578125, 2.2677001953125, 2.421142578125, 2.5745849609375, 2.72802734375, 2.8814697265625, 3.034912109375, 3.1883544921875, 3.341796875, 3.4952392578125, 3.648681640625, 3.8021240234375, 3.95556640625, 4.1090087890625, 4.262451171875, 4.4158935546875, 4.5693359375, 4.7227783203125, 4.876220703125, 5.0296630859375, 5.18310546875, 5.3365478515625, 5.489990234375, 5.6434326171875, 5.796875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 9.0, 13.0, 6.0, 8.0, 16.0, 19.0, 23.0, 31.0, 47.0, 59.0, 62.0, 74.0, 84.0, 61.0, 77.0, 67.0, 58.0, 54.0, 47.0, 35.0, 39.0, 20.0, 19.0, 17.0, 12.0, 9.0, 7.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.190109252929688, -15.663307189941406, -15.136505126953125, -14.609703063964844, -14.082901000976562, -13.556098937988281, -13.029295921325684, -12.502493858337402, -11.975691795349121, -11.44888973236084, -10.922087669372559, -10.395285606384277, -9.86848258972168, -9.341680526733398, -8.814878463745117, -8.288076400756836, -7.761274337768555, -7.234472274780273, -6.707670211791992, -6.180867671966553, -5.6540656089782715, -5.12726354598999, -4.600461006164551, -4.0736589431762695, -3.5468568801879883, -3.020054817199707, -2.4932525157928467, -1.9664503335952759, -1.439648151397705, -0.9128460884094238, -0.3860437870025635, 0.14075851440429688, 0.6675586700439453, 1.1943608522415161, 1.721163034439087, 2.2479653358459473, 2.7747673988342285, 3.3015694618225098, 3.82837176322937, 4.3551740646362305, 4.881976127624512, 5.408778190612793, 5.935580253601074, 6.462382793426514, 6.989184856414795, 7.515986919403076, 8.042789459228516, 8.569591522216797, 9.096393585205078, 9.62319564819336, 10.14999771118164, 10.676799774169922, 11.203601837158203, 11.730403900146484, 12.257206916809082, 12.784008979797363, 13.310811042785645, 13.837613105773926, 14.364415168762207, 14.891217231750488, 15.418020248413086, 15.944822311401367, 16.47162437438965, 16.99842643737793, 17.52522850036621]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 13.0, 15.0, 8.0, 18.0, 10.0, 19.0, 20.0, 24.0, 36.0, 24.0, 25.0, 32.0, 30.0, 36.0, 40.0, 40.0, 30.0, 36.0, 32.0, 34.0, 39.0, 36.0, 33.0, 32.0, 27.0, 35.0, 34.0, 20.0, 33.0, 35.0, 18.0, 23.0, 11.0, 18.0, 20.0, 9.0, 4.0, 7.0, 8.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.16486930847168, -7.919648170471191, -7.674427032470703, -7.429205417633057, -7.183984279632568, -6.93876314163208, -6.693541526794434, -6.448320388793945, -6.203099250793457, -5.957878112792969, -5.7126569747924805, -5.467435359954834, -5.222214221954346, -4.976993083953857, -4.731771469116211, -4.486550331115723, -4.241329193115234, -3.996108055114746, -3.7508866786956787, -3.5056653022766113, -3.260444164276123, -3.0152230262756348, -2.7700016498565674, -2.5247802734375, -2.2795591354370117, -2.0343379974365234, -1.789116621017456, -1.5438953638076782, -1.2986741065979004, -1.0534528493881226, -0.8082315921783447, -0.5630103349685669, -0.31778860092163086, -0.07256734371185303, 0.1726539134979248, 0.41787517070770264, 0.6630964279174805, 0.9083176851272583, 1.1535389423370361, 1.398760199546814, 1.6439814567565918, 1.8892027139663696, 2.1344239711761475, 2.379645347595215, 2.624866485595703, 2.8700876235961914, 3.115309000015259, 3.360530376434326, 3.6057515144348145, 3.8509726524353027, 4.096194267272949, 4.3414154052734375, 4.586636543273926, 4.831857681274414, 5.077078819274902, 5.322300434112549, 5.567521572113037, 5.812742710113525, 6.057964324951172, 6.30318546295166, 6.548406600952148, 6.793627738952637, 7.038848876953125, 7.2840704917907715, 7.52929162979126]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 10.0, 6.0, 11.0, 16.0, 19.0, 40.0, 72.0, 131.0, 176.0, 245.0, 372.0, 548.0, 855.0, 1322.0, 1950.0, 2984.0, 4623.0, 7352.0, 11225.0, 17387.0, 27151.0, 42128.0, 63870.0, 94320.0, 128353.0, 151210.0, 144360.0, 114445.0, 81215.0, 53951.0, 34857.0, 22511.0, 14499.0, 9255.0, 5872.0, 3943.0, 2462.0, 1652.0, 1044.0, 727.0, 448.0, 348.0, 214.0, 138.0, 88.0, 58.0, 40.0, 29.0, 16.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.11328125, -3.99505615234375, -3.8768310546875, -3.75860595703125, -3.640380859375, -3.52215576171875, -3.4039306640625, -3.28570556640625, -3.16748046875, -3.04925537109375, -2.9310302734375, -2.81280517578125, -2.694580078125, -2.57635498046875, -2.4581298828125, -2.33990478515625, -2.2216796875, -2.10345458984375, -1.9852294921875, -1.86700439453125, -1.748779296875, -1.63055419921875, -1.5123291015625, -1.39410400390625, -1.27587890625, -1.15765380859375, -1.0394287109375, -0.92120361328125, -0.802978515625, -0.68475341796875, -0.5665283203125, -0.44830322265625, -0.330078125, -0.21185302734375, -0.0936279296875, 0.02459716796875, 0.142822265625, 0.26104736328125, 0.3792724609375, 0.49749755859375, 0.61572265625, 0.73394775390625, 0.8521728515625, 0.97039794921875, 1.088623046875, 1.20684814453125, 1.3250732421875, 1.44329833984375, 1.5615234375, 1.67974853515625, 1.7979736328125, 1.91619873046875, 2.034423828125, 2.15264892578125, 2.2708740234375, 2.38909912109375, 2.50732421875, 2.62554931640625, 2.7437744140625, 2.86199951171875, 2.980224609375, 3.09844970703125, 3.2166748046875, 3.33489990234375, 3.453125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 10.0, 6.0, 12.0, 16.0, 16.0, 11.0, 12.0, 21.0, 16.0, 21.0, 19.0, 24.0, 34.0, 36.0, 27.0, 34.0, 37.0, 31.0, 28.0, 35.0, 46.0, 33.0, 32.0, 42.0, 38.0, 27.0, 32.0, 34.0, 28.0, 24.0, 36.0, 22.0, 19.0, 13.0, 25.0, 21.0, 6.0, 16.0, 13.0, 10.0, 8.0, 5.0, 5.0, 0.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-8.671875, -8.408935546875, -8.14599609375, -7.883056640625, -7.6201171875, -7.357177734375, -7.09423828125, -6.831298828125, -6.568359375, -6.305419921875, -6.04248046875, -5.779541015625, -5.5166015625, -5.253662109375, -4.99072265625, -4.727783203125, -4.46484375, -4.201904296875, -3.93896484375, -3.676025390625, -3.4130859375, -3.150146484375, -2.88720703125, -2.624267578125, -2.361328125, -2.098388671875, -1.83544921875, -1.572509765625, -1.3095703125, -1.046630859375, -0.78369140625, -0.520751953125, -0.2578125, 0.005126953125, 0.26806640625, 0.531005859375, 0.7939453125, 1.056884765625, 1.31982421875, 1.582763671875, 1.845703125, 2.108642578125, 2.37158203125, 2.634521484375, 2.8974609375, 3.160400390625, 3.42333984375, 3.686279296875, 3.94921875, 4.212158203125, 4.47509765625, 4.738037109375, 5.0009765625, 5.263916015625, 5.52685546875, 5.789794921875, 6.052734375, 6.315673828125, 6.57861328125, 6.841552734375, 7.1044921875, 7.367431640625, 7.63037109375, 7.893310546875, 8.15625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 10.0, 15.0, 19.0, 17.0, 38.0, 72.0, 69.0, 117.0, 162.0, 227.0, 351.0, 520.0, 846.0, 1292.0, 1995.0, 3238.0, 5207.0, 9052.0, 15945.0, 28532.0, 53484.0, 102005.0, 181014.0, 236950.0, 182284.0, 102665.0, 54421.0, 28897.0, 15875.0, 9004.0, 5313.0, 3191.0, 1973.0, 1263.0, 839.0, 480.0, 343.0, 243.0, 214.0, 116.0, 82.0, 54.0, 39.0, 20.0, 22.0, 13.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.14453125, -5.95550537109375, -5.7664794921875, -5.57745361328125, -5.388427734375, -5.19940185546875, -5.0103759765625, -4.82135009765625, -4.63232421875, -4.44329833984375, -4.2542724609375, -4.06524658203125, -3.876220703125, -3.68719482421875, -3.4981689453125, -3.30914306640625, -3.1201171875, -2.93109130859375, -2.7420654296875, -2.55303955078125, -2.364013671875, -2.17498779296875, -1.9859619140625, -1.79693603515625, -1.60791015625, -1.41888427734375, -1.2298583984375, -1.04083251953125, -0.851806640625, -0.66278076171875, -0.4737548828125, -0.28472900390625, -0.095703125, 0.09332275390625, 0.2823486328125, 0.47137451171875, 0.660400390625, 0.84942626953125, 1.0384521484375, 1.22747802734375, 1.41650390625, 1.60552978515625, 1.7945556640625, 1.98358154296875, 2.172607421875, 2.36163330078125, 2.5506591796875, 2.73968505859375, 2.9287109375, 3.11773681640625, 3.3067626953125, 3.49578857421875, 3.684814453125, 3.87384033203125, 4.0628662109375, 4.25189208984375, 4.44091796875, 4.62994384765625, 4.8189697265625, 5.00799560546875, 5.197021484375, 5.38604736328125, 5.5750732421875, 5.76409912109375, 5.953125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 9.0, 13.0, 19.0, 18.0, 16.0, 22.0, 19.0, 24.0, 31.0, 26.0, 39.0, 30.0, 36.0, 50.0, 51.0, 41.0, 37.0, 41.0, 44.0, 41.0, 49.0, 28.0, 31.0, 42.0, 28.0, 24.0, 20.0, 22.0, 20.0, 16.0, 19.0, 10.0, 12.0, 12.0, 9.0, 5.0, 3.0, 9.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.796875, -4.631103515625, -4.46533203125, -4.299560546875, -4.1337890625, -3.968017578125, -3.80224609375, -3.636474609375, -3.470703125, -3.304931640625, -3.13916015625, -2.973388671875, -2.8076171875, -2.641845703125, -2.47607421875, -2.310302734375, -2.14453125, -1.978759765625, -1.81298828125, -1.647216796875, -1.4814453125, -1.315673828125, -1.14990234375, -0.984130859375, -0.818359375, -0.652587890625, -0.48681640625, -0.321044921875, -0.1552734375, 0.010498046875, 0.17626953125, 0.342041015625, 0.5078125, 0.673583984375, 0.83935546875, 1.005126953125, 1.1708984375, 1.336669921875, 1.50244140625, 1.668212890625, 1.833984375, 1.999755859375, 2.16552734375, 2.331298828125, 2.4970703125, 2.662841796875, 2.82861328125, 2.994384765625, 3.16015625, 3.325927734375, 3.49169921875, 3.657470703125, 3.8232421875, 3.989013671875, 4.15478515625, 4.320556640625, 4.486328125, 4.652099609375, 4.81787109375, 4.983642578125, 5.1494140625, 5.315185546875, 5.48095703125, 5.646728515625, 5.8125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 11.0, 18.0, 17.0, 32.0, 54.0, 64.0, 75.0, 152.0, 193.0, 300.0, 418.0, 667.0, 978.0, 1538.0, 2444.0, 4111.0, 7102.0, 13252.0, 25450.0, 53319.0, 119165.0, 245616.0, 282668.0, 152558.0, 68866.0, 32122.0, 16093.0, 8462.0, 4778.0, 2848.0, 1757.0, 1152.0, 772.0, 471.0, 320.0, 203.0, 152.0, 110.0, 69.0, 54.0, 38.0, 23.0, 16.0, 11.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.560546875, -3.453155517578125, -3.34576416015625, -3.238372802734375, -3.1309814453125, -3.023590087890625, -2.91619873046875, -2.808807373046875, -2.701416015625, -2.594024658203125, -2.48663330078125, -2.379241943359375, -2.2718505859375, -2.164459228515625, -2.05706787109375, -1.949676513671875, -1.84228515625, -1.734893798828125, -1.62750244140625, -1.520111083984375, -1.4127197265625, -1.305328369140625, -1.19793701171875, -1.090545654296875, -0.983154296875, -0.875762939453125, -0.76837158203125, -0.660980224609375, -0.5535888671875, -0.446197509765625, -0.33880615234375, -0.231414794921875, -0.1240234375, -0.016632080078125, 0.09075927734375, 0.198150634765625, 0.3055419921875, 0.412933349609375, 0.52032470703125, 0.627716064453125, 0.735107421875, 0.842498779296875, 0.94989013671875, 1.057281494140625, 1.1646728515625, 1.272064208984375, 1.37945556640625, 1.486846923828125, 1.59423828125, 1.701629638671875, 1.80902099609375, 1.916412353515625, 2.0238037109375, 2.131195068359375, 2.23858642578125, 2.345977783203125, 2.453369140625, 2.560760498046875, 2.66815185546875, 2.775543212890625, 2.8829345703125, 2.990325927734375, 3.09771728515625, 3.205108642578125, 3.3125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 10.0, 10.0, 14.0, 16.0, 14.0, 20.0, 26.0, 33.0, 35.0, 46.0, 54.0, 62.0, 55.0, 89.0, 66.0, 64.0, 64.0, 52.0, 57.0, 25.0, 36.0, 26.0, 23.0, 20.0, 18.0, 13.0, 8.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0001735687255859375, -0.00016891956329345703, -0.00016427040100097656, -0.0001596212387084961, -0.00015497207641601562, -0.00015032291412353516, -0.0001456737518310547, -0.00014102458953857422, -0.00013637542724609375, -0.00013172626495361328, -0.0001270771026611328, -0.00012242794036865234, -0.00011777877807617188, -0.0001131296157836914, -0.00010848045349121094, -0.00010383129119873047, -9.918212890625e-05, -9.453296661376953e-05, -8.988380432128906e-05, -8.52346420288086e-05, -8.058547973632812e-05, -7.593631744384766e-05, -7.128715515136719e-05, -6.663799285888672e-05, -6.198883056640625e-05, -5.733966827392578e-05, -5.269050598144531e-05, -4.8041343688964844e-05, -4.3392181396484375e-05, -3.8743019104003906e-05, -3.409385681152344e-05, -2.944469451904297e-05, -2.47955322265625e-05, -2.014636993408203e-05, -1.5497207641601562e-05, -1.0848045349121094e-05, -6.198883056640625e-06, -1.5497207641601562e-06, 3.0994415283203125e-06, 7.748603820800781e-06, 1.239776611328125e-05, 1.704692840576172e-05, 2.1696090698242188e-05, 2.6345252990722656e-05, 3.0994415283203125e-05, 3.5643577575683594e-05, 4.029273986816406e-05, 4.494190216064453e-05, 4.9591064453125e-05, 5.424022674560547e-05, 5.888938903808594e-05, 6.35385513305664e-05, 6.818771362304688e-05, 7.283687591552734e-05, 7.748603820800781e-05, 8.213520050048828e-05, 8.678436279296875e-05, 9.143352508544922e-05, 9.608268737792969e-05, 0.00010073184967041016, 0.00010538101196289062, 0.0001100301742553711, 0.00011467933654785156, 0.00011932849884033203, 0.0001239776611328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 9.0, 12.0, 12.0, 22.0, 32.0, 38.0, 69.0, 95.0, 150.0, 226.0, 318.0, 481.0, 767.0, 1195.0, 1863.0, 2965.0, 5014.0, 8238.0, 14033.0, 24676.0, 44883.0, 84927.0, 153369.0, 220018.0, 202260.0, 127621.0, 68410.0, 36766.0, 20302.0, 11576.0, 7017.0, 4034.0, 2593.0, 1625.0, 1032.0, 667.0, 414.0, 268.0, 168.0, 117.0, 73.0, 56.0, 47.0, 25.0, 25.0, 15.0, 12.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.140625, -3.041961669921875, -2.94329833984375, -2.844635009765625, -2.7459716796875, -2.647308349609375, -2.54864501953125, -2.449981689453125, -2.351318359375, -2.252655029296875, -2.15399169921875, -2.055328369140625, -1.9566650390625, -1.858001708984375, -1.75933837890625, -1.660675048828125, -1.56201171875, -1.463348388671875, -1.36468505859375, -1.266021728515625, -1.1673583984375, -1.068695068359375, -0.97003173828125, -0.871368408203125, -0.772705078125, -0.674041748046875, -0.57537841796875, -0.476715087890625, -0.3780517578125, -0.279388427734375, -0.18072509765625, -0.082061767578125, 0.0166015625, 0.115264892578125, 0.21392822265625, 0.312591552734375, 0.4112548828125, 0.509918212890625, 0.60858154296875, 0.707244873046875, 0.805908203125, 0.904571533203125, 1.00323486328125, 1.101898193359375, 1.2005615234375, 1.299224853515625, 1.39788818359375, 1.496551513671875, 1.59521484375, 1.693878173828125, 1.79254150390625, 1.891204833984375, 1.9898681640625, 2.088531494140625, 2.18719482421875, 2.285858154296875, 2.384521484375, 2.483184814453125, 2.58184814453125, 2.680511474609375, 2.7791748046875, 2.877838134765625, 2.97650146484375, 3.075164794921875, 3.173828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 5.0, 1.0, 5.0, 5.0, 6.0, 9.0, 11.0, 10.0, 13.0, 13.0, 14.0, 17.0, 31.0, 27.0, 32.0, 52.0, 60.0, 62.0, 77.0, 60.0, 61.0, 66.0, 62.0, 56.0, 46.0, 46.0, 28.0, 28.0, 15.0, 12.0, 13.0, 17.0, 9.0, 5.0, 8.0, 5.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.015625, -0.9866485595703125, -0.957672119140625, -0.9286956787109375, -0.89971923828125, -0.8707427978515625, -0.841766357421875, -0.8127899169921875, -0.7838134765625, -0.7548370361328125, -0.725860595703125, -0.6968841552734375, -0.66790771484375, -0.6389312744140625, -0.609954833984375, -0.5809783935546875, -0.552001953125, -0.5230255126953125, -0.494049072265625, -0.4650726318359375, -0.43609619140625, -0.4071197509765625, -0.378143310546875, -0.3491668701171875, -0.3201904296875, -0.2912139892578125, -0.262237548828125, -0.2332611083984375, -0.20428466796875, -0.1753082275390625, -0.146331787109375, -0.1173553466796875, -0.08837890625, -0.0594024658203125, -0.030426025390625, -0.0014495849609375, 0.02752685546875, 0.0565032958984375, 0.085479736328125, 0.1144561767578125, 0.1434326171875, 0.1724090576171875, 0.201385498046875, 0.2303619384765625, 0.25933837890625, 0.2883148193359375, 0.317291259765625, 0.3462677001953125, 0.375244140625, 0.4042205810546875, 0.433197021484375, 0.4621734619140625, 0.49114990234375, 0.5201263427734375, 0.549102783203125, 0.5780792236328125, 0.6070556640625, 0.6360321044921875, 0.665008544921875, 0.6939849853515625, 0.72296142578125, 0.7519378662109375, 0.780914306640625, 0.8098907470703125, 0.8388671875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 9.0, 10.0, 9.0, 14.0, 18.0, 25.0, 26.0, 40.0, 63.0, 59.0, 62.0, 79.0, 71.0, 68.0, 77.0, 55.0, 54.0, 60.0, 29.0, 28.0, 34.0, 21.0, 13.0, 16.0, 11.0, 8.0, 8.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.306214332580566, -14.796100616455078, -14.28598690032959, -13.775873184204102, -13.26576042175293, -12.755645751953125, -12.245532989501953, -11.735419273376465, -11.225305557250977, -10.715191841125488, -10.205078125, -9.694964408874512, -9.184850692749023, -8.674737930297852, -8.164624214172363, -7.654510498046875, -7.144396781921387, -6.634283065795898, -6.12416934967041, -5.61405611038208, -5.103942394256592, -4.5938286781311035, -4.083715438842773, -3.573601722717285, -3.063488006591797, -2.5533742904663086, -2.0432608127593994, -1.5331472158432007, -1.023033618927002, -0.5129199028015137, -0.002806425094604492, 0.5073070526123047, 1.0174198150634766, 1.5275334119796753, 2.037647008895874, 2.547760486602783, 3.0578742027282715, 3.5679879188537598, 4.07810115814209, 4.588214874267578, 5.098328590393066, 5.608442306518555, 6.118556022644043, 6.628669261932373, 7.138782978057861, 7.64889669418335, 8.15900993347168, 8.669123649597168, 9.179237365722656, 9.689351081848145, 10.199464797973633, 10.709578514099121, 11.21969223022461, 11.729804992675781, 12.23991870880127, 12.750032424926758, 13.260146141052246, 13.770259857177734, 14.280373573303223, 14.790487289428711, 15.300600051879883, 15.810714721679688, 16.32082748413086, 16.83094024658203, 17.341054916381836]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 8.0, 15.0, 13.0, 9.0, 18.0, 15.0, 16.0, 22.0, 23.0, 29.0, 27.0, 27.0, 32.0, 31.0, 39.0, 27.0, 45.0, 24.0, 46.0, 35.0, 36.0, 31.0, 32.0, 41.0, 29.0, 31.0, 33.0, 29.0, 25.0, 35.0, 32.0, 17.0, 17.0, 14.0, 21.0, 13.0, 11.0, 6.0, 8.0, 7.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.075865745544434, -7.832607269287109, -7.589348793029785, -7.346090316772461, -7.102831840515137, -6.8595733642578125, -6.616314888000488, -6.373056411743164, -6.12979793548584, -5.886539459228516, -5.643280982971191, -5.400022506713867, -5.156764030456543, -4.913505554199219, -4.6702470779418945, -4.42698860168457, -4.183730125427246, -3.940471649169922, -3.6972131729125977, -3.4539546966552734, -3.210696220397949, -2.967437744140625, -2.724179267883301, -2.4809207916259766, -2.2376623153686523, -1.9944038391113281, -1.751145362854004, -1.5078868865966797, -1.2646284103393555, -1.0213699340820312, -0.778111457824707, -0.5348529815673828, -0.2915940284729004, -0.04833555221557617, 0.19492292404174805, 0.43818140029907227, 0.6814398765563965, 0.9246983528137207, 1.167956829071045, 1.4112153053283691, 1.6544737815856934, 1.8977322578430176, 2.140990734100342, 2.384249210357666, 2.6275076866149902, 2.8707661628723145, 3.1140246391296387, 3.357283115386963, 3.600541591644287, 3.8438000679016113, 4.0870585441589355, 4.33031702041626, 4.573575496673584, 4.816833972930908, 5.060092449188232, 5.303350925445557, 5.546609401702881, 5.789867877960205, 6.033126354217529, 6.2763848304748535, 6.519643306732178, 6.762901782989502, 7.006160259246826, 7.24941873550415, 7.492677211761475]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 12.0, 16.0, 17.0, 18.0, 37.0, 58.0, 87.0, 142.0, 196.0, 338.0, 499.0, 758.0, 1254.0, 1999.0, 3346.0, 5420.0, 9005.0, 14803.0, 24114.0, 39183.0, 61630.0, 93147.0, 126140.0, 149337.0, 149143.0, 122839.0, 88903.0, 59439.0, 37412.0, 23198.0, 14025.0, 8449.0, 5153.0, 3171.0, 1929.0, 1181.0, 775.0, 514.0, 331.0, 193.0, 91.0, 77.0, 49.0, 40.0, 28.0, 22.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0], "bins": [-8.015625, -7.79266357421875, -7.5697021484375, -7.34674072265625, -7.123779296875, -6.90081787109375, -6.6778564453125, -6.45489501953125, -6.23193359375, -6.00897216796875, -5.7860107421875, -5.56304931640625, -5.340087890625, -5.11712646484375, -4.8941650390625, -4.67120361328125, -4.4482421875, -4.22528076171875, -4.0023193359375, -3.77935791015625, -3.556396484375, -3.33343505859375, -3.1104736328125, -2.88751220703125, -2.66455078125, -2.44158935546875, -2.2186279296875, -1.99566650390625, -1.772705078125, -1.54974365234375, -1.3267822265625, -1.10382080078125, -0.880859375, -0.65789794921875, -0.4349365234375, -0.21197509765625, 0.010986328125, 0.23394775390625, 0.4569091796875, 0.67987060546875, 0.90283203125, 1.12579345703125, 1.3487548828125, 1.57171630859375, 1.794677734375, 2.01763916015625, 2.2406005859375, 2.46356201171875, 2.6865234375, 2.90948486328125, 3.1324462890625, 3.35540771484375, 3.578369140625, 3.80133056640625, 4.0242919921875, 4.24725341796875, 4.47021484375, 4.69317626953125, 4.9161376953125, 5.13909912109375, 5.362060546875, 5.58502197265625, 5.8079833984375, 6.03094482421875, 6.25390625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 13.0, 7.0, 9.0, 16.0, 24.0, 22.0, 35.0, 20.0, 21.0, 32.0, 35.0, 32.0, 24.0, 30.0, 40.0, 37.0, 34.0, 47.0, 39.0, 45.0, 39.0, 33.0, 38.0, 30.0, 28.0, 34.0, 29.0, 34.0, 29.0, 10.0, 17.0, 22.0, 10.0, 12.0, 15.0, 7.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.75, -9.4776611328125, -9.205322265625, -8.9329833984375, -8.66064453125, -8.3883056640625, -8.115966796875, -7.8436279296875, -7.5712890625, -7.2989501953125, -7.026611328125, -6.7542724609375, -6.48193359375, -6.2095947265625, -5.937255859375, -5.6649169921875, -5.392578125, -5.1202392578125, -4.847900390625, -4.5755615234375, -4.30322265625, -4.0308837890625, -3.758544921875, -3.4862060546875, -3.2138671875, -2.9415283203125, -2.669189453125, -2.3968505859375, -2.12451171875, -1.8521728515625, -1.579833984375, -1.3074951171875, -1.03515625, -0.7628173828125, -0.490478515625, -0.2181396484375, 0.05419921875, 0.3265380859375, 0.598876953125, 0.8712158203125, 1.1435546875, 1.4158935546875, 1.688232421875, 1.9605712890625, 2.23291015625, 2.5052490234375, 2.777587890625, 3.0499267578125, 3.322265625, 3.5946044921875, 3.866943359375, 4.1392822265625, 4.41162109375, 4.6839599609375, 4.956298828125, 5.2286376953125, 5.5009765625, 5.7733154296875, 6.045654296875, 6.3179931640625, 6.59033203125, 6.8626708984375, 7.135009765625, 7.4073486328125, 7.6796875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 20.0, 27.0, 44.0, 67.0, 107.0, 150.0, 203.0, 345.0, 527.0, 785.0, 1141.0, 1668.0, 2545.0, 4005.0, 6092.0, 9300.0, 14585.0, 22278.0, 34087.0, 52027.0, 73683.0, 101061.0, 124619.0, 134528.0, 126330.0, 104474.0, 77069.0, 53934.0, 36077.0, 23594.0, 14882.0, 9703.0, 6365.0, 4206.0, 2772.0, 1756.0, 1108.0, 770.0, 520.0, 350.0, 250.0, 166.0, 95.0, 77.0, 53.0, 30.0, 30.0, 17.0, 7.0, 6.0, 5.0, 3.0, 4.0], "bins": [-6.8671875, -6.66845703125, -6.4697265625, -6.27099609375, -6.072265625, -5.87353515625, -5.6748046875, -5.47607421875, -5.27734375, -5.07861328125, -4.8798828125, -4.68115234375, -4.482421875, -4.28369140625, -4.0849609375, -3.88623046875, -3.6875, -3.48876953125, -3.2900390625, -3.09130859375, -2.892578125, -2.69384765625, -2.4951171875, -2.29638671875, -2.09765625, -1.89892578125, -1.7001953125, -1.50146484375, -1.302734375, -1.10400390625, -0.9052734375, -0.70654296875, -0.5078125, -0.30908203125, -0.1103515625, 0.08837890625, 0.287109375, 0.48583984375, 0.6845703125, 0.88330078125, 1.08203125, 1.28076171875, 1.4794921875, 1.67822265625, 1.876953125, 2.07568359375, 2.2744140625, 2.47314453125, 2.671875, 2.87060546875, 3.0693359375, 3.26806640625, 3.466796875, 3.66552734375, 3.8642578125, 4.06298828125, 4.26171875, 4.46044921875, 4.6591796875, 4.85791015625, 5.056640625, 5.25537109375, 5.4541015625, 5.65283203125, 5.8515625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 9.0, 10.0, 20.0, 15.0, 13.0, 28.0, 19.0, 17.0, 29.0, 39.0, 35.0, 43.0, 51.0, 43.0, 50.0, 58.0, 56.0, 45.0, 51.0, 44.0, 30.0, 36.0, 37.0, 28.0, 39.0, 24.0, 30.0, 19.0, 14.0, 14.0, 6.0, 13.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.796875, -6.593994140625, -6.39111328125, -6.188232421875, -5.9853515625, -5.782470703125, -5.57958984375, -5.376708984375, -5.173828125, -4.970947265625, -4.76806640625, -4.565185546875, -4.3623046875, -4.159423828125, -3.95654296875, -3.753662109375, -3.55078125, -3.347900390625, -3.14501953125, -2.942138671875, -2.7392578125, -2.536376953125, -2.33349609375, -2.130615234375, -1.927734375, -1.724853515625, -1.52197265625, -1.319091796875, -1.1162109375, -0.913330078125, -0.71044921875, -0.507568359375, -0.3046875, -0.101806640625, 0.10107421875, 0.303955078125, 0.5068359375, 0.709716796875, 0.91259765625, 1.115478515625, 1.318359375, 1.521240234375, 1.72412109375, 1.927001953125, 2.1298828125, 2.332763671875, 2.53564453125, 2.738525390625, 2.94140625, 3.144287109375, 3.34716796875, 3.550048828125, 3.7529296875, 3.955810546875, 4.15869140625, 4.361572265625, 4.564453125, 4.767333984375, 4.97021484375, 5.173095703125, 5.3759765625, 5.578857421875, 5.78173828125, 5.984619140625, 6.1875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 25.0, 21.0, 31.0, 50.0, 75.0, 146.0, 193.0, 332.0, 590.0, 1050.0, 1907.0, 3672.0, 7199.0, 15021.0, 31750.0, 68463.0, 138895.0, 223291.0, 237199.0, 160828.0, 82660.0, 38683.0, 18324.0, 8649.0, 4323.0, 2265.0, 1248.0, 694.0, 395.0, 222.0, 118.0, 79.0, 49.0, 31.0, 20.0, 13.0, 12.0, 6.0, 7.0, 4.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51953125, -6.3284912109375, -6.137451171875, -5.9464111328125, -5.75537109375, -5.5643310546875, -5.373291015625, -5.1822509765625, -4.9912109375, -4.8001708984375, -4.609130859375, -4.4180908203125, -4.22705078125, -4.0360107421875, -3.844970703125, -3.6539306640625, -3.462890625, -3.2718505859375, -3.080810546875, -2.8897705078125, -2.69873046875, -2.5076904296875, -2.316650390625, -2.1256103515625, -1.9345703125, -1.7435302734375, -1.552490234375, -1.3614501953125, -1.17041015625, -0.9793701171875, -0.788330078125, -0.5972900390625, -0.40625, -0.2152099609375, -0.024169921875, 0.1668701171875, 0.35791015625, 0.5489501953125, 0.739990234375, 0.9310302734375, 1.1220703125, 1.3131103515625, 1.504150390625, 1.6951904296875, 1.88623046875, 2.0772705078125, 2.268310546875, 2.4593505859375, 2.650390625, 2.8414306640625, 3.032470703125, 3.2235107421875, 3.41455078125, 3.6055908203125, 3.796630859375, 3.9876708984375, 4.1787109375, 4.3697509765625, 4.560791015625, 4.7518310546875, 4.94287109375, 5.1339111328125, 5.324951171875, 5.5159912109375, 5.70703125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 8.0, 12.0, 10.0, 1.0, 12.0, 25.0, 19.0, 29.0, 29.0, 50.0, 34.0, 61.0, 50.0, 60.0, 62.0, 61.0, 57.0, 55.0, 75.0, 48.0, 40.0, 37.0, 21.0, 23.0, 17.0, 29.0, 15.0, 10.0, 11.0, 7.0, 9.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040340423583984375, -0.00038981810212135315, -0.00037623196840286255, -0.00036264583468437195, -0.00034905970096588135, -0.00033547356724739075, -0.00032188743352890015, -0.00030830129981040955, -0.00029471516609191895, -0.00028112903237342834, -0.00026754289865493774, -0.00025395676493644714, -0.00024037063121795654, -0.00022678449749946594, -0.00021319836378097534, -0.00019961223006248474, -0.00018602609634399414, -0.00017243996262550354, -0.00015885382890701294, -0.00014526769518852234, -0.00013168156147003174, -0.00011809542775154114, -0.00010450929403305054, -9.092316031455994e-05, -7.733702659606934e-05, -6.375089287757874e-05, -5.0164759159088135e-05, -3.6578625440597534e-05, -2.2992491722106934e-05, -9.406358003616333e-06, 4.179775714874268e-06, 1.7765909433364868e-05, 3.135204315185547e-05, 4.493817687034607e-05, 5.852431058883667e-05, 7.211044430732727e-05, 8.569657802581787e-05, 9.928271174430847e-05, 0.00011286884546279907, 0.00012645497918128967, 0.00014004111289978027, 0.00015362724661827087, 0.00016721338033676147, 0.00018079951405525208, 0.00019438564777374268, 0.00020797178149223328, 0.00022155791521072388, 0.00023514404892921448, 0.0002487301826477051, 0.0002623163163661957, 0.0002759024500846863, 0.0002894885838031769, 0.0003030747175216675, 0.0003166608512401581, 0.0003302469849586487, 0.0003438331186771393, 0.0003574192523956299, 0.0003710053861141205, 0.0003845915198326111, 0.0003981776535511017, 0.0004117637872695923, 0.0004253499209880829, 0.0004389360547065735, 0.0004525221884250641, 0.0004661083221435547]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 17.0, 12.0, 26.0, 42.0, 57.0, 76.0, 106.0, 167.0, 237.0, 431.0, 647.0, 1005.0, 1615.0, 2609.0, 4452.0, 7948.0, 14307.0, 26158.0, 49573.0, 90812.0, 151517.0, 200993.0, 191521.0, 133835.0, 77548.0, 41684.0, 22322.0, 12130.0, 6715.0, 3830.0, 2277.0, 1437.0, 844.0, 531.0, 382.0, 258.0, 133.0, 95.0, 77.0, 38.0, 22.0, 22.0, 14.0, 12.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.83203125, -4.67022705078125, -4.5084228515625, -4.34661865234375, -4.184814453125, -4.02301025390625, -3.8612060546875, -3.69940185546875, -3.53759765625, -3.37579345703125, -3.2139892578125, -3.05218505859375, -2.890380859375, -2.72857666015625, -2.5667724609375, -2.40496826171875, -2.2431640625, -2.08135986328125, -1.9195556640625, -1.75775146484375, -1.595947265625, -1.43414306640625, -1.2723388671875, -1.11053466796875, -0.94873046875, -0.78692626953125, -0.6251220703125, -0.46331787109375, -0.301513671875, -0.13970947265625, 0.0220947265625, 0.18389892578125, 0.345703125, 0.50750732421875, 0.6693115234375, 0.83111572265625, 0.992919921875, 1.15472412109375, 1.3165283203125, 1.47833251953125, 1.64013671875, 1.80194091796875, 1.9637451171875, 2.12554931640625, 2.287353515625, 2.44915771484375, 2.6109619140625, 2.77276611328125, 2.9345703125, 3.09637451171875, 3.2581787109375, 3.41998291015625, 3.581787109375, 3.74359130859375, 3.9053955078125, 4.06719970703125, 4.22900390625, 4.39080810546875, 4.5526123046875, 4.71441650390625, 4.876220703125, 5.03802490234375, 5.1998291015625, 5.36163330078125, 5.5234375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 5.0, 12.0, 12.0, 15.0, 27.0, 45.0, 35.0, 53.0, 61.0, 62.0, 59.0, 66.0, 59.0, 69.0, 70.0, 63.0, 49.0, 42.0, 40.0, 34.0, 25.0, 16.0, 13.0, 14.0, 10.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34375, -1.296356201171875, -1.24896240234375, -1.201568603515625, -1.1541748046875, -1.106781005859375, -1.05938720703125, -1.011993408203125, -0.964599609375, -0.917205810546875, -0.86981201171875, -0.822418212890625, -0.7750244140625, -0.727630615234375, -0.68023681640625, -0.632843017578125, -0.58544921875, -0.538055419921875, -0.49066162109375, -0.443267822265625, -0.3958740234375, -0.348480224609375, -0.30108642578125, -0.253692626953125, -0.206298828125, -0.158905029296875, -0.11151123046875, -0.064117431640625, -0.0167236328125, 0.030670166015625, 0.07806396484375, 0.125457763671875, 0.1728515625, 0.220245361328125, 0.26763916015625, 0.315032958984375, 0.3624267578125, 0.409820556640625, 0.45721435546875, 0.504608154296875, 0.552001953125, 0.599395751953125, 0.64678955078125, 0.694183349609375, 0.7415771484375, 0.788970947265625, 0.83636474609375, 0.883758544921875, 0.93115234375, 0.978546142578125, 1.02593994140625, 1.073333740234375, 1.1207275390625, 1.168121337890625, 1.21551513671875, 1.262908935546875, 1.310302734375, 1.357696533203125, 1.40509033203125, 1.452484130859375, 1.4998779296875, 1.547271728515625, 1.59466552734375, 1.642059326171875, 1.689453125]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 6.0, 15.0, 11.0, 19.0, 29.0, 34.0, 42.0, 49.0, 51.0, 66.0, 62.0, 67.0, 72.0, 71.0, 62.0, 45.0, 47.0, 39.0, 32.0, 27.0, 34.0, 18.0, 12.0, 15.0, 11.0, 6.0, 4.0, 3.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.118241310119629, -12.634806632995605, -12.151372909545898, -11.667938232421875, -11.184503555297852, -10.701068878173828, -10.217634201049805, -9.734200477600098, -9.250765800476074, -8.76733112335205, -8.283897399902344, -7.80046272277832, -7.317028045654297, -6.833593368530273, -6.350159168243408, -5.866724967956543, -5.3832902908325195, -4.899855613708496, -4.416421413421631, -3.9329869747161865, -3.449552536010742, -2.966118097305298, -2.4826836585998535, -1.9992492198944092, -1.5158147811889648, -1.0323803424835205, -0.5489459037780762, -0.06551146507263184, 0.4179229736328125, 0.9013574123382568, 1.3847918510437012, 1.8682262897491455, 2.3516597747802734, 2.8350942134857178, 3.318528652191162, 3.8019630908966064, 4.285397529602051, 4.768832206726074, 5.2522664070129395, 5.735700607299805, 6.219135284423828, 6.702569961547852, 7.186004161834717, 7.669438362121582, 8.152873039245605, 8.636307716369629, 9.119741439819336, 9.60317611694336, 10.086610794067383, 10.570045471191406, 11.05348014831543, 11.536913871765137, 12.02034854888916, 12.503783226013184, 12.98721694946289, 13.470651626586914, 13.954086303710938, 14.437520980834961, 14.920955657958984, 15.404389381408691, 15.887824058532715, 16.371257781982422, 16.854692459106445, 17.33812713623047, 17.821561813354492]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 2.0, 5.0, 13.0, 10.0, 7.0, 13.0, 16.0, 12.0, 15.0, 21.0, 17.0, 30.0, 29.0, 21.0, 32.0, 31.0, 27.0, 26.0, 40.0, 43.0, 38.0, 47.0, 31.0, 47.0, 37.0, 29.0, 35.0, 28.0, 20.0, 24.0, 33.0, 29.0, 27.0, 19.0, 20.0, 23.0, 25.0, 16.0, 12.0, 7.0, 10.0, 8.0, 4.0, 8.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.252270698547363, -7.994381427764893, -7.736492156982422, -7.478602886199951, -7.2207136154174805, -6.96282434463501, -6.704935073852539, -6.447045803070068, -6.189156532287598, -5.931267261505127, -5.673377990722656, -5.4154887199401855, -5.157599449157715, -4.899710178375244, -4.641820907592773, -4.383931636810303, -4.126042366027832, -3.8681530952453613, -3.6102638244628906, -3.35237455368042, -3.094485282897949, -2.8365960121154785, -2.578706741333008, -2.320817470550537, -2.0629281997680664, -1.8050389289855957, -1.547149658203125, -1.2892603874206543, -1.0313711166381836, -0.7734818458557129, -0.5155925750732422, -0.2577033042907715, 0.000186920166015625, 0.25807619094848633, 0.515965461730957, 0.7738547325134277, 1.0317440032958984, 1.2896332740783691, 1.5475225448608398, 1.8054118156433105, 2.0633010864257812, 2.321190357208252, 2.5790796279907227, 2.8369688987731934, 3.094858169555664, 3.3527474403381348, 3.6106367111206055, 3.868525981903076, 4.126415252685547, 4.384304523468018, 4.642193794250488, 4.900083065032959, 5.15797233581543, 5.4158616065979, 5.673750877380371, 5.931640148162842, 6.1895294189453125, 6.447418689727783, 6.705307960510254, 6.963197231292725, 7.221086502075195, 7.478975772857666, 7.736865043640137, 7.994754314422607, 8.252643585205078]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 5.0, 15.0, 18.0, 29.0, 38.0, 53.0, 54.0, 71.0, 108.0, 171.0, 225.0, 291.0, 461.0, 670.0, 957.0, 1439.0, 2238.0, 3444.0, 5649.0, 9395.0, 17330.0, 34018.0, 74596.0, 181946.0, 474161.0, 1040454.0, 1215048.0, 670022.0, 262634.0, 101560.0, 44472.0, 21406.0, 11832.0, 6996.0, 4272.0, 2670.0, 1807.0, 1172.0, 812.0, 542.0, 366.0, 274.0, 172.0, 130.0, 73.0, 56.0, 44.0, 29.0, 18.0, 12.0, 11.0, 11.0, 1.0, 2.0, 1.0, 1.0], "bins": [-20.109375, -19.521240234375, -18.93310546875, -18.344970703125, -17.7568359375, -17.168701171875, -16.58056640625, -15.992431640625, -15.404296875, -14.816162109375, -14.22802734375, -13.639892578125, -13.0517578125, -12.463623046875, -11.87548828125, -11.287353515625, -10.69921875, -10.111083984375, -9.52294921875, -8.934814453125, -8.3466796875, -7.758544921875, -7.17041015625, -6.582275390625, -5.994140625, -5.406005859375, -4.81787109375, -4.229736328125, -3.6416015625, -3.053466796875, -2.46533203125, -1.877197265625, -1.2890625, -0.700927734375, -0.11279296875, 0.475341796875, 1.0634765625, 1.651611328125, 2.23974609375, 2.827880859375, 3.416015625, 4.004150390625, 4.59228515625, 5.180419921875, 5.7685546875, 6.356689453125, 6.94482421875, 7.532958984375, 8.12109375, 8.709228515625, 9.29736328125, 9.885498046875, 10.4736328125, 11.061767578125, 11.64990234375, 12.238037109375, 12.826171875, 13.414306640625, 14.00244140625, 14.590576171875, 15.1787109375, 15.766845703125, 16.35498046875, 16.943115234375, 17.53125]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 9.0, 7.0, 14.0, 10.0, 15.0, 14.0, 21.0, 23.0, 29.0, 32.0, 29.0, 31.0, 37.0, 38.0, 24.0, 41.0, 47.0, 51.0, 43.0, 38.0, 32.0, 31.0, 39.0, 49.0, 30.0, 32.0, 20.0, 31.0, 33.0, 24.0, 25.0, 20.0, 12.0, 9.0, 9.0, 10.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5625, -8.31329345703125, -8.0640869140625, -7.81488037109375, -7.565673828125, -7.31646728515625, -7.0672607421875, -6.81805419921875, -6.56884765625, -6.31964111328125, -6.0704345703125, -5.82122802734375, -5.572021484375, -5.32281494140625, -5.0736083984375, -4.82440185546875, -4.5751953125, -4.32598876953125, -4.0767822265625, -3.82757568359375, -3.578369140625, -3.32916259765625, -3.0799560546875, -2.83074951171875, -2.58154296875, -2.33233642578125, -2.0831298828125, -1.83392333984375, -1.584716796875, -1.33551025390625, -1.0863037109375, -0.83709716796875, -0.587890625, -0.33868408203125, -0.0894775390625, 0.15972900390625, 0.408935546875, 0.65814208984375, 0.9073486328125, 1.15655517578125, 1.40576171875, 1.65496826171875, 1.9041748046875, 2.15338134765625, 2.402587890625, 2.65179443359375, 2.9010009765625, 3.15020751953125, 3.3994140625, 3.64862060546875, 3.8978271484375, 4.14703369140625, 4.396240234375, 4.64544677734375, 4.8946533203125, 5.14385986328125, 5.39306640625, 5.64227294921875, 5.8914794921875, 6.14068603515625, 6.389892578125, 6.63909912109375, 6.8883056640625, 7.13751220703125, 7.38671875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 6.0, 7.0, 18.0, 24.0, 29.0, 47.0, 68.0, 111.0, 192.0, 307.0, 472.0, 837.0, 1437.0, 2535.0, 4242.0, 8010.0, 15069.0, 30941.0, 68509.0, 165720.0, 436001.0, 1023164.0, 1278235.0, 693838.0, 267722.0, 104799.0, 45880.0, 21604.0, 10842.0, 5864.0, 3281.0, 1829.0, 1036.0, 607.0, 373.0, 234.0, 156.0, 84.0, 61.0, 41.0, 19.0, 14.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.28125, -23.5283203125, -22.775390625, -22.0224609375, -21.26953125, -20.5166015625, -19.763671875, -19.0107421875, -18.2578125, -17.5048828125, -16.751953125, -15.9990234375, -15.24609375, -14.4931640625, -13.740234375, -12.9873046875, -12.234375, -11.4814453125, -10.728515625, -9.9755859375, -9.22265625, -8.4697265625, -7.716796875, -6.9638671875, -6.2109375, -5.4580078125, -4.705078125, -3.9521484375, -3.19921875, -2.4462890625, -1.693359375, -0.9404296875, -0.1875, 0.5654296875, 1.318359375, 2.0712890625, 2.82421875, 3.5771484375, 4.330078125, 5.0830078125, 5.8359375, 6.5888671875, 7.341796875, 8.0947265625, 8.84765625, 9.6005859375, 10.353515625, 11.1064453125, 11.859375, 12.6123046875, 13.365234375, 14.1181640625, 14.87109375, 15.6240234375, 16.376953125, 17.1298828125, 17.8828125, 18.6357421875, 19.388671875, 20.1416015625, 20.89453125, 21.6474609375, 22.400390625, 23.1533203125, 23.90625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 7.0, 12.0, 12.0, 15.0, 22.0, 29.0, 43.0, 40.0, 62.0, 78.0, 89.0, 102.0, 129.0, 156.0, 190.0, 236.0, 252.0, 281.0, 313.0, 297.0, 260.0, 244.0, 221.0, 184.0, 184.0, 122.0, 95.0, 80.0, 70.0, 57.0, 42.0, 38.0, 26.0, 21.0, 17.0, 18.0, 7.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.859375, -5.686767578125, -5.51416015625, -5.341552734375, -5.1689453125, -4.996337890625, -4.82373046875, -4.651123046875, -4.478515625, -4.305908203125, -4.13330078125, -3.960693359375, -3.7880859375, -3.615478515625, -3.44287109375, -3.270263671875, -3.09765625, -2.925048828125, -2.75244140625, -2.579833984375, -2.4072265625, -2.234619140625, -2.06201171875, -1.889404296875, -1.716796875, -1.544189453125, -1.37158203125, -1.198974609375, -1.0263671875, -0.853759765625, -0.68115234375, -0.508544921875, -0.3359375, -0.163330078125, 0.00927734375, 0.181884765625, 0.3544921875, 0.527099609375, 0.69970703125, 0.872314453125, 1.044921875, 1.217529296875, 1.39013671875, 1.562744140625, 1.7353515625, 1.907958984375, 2.08056640625, 2.253173828125, 2.42578125, 2.598388671875, 2.77099609375, 2.943603515625, 3.1162109375, 3.288818359375, 3.46142578125, 3.634033203125, 3.806640625, 3.979248046875, 4.15185546875, 4.324462890625, 4.4970703125, 4.669677734375, 4.84228515625, 5.014892578125, 5.1875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 3.0, 6.0, 10.0, 9.0, 17.0, 12.0, 17.0, 23.0, 40.0, 29.0, 43.0, 49.0, 47.0, 63.0, 73.0, 58.0, 68.0, 73.0, 62.0, 46.0, 56.0, 21.0, 33.0, 26.0, 16.0, 20.0, 18.0, 10.0, 9.0, 10.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-21.823322296142578, -21.2429256439209, -20.66252899169922, -20.08213233947754, -19.50173568725586, -18.92133903503418, -18.3409423828125, -17.76054573059082, -17.18014907836914, -16.59975242614746, -16.01935577392578, -15.438959121704102, -14.858562469482422, -14.278165817260742, -13.697769165039062, -13.117372512817383, -12.53697681427002, -11.95658016204834, -11.37618350982666, -10.79578685760498, -10.2153902053833, -9.634993553161621, -9.054597854614258, -8.474201202392578, -7.89380407333374, -7.3134074211120605, -6.733010768890381, -6.152614593505859, -5.57221794128418, -4.9918212890625, -4.41142463684082, -3.8310279846191406, -3.250631332397461, -2.6702346801757812, -2.0898380279541016, -1.509441614151001, -0.9290449619293213, -0.3486483097076416, 0.23174810409545898, 0.8121447563171387, 1.3925414085388184, 1.972938060760498, 2.5533347129821777, 3.1337311267852783, 3.714127779006958, 4.294524192810059, 4.874920845031738, 5.455317497253418, 6.035714149475098, 6.616110801696777, 7.196507453918457, 7.776904106140137, 8.357300758361816, 8.937697410583496, 9.51809310913086, 10.098489761352539, 10.678886413574219, 11.259283065795898, 11.839679718017578, 12.420076370239258, 13.000473022460938, 13.580869674682617, 14.161266326904297, 14.741662979125977, 15.322059631347656]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 5.0, 4.0, 5.0, 5.0, 8.0, 6.0, 10.0, 11.0, 10.0, 17.0, 18.0, 22.0, 21.0, 26.0, 18.0, 28.0, 26.0, 28.0, 23.0, 24.0, 25.0, 35.0, 43.0, 44.0, 37.0, 38.0, 36.0, 42.0, 32.0, 45.0, 33.0, 26.0, 29.0, 32.0, 40.0, 20.0, 20.0, 17.0, 11.0, 16.0, 16.0, 12.0, 9.0, 9.0, 7.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.544527053833008, -9.252277374267578, -8.960027694702148, -8.667778015136719, -8.375528335571289, -8.083277702331543, -7.791028022766113, -7.498778343200684, -7.206528663635254, -6.914278984069824, -6.6220293045043945, -6.329779148101807, -6.037529468536377, -5.745279788970947, -5.453029632568359, -5.16077995300293, -4.8685302734375, -4.57628059387207, -4.284030914306641, -3.9917807579040527, -3.699531078338623, -3.4072813987731934, -3.1150314807891846, -2.822781562805176, -2.530531883239746, -2.2382822036743164, -1.9460322856903076, -1.6537824869155884, -1.3615326881408691, -1.06928288936615, -0.7770330905914307, -0.4847831726074219, -0.19253253936767578, 0.09971725940704346, 0.3919670581817627, 0.6842168569564819, 0.9764666557312012, 1.2687164545059204, 1.5609662532806396, 1.8532161712646484, 2.145465850830078, 2.437715530395508, 2.7299654483795166, 3.0222153663635254, 3.314465045928955, 3.6067147254943848, 3.8989646434783936, 4.191214561462402, 4.483464241027832, 4.775713920593262, 5.067963600158691, 5.360213756561279, 5.652463436126709, 5.944713115692139, 6.236963272094727, 6.529212951660156, 6.821462631225586, 7.113712310791016, 7.405961990356445, 7.698212146759033, 7.990461826324463, 8.28271198272705, 8.57496166229248, 8.86721134185791, 9.15946102142334]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 10.0, 10.0, 12.0, 29.0, 40.0, 60.0, 88.0, 138.0, 178.0, 243.0, 401.0, 597.0, 912.0, 1385.0, 2170.0, 3391.0, 5123.0, 8321.0, 13289.0, 21004.0, 33787.0, 53293.0, 80650.0, 114548.0, 144007.0, 151825.0, 131105.0, 98671.0, 66650.0, 43067.0, 27612.0, 16978.0, 10487.0, 6511.0, 4127.0, 2791.0, 1656.0, 1123.0, 749.0, 500.0, 327.0, 236.0, 128.0, 121.0, 56.0, 51.0, 34.0, 13.0, 16.0, 16.0, 6.0, 6.0, 7.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-4.5625, -4.41656494140625, -4.2706298828125, -4.12469482421875, -3.978759765625, -3.83282470703125, -3.6868896484375, -3.54095458984375, -3.39501953125, -3.24908447265625, -3.1031494140625, -2.95721435546875, -2.811279296875, -2.66534423828125, -2.5194091796875, -2.37347412109375, -2.2275390625, -2.08160400390625, -1.9356689453125, -1.78973388671875, -1.643798828125, -1.49786376953125, -1.3519287109375, -1.20599365234375, -1.06005859375, -0.91412353515625, -0.7681884765625, -0.62225341796875, -0.476318359375, -0.33038330078125, -0.1844482421875, -0.03851318359375, 0.107421875, 0.25335693359375, 0.3992919921875, 0.54522705078125, 0.691162109375, 0.83709716796875, 0.9830322265625, 1.12896728515625, 1.27490234375, 1.42083740234375, 1.5667724609375, 1.71270751953125, 1.858642578125, 2.00457763671875, 2.1505126953125, 2.29644775390625, 2.4423828125, 2.58831787109375, 2.7342529296875, 2.88018798828125, 3.026123046875, 3.17205810546875, 3.3179931640625, 3.46392822265625, 3.60986328125, 3.75579833984375, 3.9017333984375, 4.04766845703125, 4.193603515625, 4.33953857421875, 4.4854736328125, 4.63140869140625, 4.77734375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 5.0, 5.0, 12.0, 11.0, 15.0, 13.0, 22.0, 18.0, 31.0, 27.0, 25.0, 29.0, 28.0, 33.0, 28.0, 39.0, 43.0, 42.0, 41.0, 45.0, 50.0, 33.0, 47.0, 33.0, 24.0, 40.0, 35.0, 25.0, 27.0, 26.0, 27.0, 19.0, 14.0, 16.0, 12.0, 10.0, 4.0, 10.0, 6.0, 8.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.703125, -10.359375, -10.015625, -9.671875, -9.328125, -8.984375, -8.640625, -8.296875, -7.953125, -7.609375, -7.265625, -6.921875, -6.578125, -6.234375, -5.890625, -5.546875, -5.203125, -4.859375, -4.515625, -4.171875, -3.828125, -3.484375, -3.140625, -2.796875, -2.453125, -2.109375, -1.765625, -1.421875, -1.078125, -0.734375, -0.390625, -0.046875, 0.296875, 0.640625, 0.984375, 1.328125, 1.671875, 2.015625, 2.359375, 2.703125, 3.046875, 3.390625, 3.734375, 4.078125, 4.421875, 4.765625, 5.109375, 5.453125, 5.796875, 6.140625, 6.484375, 6.828125, 7.171875, 7.515625, 7.859375, 8.203125, 8.546875, 8.890625, 9.234375, 9.578125, 9.921875, 10.265625, 10.609375, 10.953125, 11.296875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 4.0, 6.0, 12.0, 18.0, 21.0, 33.0, 45.0, 69.0, 76.0, 140.0, 200.0, 264.0, 433.0, 604.0, 981.0, 1423.0, 2194.0, 3418.0, 5632.0, 9102.0, 15163.0, 25778.0, 44972.0, 79186.0, 133407.0, 193336.0, 196838.0, 138453.0, 81851.0, 46632.0, 26742.0, 15693.0, 9502.0, 5873.0, 3600.0, 2311.0, 1445.0, 1037.0, 639.0, 467.0, 295.0, 200.0, 148.0, 86.0, 76.0, 41.0, 37.0, 27.0, 14.0, 14.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-6.49609375, -6.2994384765625, -6.102783203125, -5.9061279296875, -5.70947265625, -5.5128173828125, -5.316162109375, -5.1195068359375, -4.9228515625, -4.7261962890625, -4.529541015625, -4.3328857421875, -4.13623046875, -3.9395751953125, -3.742919921875, -3.5462646484375, -3.349609375, -3.1529541015625, -2.956298828125, -2.7596435546875, -2.56298828125, -2.3663330078125, -2.169677734375, -1.9730224609375, -1.7763671875, -1.5797119140625, -1.383056640625, -1.1864013671875, -0.98974609375, -0.7930908203125, -0.596435546875, -0.3997802734375, -0.203125, -0.0064697265625, 0.190185546875, 0.3868408203125, 0.58349609375, 0.7801513671875, 0.976806640625, 1.1734619140625, 1.3701171875, 1.5667724609375, 1.763427734375, 1.9600830078125, 2.15673828125, 2.3533935546875, 2.550048828125, 2.7467041015625, 2.943359375, 3.1400146484375, 3.336669921875, 3.5333251953125, 3.72998046875, 3.9266357421875, 4.123291015625, 4.3199462890625, 4.5166015625, 4.7132568359375, 4.909912109375, 5.1065673828125, 5.30322265625, 5.4998779296875, 5.696533203125, 5.8931884765625, 6.08984375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 9.0, 14.0, 11.0, 18.0, 20.0, 20.0, 23.0, 21.0, 21.0, 28.0, 36.0, 31.0, 29.0, 40.0, 45.0, 32.0, 31.0, 35.0, 39.0, 32.0, 35.0, 27.0, 35.0, 41.0, 37.0, 25.0, 36.0, 23.0, 24.0, 28.0, 25.0, 26.0, 12.0, 12.0, 10.0, 12.0, 8.0, 11.0, 5.0, 3.0, 4.0, 5.0, 5.0, 0.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8984375, -5.71002197265625, -5.5216064453125, -5.33319091796875, -5.144775390625, -4.95635986328125, -4.7679443359375, -4.57952880859375, -4.39111328125, -4.20269775390625, -4.0142822265625, -3.82586669921875, -3.637451171875, -3.44903564453125, -3.2606201171875, -3.07220458984375, -2.8837890625, -2.69537353515625, -2.5069580078125, -2.31854248046875, -2.130126953125, -1.94171142578125, -1.7532958984375, -1.56488037109375, -1.37646484375, -1.18804931640625, -0.9996337890625, -0.81121826171875, -0.622802734375, -0.43438720703125, -0.2459716796875, -0.05755615234375, 0.130859375, 0.31927490234375, 0.5076904296875, 0.69610595703125, 0.884521484375, 1.07293701171875, 1.2613525390625, 1.44976806640625, 1.63818359375, 1.82659912109375, 2.0150146484375, 2.20343017578125, 2.391845703125, 2.58026123046875, 2.7686767578125, 2.95709228515625, 3.1455078125, 3.33392333984375, 3.5223388671875, 3.71075439453125, 3.899169921875, 4.08758544921875, 4.2760009765625, 4.46441650390625, 4.65283203125, 4.84124755859375, 5.0296630859375, 5.21807861328125, 5.406494140625, 5.59490966796875, 5.7833251953125, 5.97174072265625, 6.16015625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 7.0, 6.0, 7.0, 4.0, 19.0, 19.0, 31.0, 44.0, 42.0, 101.0, 121.0, 164.0, 248.0, 334.0, 516.0, 734.0, 1112.0, 1656.0, 2536.0, 3851.0, 5913.0, 9762.0, 15977.0, 27028.0, 47516.0, 83835.0, 146839.0, 214292.0, 195513.0, 122614.0, 69070.0, 39075.0, 22508.0, 13808.0, 8186.0, 5152.0, 3308.0, 2123.0, 1461.0, 987.0, 635.0, 439.0, 268.0, 208.0, 150.0, 108.0, 71.0, 45.0, 39.0, 24.0, 17.0, 20.0, 7.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.072265625, -2.972625732421875, -2.87298583984375, -2.773345947265625, -2.6737060546875, -2.574066162109375, -2.47442626953125, -2.374786376953125, -2.275146484375, -2.175506591796875, -2.07586669921875, -1.976226806640625, -1.8765869140625, -1.776947021484375, -1.67730712890625, -1.577667236328125, -1.47802734375, -1.378387451171875, -1.27874755859375, -1.179107666015625, -1.0794677734375, -0.979827880859375, -0.88018798828125, -0.780548095703125, -0.680908203125, -0.581268310546875, -0.48162841796875, -0.381988525390625, -0.2823486328125, -0.182708740234375, -0.08306884765625, 0.016571044921875, 0.1162109375, 0.215850830078125, 0.31549072265625, 0.415130615234375, 0.5147705078125, 0.614410400390625, 0.71405029296875, 0.813690185546875, 0.913330078125, 1.012969970703125, 1.11260986328125, 1.212249755859375, 1.3118896484375, 1.411529541015625, 1.51116943359375, 1.610809326171875, 1.71044921875, 1.810089111328125, 1.90972900390625, 2.009368896484375, 2.1090087890625, 2.208648681640625, 2.30828857421875, 2.407928466796875, 2.507568359375, 2.607208251953125, 2.70684814453125, 2.806488037109375, 2.9061279296875, 3.005767822265625, 3.10540771484375, 3.205047607421875, 3.3046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 5.0, 4.0, 5.0, 13.0, 11.0, 15.0, 18.0, 30.0, 49.0, 53.0, 57.0, 77.0, 63.0, 92.0, 76.0, 77.0, 59.0, 46.0, 62.0, 27.0, 30.0, 27.0, 17.0, 14.0, 15.0, 12.0, 11.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023162364959716797, -0.00022459588944911957, -0.00021756812930107117, -0.00021054036915302277, -0.00020351260900497437, -0.00019648484885692596, -0.00018945708870887756, -0.00018242932856082916, -0.00017540156841278076, -0.00016837380826473236, -0.00016134604811668396, -0.00015431828796863556, -0.00014729052782058716, -0.00014026276767253876, -0.00013323500752449036, -0.00012620724737644196, -0.00011917948722839355, -0.00011215172708034515, -0.00010512396693229675, -9.809620678424835e-05, -9.106844663619995e-05, -8.404068648815155e-05, -7.701292634010315e-05, -6.998516619205475e-05, -6.295740604400635e-05, -5.592964589595795e-05, -4.8901885747909546e-05, -4.1874125599861145e-05, -3.4846365451812744e-05, -2.7818605303764343e-05, -2.0790845155715942e-05, -1.3763085007667542e-05, -6.735324859619141e-06, 2.9243528842926025e-07, 7.320195436477661e-06, 1.4347955584526062e-05, 2.1375715732574463e-05, 2.8403475880622864e-05, 3.5431236028671265e-05, 4.2458996176719666e-05, 4.9486756324768066e-05, 5.651451647281647e-05, 6.354227662086487e-05, 7.057003676891327e-05, 7.759779691696167e-05, 8.462555706501007e-05, 9.165331721305847e-05, 9.868107736110687e-05, 0.00010570883750915527, 0.00011273659765720367, 0.00011976435780525208, 0.00012679211795330048, 0.00013381987810134888, 0.00014084763824939728, 0.00014787539839744568, 0.00015490315854549408, 0.00016193091869354248, 0.00016895867884159088, 0.00017598643898963928, 0.00018301419913768768, 0.00019004195928573608, 0.00019706971943378448, 0.00020409747958183289, 0.0002111252397298813, 0.0002181529998779297]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 10.0, 7.0, 14.0, 20.0, 33.0, 59.0, 86.0, 129.0, 216.0, 327.0, 556.0, 937.0, 1577.0, 2860.0, 5049.0, 8943.0, 16995.0, 32888.0, 65403.0, 129592.0, 219790.0, 239460.0, 156938.0, 80926.0, 40414.0, 20580.0, 10817.0, 5812.0, 3226.0, 1980.0, 1098.0, 687.0, 425.0, 244.0, 161.0, 104.0, 68.0, 37.0, 28.0, 22.0, 14.0, 8.0, 9.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.26641845703125, -4.1148681640625, -3.96331787109375, -3.811767578125, -3.66021728515625, -3.5086669921875, -3.35711669921875, -3.20556640625, -3.05401611328125, -2.9024658203125, -2.75091552734375, -2.599365234375, -2.44781494140625, -2.2962646484375, -2.14471435546875, -1.9931640625, -1.84161376953125, -1.6900634765625, -1.53851318359375, -1.386962890625, -1.23541259765625, -1.0838623046875, -0.93231201171875, -0.78076171875, -0.62921142578125, -0.4776611328125, -0.32611083984375, -0.174560546875, -0.02301025390625, 0.1285400390625, 0.28009033203125, 0.431640625, 0.58319091796875, 0.7347412109375, 0.88629150390625, 1.037841796875, 1.18939208984375, 1.3409423828125, 1.49249267578125, 1.64404296875, 1.79559326171875, 1.9471435546875, 2.09869384765625, 2.250244140625, 2.40179443359375, 2.5533447265625, 2.70489501953125, 2.8564453125, 3.00799560546875, 3.1595458984375, 3.31109619140625, 3.462646484375, 3.61419677734375, 3.7657470703125, 3.91729736328125, 4.06884765625, 4.22039794921875, 4.3719482421875, 4.52349853515625, 4.675048828125, 4.82659912109375, 4.9781494140625, 5.12969970703125, 5.28125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 7.0, 5.0, 7.0, 8.0, 8.0, 11.0, 22.0, 18.0, 15.0, 21.0, 34.0, 32.0, 44.0, 36.0, 42.0, 42.0, 31.0, 39.0, 45.0, 43.0, 50.0, 48.0, 34.0, 42.0, 31.0, 37.0, 31.0, 21.0, 34.0, 18.0, 24.0, 23.0, 9.0, 11.0, 7.0, 8.0, 8.0, 12.0, 7.0, 5.0, 2.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.7216796875, -0.6961517333984375, -0.670623779296875, -0.6450958251953125, -0.61956787109375, -0.5940399169921875, -0.568511962890625, -0.5429840087890625, -0.5174560546875, -0.4919281005859375, -0.466400146484375, -0.4408721923828125, -0.41534423828125, -0.3898162841796875, -0.364288330078125, -0.3387603759765625, -0.313232421875, -0.2877044677734375, -0.262176513671875, -0.2366485595703125, -0.21112060546875, -0.1855926513671875, -0.160064697265625, -0.1345367431640625, -0.1090087890625, -0.0834808349609375, -0.057952880859375, -0.0324249267578125, -0.00689697265625, 0.0186309814453125, 0.044158935546875, 0.0696868896484375, 0.09521484375, 0.1207427978515625, 0.146270751953125, 0.1717987060546875, 0.19732666015625, 0.2228546142578125, 0.248382568359375, 0.2739105224609375, 0.2994384765625, 0.3249664306640625, 0.350494384765625, 0.3760223388671875, 0.40155029296875, 0.4270782470703125, 0.452606201171875, 0.4781341552734375, 0.503662109375, 0.5291900634765625, 0.554718017578125, 0.5802459716796875, 0.60577392578125, 0.6313018798828125, 0.656829833984375, 0.6823577880859375, 0.7078857421875, 0.7334136962890625, 0.758941650390625, 0.7844696044921875, 0.80999755859375, 0.8355255126953125, 0.861053466796875, 0.8865814208984375, 0.912109375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 5.0, 6.0, 3.0, 12.0, 12.0, 12.0, 8.0, 10.0, 16.0, 40.0, 32.0, 42.0, 36.0, 61.0, 51.0, 65.0, 62.0, 61.0, 79.0, 75.0, 43.0, 49.0, 43.0, 28.0, 26.0, 24.0, 19.0, 20.0, 20.0, 9.0, 6.0, 7.0, 8.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-21.74443244934082, -21.160507202148438, -20.576580047607422, -19.99265480041504, -19.408729553222656, -18.82480239868164, -18.240877151489258, -17.656951904296875, -17.07302474975586, -16.489099502563477, -15.905172348022461, -15.321247100830078, -14.737320899963379, -14.15339469909668, -13.569469451904297, -12.985543251037598, -12.401617050170898, -11.8176908493042, -11.2337646484375, -10.649839401245117, -10.065913200378418, -9.481986999511719, -8.898061752319336, -8.314135551452637, -7.7302093505859375, -7.146283149719238, -6.562357425689697, -5.978431701660156, -5.394505500793457, -4.810579299926758, -4.226653575897217, -3.642727851867676, -3.0587997436523438, -2.4748737812042236, -1.8909478187561035, -1.3070218563079834, -0.7230958938598633, -0.13916993141174316, 0.44475603103637695, 1.028681755065918, 1.6126079559326172, 2.1965339183807373, 2.7804598808288574, 3.3643858432769775, 3.9483118057250977, 4.532238006591797, 5.116163730621338, 5.700089454650879, 6.284015655517578, 6.867941856384277, 7.451867580413818, 8.03579330444336, 8.619719505310059, 9.203645706176758, 9.78757095336914, 10.37149715423584, 10.955423355102539, 11.539349555969238, 12.123275756835938, 12.70720100402832, 13.29112720489502, 13.875053405761719, 14.458978652954102, 15.0429048538208, 15.6268310546875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 6.0, 6.0, 4.0, 5.0, 4.0, 10.0, 11.0, 11.0, 11.0, 15.0, 13.0, 26.0, 20.0, 24.0, 20.0, 20.0, 27.0, 34.0, 27.0, 19.0, 31.0, 39.0, 36.0, 33.0, 44.0, 34.0, 38.0, 45.0, 36.0, 40.0, 33.0, 31.0, 26.0, 29.0, 32.0, 24.0, 25.0, 14.0, 17.0, 14.0, 14.0, 17.0, 9.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.4180908203125, -9.128936767578125, -8.839781761169434, -8.550627708435059, -8.261472702026367, -7.972318649291992, -7.683164119720459, -7.394009590148926, -7.104855060577393, -6.815700531005859, -6.526546001434326, -6.237391471862793, -5.948237419128418, -5.659082412719727, -5.369928359985352, -5.080773830413818, -4.791619300842285, -4.502464771270752, -4.213310241699219, -3.9241559505462646, -3.6350014209747314, -3.3458468914031982, -3.056692600250244, -2.767538070678711, -2.4783835411071777, -2.1892290115356445, -1.9000746011734009, -1.6109201908111572, -1.321765661239624, -1.0326111316680908, -0.7434567213058472, -0.4543023109436035, -0.16514873504638672, 0.12400573492050171, 0.41316020488739014, 0.7023146748542786, 0.991469144821167, 1.2806236743927002, 1.5697780847549438, 1.8589324951171875, 2.1480870246887207, 2.437241554260254, 2.726396083831787, 3.015550374984741, 3.3047049045562744, 3.5938594341278076, 3.8830137252807617, 4.172168254852295, 4.461322784423828, 4.750477313995361, 5.0396318435668945, 5.328786373138428, 5.617940902709961, 5.907094955444336, 6.196249485015869, 6.485404014587402, 6.7745585441589355, 7.063713073730469, 7.352867603302002, 7.642022132873535, 7.93117618560791, 8.220331192016602, 8.509485244750977, 8.798639297485352, 9.087794303894043]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 7.0, 10.0, 20.0, 15.0, 24.0, 39.0, 59.0, 107.0, 132.0, 222.0, 316.0, 492.0, 731.0, 1111.0, 1627.0, 2589.0, 3845.0, 6070.0, 9146.0, 14523.0, 22195.0, 34412.0, 52319.0, 75577.0, 102914.0, 126312.0, 135792.0, 126188.0, 103888.0, 76421.0, 52480.0, 34736.0, 22575.0, 14698.0, 9358.0, 6018.0, 3968.0, 2592.0, 1653.0, 1091.0, 781.0, 511.0, 332.0, 197.0, 167.0, 100.0, 55.0, 42.0, 26.0, 25.0, 18.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0], "bins": [-7.3046875, -7.08001708984375, -6.8553466796875, -6.63067626953125, -6.406005859375, -6.18133544921875, -5.9566650390625, -5.73199462890625, -5.50732421875, -5.28265380859375, -5.0579833984375, -4.83331298828125, -4.608642578125, -4.38397216796875, -4.1593017578125, -3.93463134765625, -3.7099609375, -3.48529052734375, -3.2606201171875, -3.03594970703125, -2.811279296875, -2.58660888671875, -2.3619384765625, -2.13726806640625, -1.91259765625, -1.68792724609375, -1.4632568359375, -1.23858642578125, -1.013916015625, -0.78924560546875, -0.5645751953125, -0.33990478515625, -0.115234375, 0.10943603515625, 0.3341064453125, 0.55877685546875, 0.783447265625, 1.00811767578125, 1.2327880859375, 1.45745849609375, 1.68212890625, 1.90679931640625, 2.1314697265625, 2.35614013671875, 2.580810546875, 2.80548095703125, 3.0301513671875, 3.25482177734375, 3.4794921875, 3.70416259765625, 3.9288330078125, 4.15350341796875, 4.378173828125, 4.60284423828125, 4.8275146484375, 5.05218505859375, 5.27685546875, 5.50152587890625, 5.7261962890625, 5.95086669921875, 6.175537109375, 6.40020751953125, 6.6248779296875, 6.84954833984375, 7.07421875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 5.0, 6.0, 11.0, 10.0, 11.0, 12.0, 13.0, 16.0, 20.0, 22.0, 25.0, 23.0, 24.0, 29.0, 24.0, 28.0, 34.0, 38.0, 38.0, 39.0, 39.0, 32.0, 36.0, 34.0, 51.0, 27.0, 46.0, 30.0, 31.0, 33.0, 28.0, 28.0, 25.0, 20.0, 13.0, 17.0, 13.0, 10.0, 11.0, 13.0, 8.0, 8.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.640625, -10.3143310546875, -9.988037109375, -9.6617431640625, -9.33544921875, -9.0091552734375, -8.682861328125, -8.3565673828125, -8.0302734375, -7.7039794921875, -7.377685546875, -7.0513916015625, -6.72509765625, -6.3988037109375, -6.072509765625, -5.7462158203125, -5.419921875, -5.0936279296875, -4.767333984375, -4.4410400390625, -4.11474609375, -3.7884521484375, -3.462158203125, -3.1358642578125, -2.8095703125, -2.4832763671875, -2.156982421875, -1.8306884765625, -1.50439453125, -1.1781005859375, -0.851806640625, -0.5255126953125, -0.19921875, 0.1270751953125, 0.453369140625, 0.7796630859375, 1.10595703125, 1.4322509765625, 1.758544921875, 2.0848388671875, 2.4111328125, 2.7374267578125, 3.063720703125, 3.3900146484375, 3.71630859375, 4.0426025390625, 4.368896484375, 4.6951904296875, 5.021484375, 5.3477783203125, 5.674072265625, 6.0003662109375, 6.32666015625, 6.6529541015625, 6.979248046875, 7.3055419921875, 7.6318359375, 7.9581298828125, 8.284423828125, 8.6107177734375, 8.93701171875, 9.2633056640625, 9.589599609375, 9.9158935546875, 10.2421875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 9.0, 14.0, 19.0, 35.0, 52.0, 81.0, 136.0, 208.0, 343.0, 563.0, 909.0, 1552.0, 2496.0, 4200.0, 6919.0, 11430.0, 18986.0, 30039.0, 47891.0, 71701.0, 101440.0, 130042.0, 144221.0, 136666.0, 111622.0, 81290.0, 54347.0, 35030.0, 21905.0, 13464.0, 8315.0, 4871.0, 3020.0, 1883.0, 1073.0, 668.0, 441.0, 269.0, 139.0, 101.0, 57.0, 41.0, 25.0, 17.0, 10.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8828125, -7.625732421875, -7.36865234375, -7.111572265625, -6.8544921875, -6.597412109375, -6.34033203125, -6.083251953125, -5.826171875, -5.569091796875, -5.31201171875, -5.054931640625, -4.7978515625, -4.540771484375, -4.28369140625, -4.026611328125, -3.76953125, -3.512451171875, -3.25537109375, -2.998291015625, -2.7412109375, -2.484130859375, -2.22705078125, -1.969970703125, -1.712890625, -1.455810546875, -1.19873046875, -0.941650390625, -0.6845703125, -0.427490234375, -0.17041015625, 0.086669921875, 0.34375, 0.600830078125, 0.85791015625, 1.114990234375, 1.3720703125, 1.629150390625, 1.88623046875, 2.143310546875, 2.400390625, 2.657470703125, 2.91455078125, 3.171630859375, 3.4287109375, 3.685791015625, 3.94287109375, 4.199951171875, 4.45703125, 4.714111328125, 4.97119140625, 5.228271484375, 5.4853515625, 5.742431640625, 5.99951171875, 6.256591796875, 6.513671875, 6.770751953125, 7.02783203125, 7.284912109375, 7.5419921875, 7.799072265625, 8.05615234375, 8.313232421875, 8.5703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 8.0, 11.0, 12.0, 10.0, 18.0, 13.0, 18.0, 22.0, 18.0, 32.0, 19.0, 28.0, 31.0, 42.0, 37.0, 42.0, 48.0, 31.0, 41.0, 44.0, 41.0, 34.0, 49.0, 32.0, 35.0, 31.0, 23.0, 27.0, 26.0, 25.0, 21.0, 15.0, 18.0, 18.0, 15.0, 16.0, 13.0, 4.0, 7.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.55078125, -6.3321533203125, -6.113525390625, -5.8948974609375, -5.67626953125, -5.4576416015625, -5.239013671875, -5.0203857421875, -4.8017578125, -4.5831298828125, -4.364501953125, -4.1458740234375, -3.92724609375, -3.7086181640625, -3.489990234375, -3.2713623046875, -3.052734375, -2.8341064453125, -2.615478515625, -2.3968505859375, -2.17822265625, -1.9595947265625, -1.740966796875, -1.5223388671875, -1.3037109375, -1.0850830078125, -0.866455078125, -0.6478271484375, -0.42919921875, -0.2105712890625, 0.008056640625, 0.2266845703125, 0.4453125, 0.6639404296875, 0.882568359375, 1.1011962890625, 1.31982421875, 1.5384521484375, 1.757080078125, 1.9757080078125, 2.1943359375, 2.4129638671875, 2.631591796875, 2.8502197265625, 3.06884765625, 3.2874755859375, 3.506103515625, 3.7247314453125, 3.943359375, 4.1619873046875, 4.380615234375, 4.5992431640625, 4.81787109375, 5.0364990234375, 5.255126953125, 5.4737548828125, 5.6923828125, 5.9110107421875, 6.129638671875, 6.3482666015625, 6.56689453125, 6.7855224609375, 7.004150390625, 7.2227783203125, 7.44140625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 10.0, 23.0, 15.0, 19.0, 48.0, 55.0, 65.0, 105.0, 176.0, 253.0, 363.0, 550.0, 801.0, 1236.0, 1814.0, 2775.0, 4121.0, 6431.0, 9965.0, 15581.0, 24470.0, 37525.0, 56805.0, 81659.0, 110301.0, 132815.0, 138728.0, 123439.0, 97380.0, 68928.0, 46568.0, 30613.0, 19531.0, 12202.0, 8022.0, 5117.0, 3372.0, 2234.0, 1476.0, 934.0, 648.0, 469.0, 311.0, 203.0, 117.0, 95.0, 59.0, 43.0, 36.0, 17.0, 13.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0], "bins": [-4.015625, -3.894866943359375, -3.77410888671875, -3.653350830078125, -3.5325927734375, -3.411834716796875, -3.29107666015625, -3.170318603515625, -3.049560546875, -2.928802490234375, -2.80804443359375, -2.687286376953125, -2.5665283203125, -2.445770263671875, -2.32501220703125, -2.204254150390625, -2.08349609375, -1.962738037109375, -1.84197998046875, -1.721221923828125, -1.6004638671875, -1.479705810546875, -1.35894775390625, -1.238189697265625, -1.117431640625, -0.996673583984375, -0.87591552734375, -0.755157470703125, -0.6343994140625, -0.513641357421875, -0.39288330078125, -0.272125244140625, -0.1513671875, -0.030609130859375, 0.09014892578125, 0.210906982421875, 0.3316650390625, 0.452423095703125, 0.57318115234375, 0.693939208984375, 0.814697265625, 0.935455322265625, 1.05621337890625, 1.176971435546875, 1.2977294921875, 1.418487548828125, 1.53924560546875, 1.660003662109375, 1.78076171875, 1.901519775390625, 2.02227783203125, 2.143035888671875, 2.2637939453125, 2.384552001953125, 2.50531005859375, 2.626068115234375, 2.746826171875, 2.867584228515625, 2.98834228515625, 3.109100341796875, 3.2298583984375, 3.350616455078125, 3.47137451171875, 3.592132568359375, 3.712890625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 9.0, 8.0, 10.0, 16.0, 14.0, 20.0, 29.0, 24.0, 25.0, 40.0, 64.0, 64.0, 62.0, 64.0, 55.0, 55.0, 61.0, 56.0, 40.0, 40.0, 40.0, 29.0, 26.0, 28.0, 28.0, 14.0, 17.0, 10.0, 11.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044417381286621094, -0.0004293955862522125, -0.0004146173596382141, -0.0003998391330242157, -0.0003850609064102173, -0.00037028267979621887, -0.00035550445318222046, -0.00034072622656822205, -0.00032594799995422363, -0.0003111697733402252, -0.0002963915467262268, -0.0002816133201122284, -0.00026683509349823, -0.00025205686688423157, -0.00023727864027023315, -0.00022250041365623474, -0.00020772218704223633, -0.00019294396042823792, -0.0001781657338142395, -0.0001633875072002411, -0.00014860928058624268, -0.00013383105397224426, -0.00011905282735824585, -0.00010427460074424744, -8.949637413024902e-05, -7.471814751625061e-05, -5.99399209022522e-05, -4.5161694288253784e-05, -3.038346767425537e-05, -1.5605241060256958e-05, -8.270144462585449e-07, 1.3951212167739868e-05, 2.872943878173828e-05, 4.3507665395736694e-05, 5.828589200973511e-05, 7.306411862373352e-05, 8.784234523773193e-05, 0.00010262057185173035, 0.00011739879846572876, 0.00013217702507972717, 0.00014695525169372559, 0.000161733478307724, 0.0001765117049217224, 0.00019128993153572083, 0.00020606815814971924, 0.00022084638476371765, 0.00023562461137771606, 0.0002504028379917145, 0.0002651810646057129, 0.0002799592912197113, 0.0002947375178337097, 0.00030951574444770813, 0.00032429397106170654, 0.00033907219767570496, 0.00035385042428970337, 0.0003686286509037018, 0.0003834068775177002, 0.0003981851041316986, 0.000412963330745697, 0.00042774155735969543, 0.00044251978397369385, 0.00045729801058769226, 0.0004720762372016907, 0.0004868544638156891, 0.0005016326904296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 14.0, 22.0, 25.0, 42.0, 81.0, 121.0, 194.0, 285.0, 415.0, 673.0, 1024.0, 1704.0, 2648.0, 4267.0, 7200.0, 11879.0, 19626.0, 33703.0, 57155.0, 93053.0, 137695.0, 171923.0, 166631.0, 128869.0, 83975.0, 50570.0, 29787.0, 17515.0, 10362.0, 6361.0, 3957.0, 2448.0, 1578.0, 983.0, 647.0, 380.0, 263.0, 156.0, 115.0, 70.0, 49.0, 27.0, 24.0, 10.0, 5.0, 9.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.109375, -4.94915771484375, -4.7889404296875, -4.62872314453125, -4.468505859375, -4.30828857421875, -4.1480712890625, -3.98785400390625, -3.82763671875, -3.66741943359375, -3.5072021484375, -3.34698486328125, -3.186767578125, -3.02655029296875, -2.8663330078125, -2.70611572265625, -2.5458984375, -2.38568115234375, -2.2254638671875, -2.06524658203125, -1.905029296875, -1.74481201171875, -1.5845947265625, -1.42437744140625, -1.26416015625, -1.10394287109375, -0.9437255859375, -0.78350830078125, -0.623291015625, -0.46307373046875, -0.3028564453125, -0.14263916015625, 0.017578125, 0.17779541015625, 0.3380126953125, 0.49822998046875, 0.658447265625, 0.81866455078125, 0.9788818359375, 1.13909912109375, 1.29931640625, 1.45953369140625, 1.6197509765625, 1.77996826171875, 1.940185546875, 2.10040283203125, 2.2606201171875, 2.42083740234375, 2.5810546875, 2.74127197265625, 2.9014892578125, 3.06170654296875, 3.221923828125, 3.38214111328125, 3.5423583984375, 3.70257568359375, 3.86279296875, 4.02301025390625, 4.1832275390625, 4.34344482421875, 4.503662109375, 4.66387939453125, 4.8240966796875, 4.98431396484375, 5.14453125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 2.0, 7.0, 8.0, 13.0, 12.0, 25.0, 35.0, 24.0, 45.0, 37.0, 48.0, 36.0, 48.0, 51.0, 49.0, 53.0, 64.0, 58.0, 59.0, 53.0, 43.0, 41.0, 38.0, 31.0, 30.0, 22.0, 9.0, 11.0, 4.0, 7.0, 8.0, 5.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3818359375, -1.3379058837890625, -1.293975830078125, -1.2500457763671875, -1.20611572265625, -1.1621856689453125, -1.118255615234375, -1.0743255615234375, -1.0303955078125, -0.9864654541015625, -0.942535400390625, -0.8986053466796875, -0.85467529296875, -0.8107452392578125, -0.766815185546875, -0.7228851318359375, -0.678955078125, -0.6350250244140625, -0.591094970703125, -0.5471649169921875, -0.50323486328125, -0.4593048095703125, -0.415374755859375, -0.3714447021484375, -0.3275146484375, -0.2835845947265625, -0.239654541015625, -0.1957244873046875, -0.15179443359375, -0.1078643798828125, -0.063934326171875, -0.0200042724609375, 0.02392578125, 0.0678558349609375, 0.111785888671875, 0.1557159423828125, 0.19964599609375, 0.2435760498046875, 0.287506103515625, 0.3314361572265625, 0.3753662109375, 0.4192962646484375, 0.463226318359375, 0.5071563720703125, 0.55108642578125, 0.5950164794921875, 0.638946533203125, 0.6828765869140625, 0.726806640625, 0.7707366943359375, 0.814666748046875, 0.8585968017578125, 0.90252685546875, 0.9464569091796875, 0.990386962890625, 1.0343170166015625, 1.0782470703125, 1.1221771240234375, 1.166107177734375, 1.2100372314453125, 1.25396728515625, 1.2978973388671875, 1.341827392578125, 1.3857574462890625, 1.4296875]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 11.0, 9.0, 10.0, 14.0, 17.0, 9.0, 22.0, 33.0, 29.0, 49.0, 47.0, 61.0, 51.0, 52.0, 64.0, 66.0, 75.0, 59.0, 56.0, 37.0, 39.0, 28.0, 22.0, 28.0, 20.0, 22.0, 8.0, 15.0, 7.0, 6.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.807313919067383, -19.240148544311523, -18.672983169555664, -18.105819702148438, -17.538654327392578, -16.97148895263672, -16.40432357788086, -15.837158203125, -15.269993782043457, -14.702828407287598, -14.135663986206055, -13.568498611450195, -13.001333236694336, -12.434168815612793, -11.867003440856934, -11.29983901977539, -10.732673645019531, -10.165508270263672, -9.598343849182129, -9.03117847442627, -8.464014053344727, -7.896848678588867, -7.329683303833008, -6.762518405914307, -6.1953535079956055, -5.628188610076904, -5.061023712158203, -4.493858337402344, -3.9266934394836426, -3.3595285415649414, -2.792363405227661, -2.225198268890381, -1.6580314636230469, -1.0908664464950562, -0.5237014293670654, 0.04346358776092529, 0.610628604888916, 1.1777935028076172, 1.7449586391448975, 2.3121237754821777, 2.879288673400879, 3.44645357131958, 4.013618469238281, 4.580783843994141, 5.147948741912842, 5.715113639831543, 6.282279014587402, 6.8494439125061035, 7.416608810424805, 7.983773708343506, 8.550938606262207, 9.118103981018066, 9.68526840209961, 10.252433776855469, 10.819599151611328, 11.386764526367188, 11.95392894744873, 12.52109432220459, 13.088258743286133, 13.655424118041992, 14.222589492797852, 14.789753913879395, 15.356919288635254, 15.924083709716797, 16.491249084472656]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 7.0, 3.0, 9.0, 9.0, 12.0, 5.0, 15.0, 13.0, 22.0, 19.0, 27.0, 29.0, 24.0, 24.0, 22.0, 31.0, 41.0, 37.0, 42.0, 48.0, 37.0, 41.0, 36.0, 36.0, 41.0, 41.0, 42.0, 23.0, 43.0, 34.0, 33.0, 23.0, 20.0, 19.0, 17.0, 14.0, 16.0, 12.0, 9.0, 8.0, 6.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.244494438171387, -9.893935203552246, -9.543375968933105, -9.192816734313965, -8.842257499694824, -8.491697311401367, -8.141138076782227, -7.790578842163086, -7.440019607543945, -7.089460372924805, -6.738901138305664, -6.388341903686523, -6.037782192230225, -5.687222957611084, -5.336663722991943, -4.9861040115356445, -4.635545253753662, -4.2849860191345215, -3.9344265460968018, -3.583867311477661, -3.2333078384399414, -2.882748603820801, -2.53218936920166, -2.1816298961639404, -1.8310706615447998, -1.4805113077163696, -1.1299519538879395, -0.7793927192687988, -0.42883336544036865, -0.07827401161193848, 0.27228522300720215, 0.6228446960449219, 0.9734039306640625, 1.3239632844924927, 1.6745226383209229, 2.0250818729400635, 2.375641345977783, 2.726200580596924, 3.0767598152160645, 3.427319288253784, 3.777878522872925, 4.1284379959106445, 4.478997230529785, 4.829556465148926, 5.180115699768066, 5.530674934387207, 5.881234169006348, 6.2317938804626465, 6.582353115081787, 6.932912349700928, 7.283471584320068, 7.634031295776367, 7.984590530395508, 8.335149765014648, 8.685708999633789, 9.03626823425293, 9.38682746887207, 9.737386703491211, 10.087945938110352, 10.438505172729492, 10.789064407348633, 11.139623641967773, 11.490182876586914, 11.840743064880371, 12.191302299499512]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 12.0, 7.0, 16.0, 22.0, 35.0, 44.0, 82.0, 110.0, 145.0, 261.0, 405.0, 648.0, 1028.0, 1616.0, 2689.0, 4948.0, 9112.0, 18598.0, 41480.0, 109493.0, 333596.0, 976617.0, 1491960.0, 790325.0, 256893.0, 85761.0, 34045.0, 15805.0, 8134.0, 4362.0, 2469.0, 1396.0, 829.0, 541.0, 270.0, 179.0, 121.0, 68.0, 55.0, 40.0, 24.0, 15.0, 8.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-31.171875, -30.265380859375, -29.35888671875, -28.452392578125, -27.5458984375, -26.639404296875, -25.73291015625, -24.826416015625, -23.919921875, -23.013427734375, -22.10693359375, -21.200439453125, -20.2939453125, -19.387451171875, -18.48095703125, -17.574462890625, -16.66796875, -15.761474609375, -14.85498046875, -13.948486328125, -13.0419921875, -12.135498046875, -11.22900390625, -10.322509765625, -9.416015625, -8.509521484375, -7.60302734375, -6.696533203125, -5.7900390625, -4.883544921875, -3.97705078125, -3.070556640625, -2.1640625, -1.257568359375, -0.35107421875, 0.555419921875, 1.4619140625, 2.368408203125, 3.27490234375, 4.181396484375, 5.087890625, 5.994384765625, 6.90087890625, 7.807373046875, 8.7138671875, 9.620361328125, 10.52685546875, 11.433349609375, 12.33984375, 13.246337890625, 14.15283203125, 15.059326171875, 15.9658203125, 16.872314453125, 17.77880859375, 18.685302734375, 19.591796875, 20.498291015625, 21.40478515625, 22.311279296875, 23.2177734375, 24.124267578125, 25.03076171875, 25.937255859375, 26.84375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 9.0, 6.0, 5.0, 10.0, 9.0, 15.0, 10.0, 11.0, 18.0, 18.0, 26.0, 14.0, 25.0, 23.0, 27.0, 32.0, 20.0, 32.0, 38.0, 49.0, 39.0, 35.0, 41.0, 41.0, 36.0, 30.0, 39.0, 37.0, 27.0, 34.0, 29.0, 39.0, 24.0, 24.0, 15.0, 23.0, 21.0, 12.0, 10.0, 12.0, 6.0, 9.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0234375, -8.715576171875, -8.40771484375, -8.099853515625, -7.7919921875, -7.484130859375, -7.17626953125, -6.868408203125, -6.560546875, -6.252685546875, -5.94482421875, -5.636962890625, -5.3291015625, -5.021240234375, -4.71337890625, -4.405517578125, -4.09765625, -3.789794921875, -3.48193359375, -3.174072265625, -2.8662109375, -2.558349609375, -2.25048828125, -1.942626953125, -1.634765625, -1.326904296875, -1.01904296875, -0.711181640625, -0.4033203125, -0.095458984375, 0.21240234375, 0.520263671875, 0.828125, 1.135986328125, 1.44384765625, 1.751708984375, 2.0595703125, 2.367431640625, 2.67529296875, 2.983154296875, 3.291015625, 3.598876953125, 3.90673828125, 4.214599609375, 4.5224609375, 4.830322265625, 5.13818359375, 5.446044921875, 5.75390625, 6.061767578125, 6.36962890625, 6.677490234375, 6.9853515625, 7.293212890625, 7.60107421875, 7.908935546875, 8.216796875, 8.524658203125, 8.83251953125, 9.140380859375, 9.4482421875, 9.756103515625, 10.06396484375, 10.371826171875, 10.6796875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 11.0, 18.0, 12.0, 18.0, 34.0, 46.0, 98.0, 171.0, 233.0, 448.0, 723.0, 1234.0, 2021.0, 3574.0, 6007.0, 11052.0, 21441.0, 42555.0, 90706.0, 209454.0, 498209.0, 1004084.0, 1137695.0, 652965.0, 279056.0, 119080.0, 54280.0, 27078.0, 14131.0, 7517.0, 4228.0, 2448.0, 1399.0, 882.0, 545.0, 326.0, 197.0, 125.0, 70.0, 33.0, 28.0, 18.0, 7.0, 12.0, 10.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.546875, -25.63671875, -24.7265625, -23.81640625, -22.90625, -21.99609375, -21.0859375, -20.17578125, -19.265625, -18.35546875, -17.4453125, -16.53515625, -15.625, -14.71484375, -13.8046875, -12.89453125, -11.984375, -11.07421875, -10.1640625, -9.25390625, -8.34375, -7.43359375, -6.5234375, -5.61328125, -4.703125, -3.79296875, -2.8828125, -1.97265625, -1.0625, -0.15234375, 0.7578125, 1.66796875, 2.578125, 3.48828125, 4.3984375, 5.30859375, 6.21875, 7.12890625, 8.0390625, 8.94921875, 9.859375, 10.76953125, 11.6796875, 12.58984375, 13.5, 14.41015625, 15.3203125, 16.23046875, 17.140625, 18.05078125, 18.9609375, 19.87109375, 20.78125, 21.69140625, 22.6015625, 23.51171875, 24.421875, 25.33203125, 26.2421875, 27.15234375, 28.0625, 28.97265625, 29.8828125, 30.79296875, 31.703125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 10.0, 24.0, 23.0, 30.0, 40.0, 47.0, 78.0, 70.0, 99.0, 133.0, 154.0, 190.0, 258.0, 265.0, 277.0, 314.0, 327.0, 297.0, 282.0, 235.0, 203.0, 159.0, 138.0, 94.0, 94.0, 50.0, 48.0, 36.0, 29.0, 11.0, 12.0, 15.0, 11.0, 5.0, 6.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.749267578125, -8.49853515625, -8.247802734375, -7.9970703125, -7.746337890625, -7.49560546875, -7.244873046875, -6.994140625, -6.743408203125, -6.49267578125, -6.241943359375, -5.9912109375, -5.740478515625, -5.48974609375, -5.239013671875, -4.98828125, -4.737548828125, -4.48681640625, -4.236083984375, -3.9853515625, -3.734619140625, -3.48388671875, -3.233154296875, -2.982421875, -2.731689453125, -2.48095703125, -2.230224609375, -1.9794921875, -1.728759765625, -1.47802734375, -1.227294921875, -0.9765625, -0.725830078125, -0.47509765625, -0.224365234375, 0.0263671875, 0.277099609375, 0.52783203125, 0.778564453125, 1.029296875, 1.280029296875, 1.53076171875, 1.781494140625, 2.0322265625, 2.282958984375, 2.53369140625, 2.784423828125, 3.03515625, 3.285888671875, 3.53662109375, 3.787353515625, 4.0380859375, 4.288818359375, 4.53955078125, 4.790283203125, 5.041015625, 5.291748046875, 5.54248046875, 5.793212890625, 6.0439453125, 6.294677734375, 6.54541015625, 6.796142578125, 7.046875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 3.0, 11.0, 7.0, 10.0, 12.0, 18.0, 13.0, 22.0, 29.0, 37.0, 37.0, 47.0, 61.0, 65.0, 64.0, 54.0, 59.0, 60.0, 60.0, 44.0, 46.0, 47.0, 37.0, 33.0, 23.0, 26.0, 20.0, 7.0, 8.0, 6.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.552993774414062, -21.752286911010742, -20.951581954956055, -20.150875091552734, -19.350170135498047, -18.549463272094727, -17.748756408691406, -16.94805145263672, -16.14734649658203, -15.346640586853027, -14.545934677124023, -13.745227813720703, -12.944522857666016, -12.143815994262695, -11.343110084533691, -10.542404174804688, -9.741697311401367, -8.940991401672363, -8.14028549194336, -7.339579105377197, -6.538873195648193, -5.7381672859191895, -4.937460899353027, -4.136754989624023, -3.3360490798950195, -2.5353431701660156, -1.7346370220184326, -0.9339308738708496, -0.1332249641418457, 0.6674809455871582, 1.4681873321533203, 2.268893241882324, 3.069601058959961, 3.870306968688965, 4.671012878417969, 5.471719264984131, 6.272425174713135, 7.073131084442139, 7.873837471008301, 8.674543380737305, 9.475249290466309, 10.275955200195312, 11.076661109924316, 11.87736701965332, 12.67807388305664, 13.478778839111328, 14.279485702514648, 15.080191612243652, 15.880897521972656, 16.681604385375977, 17.482309341430664, 18.283016204833984, 19.083721160888672, 19.884428024291992, 20.685134887695312, 21.48583984375, 22.286544799804688, 23.087251663208008, 23.887956619262695, 24.688663482666016, 25.489368438720703, 26.290075302124023, 27.090782165527344, 27.89148712158203, 28.69219398498535]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 8.0, 8.0, 6.0, 3.0, 9.0, 8.0, 11.0, 16.0, 15.0, 23.0, 18.0, 23.0, 23.0, 22.0, 39.0, 29.0, 27.0, 32.0, 47.0, 37.0, 46.0, 39.0, 66.0, 51.0, 37.0, 33.0, 31.0, 38.0, 39.0, 34.0, 29.0, 29.0, 24.0, 26.0, 7.0, 15.0, 14.0, 9.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.265556335449219, -13.828651428222656, -13.391746520996094, -12.954841613769531, -12.517937660217285, -12.081032752990723, -11.64412784576416, -11.207222938537598, -10.770318984985352, -10.333414077758789, -9.896509170532227, -9.459604263305664, -9.022700309753418, -8.585795402526855, -8.148890495300293, -7.7119855880737305, -7.275080680847168, -6.8381757736206055, -6.401271343231201, -5.964366436004639, -5.527462005615234, -5.090557098388672, -4.653652191162109, -4.216747283935547, -3.7798428535461426, -3.342938184738159, -2.906033515930176, -2.4691286087036133, -2.03222393989563, -1.5953192710876465, -1.158414363861084, -0.7215096950531006, -0.2846059799194336, 0.15229874849319458, 0.5892034769058228, 1.0261082649230957, 1.463012933731079, 1.8999176025390625, 2.336822509765625, 2.7737271785736084, 3.210631847381592, 3.647536516189575, 4.084441184997559, 4.521346092224121, 4.958250999450684, 5.395155429840088, 5.83206033706665, 6.268964767456055, 6.705869674682617, 7.14277458190918, 7.579679012298584, 8.016584396362305, 8.45348834991455, 8.890393257141113, 9.327298164367676, 9.764203071594238, 10.201107025146484, 10.638011932373047, 11.07491683959961, 11.511821746826172, 11.948725700378418, 12.38563060760498, 12.822535514831543, 13.259440422058105, 13.696345329284668]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 4.0, 6.0, 11.0, 10.0, 30.0, 36.0, 58.0, 96.0, 145.0, 274.0, 571.0, 1082.0, 2323.0, 5339.0, 11805.0, 28068.0, 68746.0, 161561.0, 293300.0, 258309.0, 125620.0, 52538.0, 21503.0, 9309.0, 4042.0, 1821.0, 899.0, 440.0, 230.0, 135.0, 84.0, 40.0, 31.0, 19.0, 13.0, 14.0, 6.0, 8.0, 6.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.2734375, -12.8431396484375, -12.412841796875, -11.9825439453125, -11.55224609375, -11.1219482421875, -10.691650390625, -10.2613525390625, -9.8310546875, -9.4007568359375, -8.970458984375, -8.5401611328125, -8.10986328125, -7.6795654296875, -7.249267578125, -6.8189697265625, -6.388671875, -5.9583740234375, -5.528076171875, -5.0977783203125, -4.66748046875, -4.2371826171875, -3.806884765625, -3.3765869140625, -2.9462890625, -2.5159912109375, -2.085693359375, -1.6553955078125, -1.22509765625, -0.7947998046875, -0.364501953125, 0.0657958984375, 0.49609375, 0.9263916015625, 1.356689453125, 1.7869873046875, 2.21728515625, 2.6475830078125, 3.077880859375, 3.5081787109375, 3.9384765625, 4.3687744140625, 4.799072265625, 5.2293701171875, 5.65966796875, 6.0899658203125, 6.520263671875, 6.9505615234375, 7.380859375, 7.8111572265625, 8.241455078125, 8.6717529296875, 9.10205078125, 9.5323486328125, 9.962646484375, 10.3929443359375, 10.8232421875, 11.2535400390625, 11.683837890625, 12.1141357421875, 12.54443359375, 12.9747314453125, 13.405029296875, 13.8353271484375, 14.265625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 2.0, 10.0, 5.0, 8.0, 13.0, 22.0, 14.0, 19.0, 22.0, 21.0, 23.0, 37.0, 26.0, 42.0, 33.0, 36.0, 45.0, 45.0, 52.0, 52.0, 34.0, 44.0, 45.0, 35.0, 36.0, 32.0, 38.0, 32.0, 31.0, 26.0, 16.0, 17.0, 13.0, 12.0, 12.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.0, -15.5155029296875, -15.031005859375, -14.5465087890625, -14.06201171875, -13.5775146484375, -13.093017578125, -12.6085205078125, -12.1240234375, -11.6395263671875, -11.155029296875, -10.6705322265625, -10.18603515625, -9.7015380859375, -9.217041015625, -8.7325439453125, -8.248046875, -7.7635498046875, -7.279052734375, -6.7945556640625, -6.31005859375, -5.8255615234375, -5.341064453125, -4.8565673828125, -4.3720703125, -3.8875732421875, -3.403076171875, -2.9185791015625, -2.43408203125, -1.9495849609375, -1.465087890625, -0.9805908203125, -0.49609375, -0.0115966796875, 0.472900390625, 0.9573974609375, 1.44189453125, 1.9263916015625, 2.410888671875, 2.8953857421875, 3.3798828125, 3.8643798828125, 4.348876953125, 4.8333740234375, 5.31787109375, 5.8023681640625, 6.286865234375, 6.7713623046875, 7.255859375, 7.7403564453125, 8.224853515625, 8.7093505859375, 9.19384765625, 9.6783447265625, 10.162841796875, 10.6473388671875, 11.1318359375, 11.6163330078125, 12.100830078125, 12.5853271484375, 13.06982421875, 13.5543212890625, 14.038818359375, 14.5233154296875, 15.0078125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 19.0, 20.0, 26.0, 32.0, 60.0, 100.0, 155.0, 233.0, 393.0, 702.0, 1232.0, 2248.0, 4129.0, 8035.0, 17368.0, 38406.0, 91707.0, 213398.0, 319092.0, 198201.0, 84289.0, 35915.0, 16113.0, 7857.0, 3960.0, 2019.0, 1132.0, 668.0, 402.0, 223.0, 149.0, 93.0, 51.0, 44.0, 21.0, 18.0, 8.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1484375, -13.683837890625, -13.21923828125, -12.754638671875, -12.2900390625, -11.825439453125, -11.36083984375, -10.896240234375, -10.431640625, -9.967041015625, -9.50244140625, -9.037841796875, -8.5732421875, -8.108642578125, -7.64404296875, -7.179443359375, -6.71484375, -6.250244140625, -5.78564453125, -5.321044921875, -4.8564453125, -4.391845703125, -3.92724609375, -3.462646484375, -2.998046875, -2.533447265625, -2.06884765625, -1.604248046875, -1.1396484375, -0.675048828125, -0.21044921875, 0.254150390625, 0.71875, 1.183349609375, 1.64794921875, 2.112548828125, 2.5771484375, 3.041748046875, 3.50634765625, 3.970947265625, 4.435546875, 4.900146484375, 5.36474609375, 5.829345703125, 6.2939453125, 6.758544921875, 7.22314453125, 7.687744140625, 8.15234375, 8.616943359375, 9.08154296875, 9.546142578125, 10.0107421875, 10.475341796875, 10.93994140625, 11.404541015625, 11.869140625, 12.333740234375, 12.79833984375, 13.262939453125, 13.7275390625, 14.192138671875, 14.65673828125, 15.121337890625, 15.5859375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 3.0, 6.0, 5.0, 5.0, 11.0, 14.0, 12.0, 11.0, 14.0, 16.0, 29.0, 23.0, 28.0, 27.0, 38.0, 38.0, 30.0, 28.0, 29.0, 53.0, 34.0, 42.0, 44.0, 37.0, 26.0, 28.0, 31.0, 41.0, 40.0, 36.0, 33.0, 22.0, 24.0, 22.0, 19.0, 11.0, 17.0, 10.0, 13.0, 14.0, 6.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.125, -8.8516845703125, -8.578369140625, -8.3050537109375, -8.03173828125, -7.7584228515625, -7.485107421875, -7.2117919921875, -6.9384765625, -6.6651611328125, -6.391845703125, -6.1185302734375, -5.84521484375, -5.5718994140625, -5.298583984375, -5.0252685546875, -4.751953125, -4.4786376953125, -4.205322265625, -3.9320068359375, -3.65869140625, -3.3853759765625, -3.112060546875, -2.8387451171875, -2.5654296875, -2.2921142578125, -2.018798828125, -1.7454833984375, -1.47216796875, -1.1988525390625, -0.925537109375, -0.6522216796875, -0.37890625, -0.1055908203125, 0.167724609375, 0.4410400390625, 0.71435546875, 0.9876708984375, 1.260986328125, 1.5343017578125, 1.8076171875, 2.0809326171875, 2.354248046875, 2.6275634765625, 2.90087890625, 3.1741943359375, 3.447509765625, 3.7208251953125, 3.994140625, 4.2674560546875, 4.540771484375, 4.8140869140625, 5.08740234375, 5.3607177734375, 5.634033203125, 5.9073486328125, 6.1806640625, 6.4539794921875, 6.727294921875, 7.0006103515625, 7.27392578125, 7.5472412109375, 7.820556640625, 8.0938720703125, 8.3671875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 15.0, 15.0, 32.0, 45.0, 58.0, 78.0, 95.0, 166.0, 228.0, 368.0, 522.0, 809.0, 1139.0, 1786.0, 2960.0, 4720.0, 8246.0, 14682.0, 26791.0, 52190.0, 102072.0, 193308.0, 257209.0, 181418.0, 93585.0, 47658.0, 24917.0, 13532.0, 7649.0, 4527.0, 2777.0, 1722.0, 1102.0, 692.0, 454.0, 299.0, 203.0, 150.0, 99.0, 71.0, 62.0, 39.0, 18.0, 18.0, 7.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.33984375, -5.17523193359375, -5.0106201171875, -4.84600830078125, -4.681396484375, -4.51678466796875, -4.3521728515625, -4.18756103515625, -4.02294921875, -3.85833740234375, -3.6937255859375, -3.52911376953125, -3.364501953125, -3.19989013671875, -3.0352783203125, -2.87066650390625, -2.7060546875, -2.54144287109375, -2.3768310546875, -2.21221923828125, -2.047607421875, -1.88299560546875, -1.7183837890625, -1.55377197265625, -1.38916015625, -1.22454833984375, -1.0599365234375, -0.89532470703125, -0.730712890625, -0.56610107421875, -0.4014892578125, -0.23687744140625, -0.072265625, 0.09234619140625, 0.2569580078125, 0.42156982421875, 0.586181640625, 0.75079345703125, 0.9154052734375, 1.08001708984375, 1.24462890625, 1.40924072265625, 1.5738525390625, 1.73846435546875, 1.903076171875, 2.06768798828125, 2.2322998046875, 2.39691162109375, 2.5615234375, 2.72613525390625, 2.8907470703125, 3.05535888671875, 3.219970703125, 3.38458251953125, 3.5491943359375, 3.71380615234375, 3.87841796875, 4.04302978515625, 4.2076416015625, 4.37225341796875, 4.536865234375, 4.70147705078125, 4.8660888671875, 5.03070068359375, 5.1953125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 8.0, 6.0, 9.0, 11.0, 12.0, 16.0, 21.0, 30.0, 37.0, 39.0, 40.0, 68.0, 70.0, 73.0, 64.0, 70.0, 73.0, 57.0, 52.0, 42.0, 49.0, 24.0, 31.0, 22.0, 20.0, 13.0, 11.0, 9.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002281665802001953, -0.00022015348076820374, -0.00021214038133621216, -0.00020412728190422058, -0.000196114182472229, -0.00018810108304023743, -0.00018008798360824585, -0.00017207488417625427, -0.0001640617847442627, -0.00015604868531227112, -0.00014803558588027954, -0.00014002248644828796, -0.0001320093870162964, -0.0001239962875843048, -0.00011598318815231323, -0.00010797008872032166, -9.995698928833008e-05, -9.19438898563385e-05, -8.393079042434692e-05, -7.591769099235535e-05, -6.790459156036377e-05, -5.989149212837219e-05, -5.1878392696380615e-05, -4.386529326438904e-05, -3.585219383239746e-05, -2.7839094400405884e-05, -1.9825994968414307e-05, -1.181289553642273e-05, -3.7997961044311523e-06, 4.213303327560425e-06, 1.2226402759552002e-05, 2.023950219154358e-05, 2.8252601623535156e-05, 3.6265701055526733e-05, 4.427880048751831e-05, 5.229189991950989e-05, 6.0304999351501465e-05, 6.831809878349304e-05, 7.633119821548462e-05, 8.43442976474762e-05, 9.235739707946777e-05, 0.00010037049651145935, 0.00010838359594345093, 0.0001163966953754425, 0.00012440979480743408, 0.00013242289423942566, 0.00014043599367141724, 0.0001484490931034088, 0.0001564621925354004, 0.00016447529196739197, 0.00017248839139938354, 0.00018050149083137512, 0.0001885145902633667, 0.00019652768969535828, 0.00020454078912734985, 0.00021255388855934143, 0.000220566987991333, 0.00022858008742332458, 0.00023659318685531616, 0.00024460628628730774, 0.0002526193857192993, 0.0002606324851512909, 0.00026864558458328247, 0.00027665868401527405, 0.0002846717834472656]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 14.0, 16.0, 25.0, 40.0, 44.0, 81.0, 126.0, 193.0, 290.0, 455.0, 695.0, 1081.0, 1727.0, 3005.0, 5038.0, 8915.0, 16625.0, 32341.0, 63861.0, 126721.0, 219086.0, 240968.0, 158064.0, 81463.0, 40902.0, 20770.0, 10889.0, 6069.0, 3490.0, 2025.0, 1266.0, 769.0, 509.0, 331.0, 211.0, 155.0, 77.0, 61.0, 53.0, 31.0, 23.0, 13.0, 10.0, 5.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.96875, -6.75213623046875, -6.5355224609375, -6.31890869140625, -6.102294921875, -5.88568115234375, -5.6690673828125, -5.45245361328125, -5.23583984375, -5.01922607421875, -4.8026123046875, -4.58599853515625, -4.369384765625, -4.15277099609375, -3.9361572265625, -3.71954345703125, -3.5029296875, -3.28631591796875, -3.0697021484375, -2.85308837890625, -2.636474609375, -2.41986083984375, -2.2032470703125, -1.98663330078125, -1.77001953125, -1.55340576171875, -1.3367919921875, -1.12017822265625, -0.903564453125, -0.68695068359375, -0.4703369140625, -0.25372314453125, -0.037109375, 0.17950439453125, 0.3961181640625, 0.61273193359375, 0.829345703125, 1.04595947265625, 1.2625732421875, 1.47918701171875, 1.69580078125, 1.91241455078125, 2.1290283203125, 2.34564208984375, 2.562255859375, 2.77886962890625, 2.9954833984375, 3.21209716796875, 3.4287109375, 3.64532470703125, 3.8619384765625, 4.07855224609375, 4.295166015625, 4.51177978515625, 4.7283935546875, 4.94500732421875, 5.16162109375, 5.37823486328125, 5.5948486328125, 5.81146240234375, 6.028076171875, 6.24468994140625, 6.4613037109375, 6.67791748046875, 6.89453125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 10.0, 10.0, 14.0, 14.0, 26.0, 30.0, 39.0, 49.0, 64.0, 67.0, 64.0, 82.0, 91.0, 76.0, 58.0, 55.0, 56.0, 37.0, 36.0, 34.0, 22.0, 18.0, 8.0, 8.0, 6.0, 4.0, 6.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.94921875, -1.888427734375, -1.82763671875, -1.766845703125, -1.7060546875, -1.645263671875, -1.58447265625, -1.523681640625, -1.462890625, -1.402099609375, -1.34130859375, -1.280517578125, -1.2197265625, -1.158935546875, -1.09814453125, -1.037353515625, -0.9765625, -0.915771484375, -0.85498046875, -0.794189453125, -0.7333984375, -0.672607421875, -0.61181640625, -0.551025390625, -0.490234375, -0.429443359375, -0.36865234375, -0.307861328125, -0.2470703125, -0.186279296875, -0.12548828125, -0.064697265625, -0.00390625, 0.056884765625, 0.11767578125, 0.178466796875, 0.2392578125, 0.300048828125, 0.36083984375, 0.421630859375, 0.482421875, 0.543212890625, 0.60400390625, 0.664794921875, 0.7255859375, 0.786376953125, 0.84716796875, 0.907958984375, 0.96875, 1.029541015625, 1.09033203125, 1.151123046875, 1.2119140625, 1.272705078125, 1.33349609375, 1.394287109375, 1.455078125, 1.515869140625, 1.57666015625, 1.637451171875, 1.6982421875, 1.759033203125, 1.81982421875, 1.880615234375, 1.94140625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 0.0, 8.0, 6.0, 5.0, 8.0, 20.0, 15.0, 15.0, 14.0, 26.0, 30.0, 42.0, 33.0, 66.0, 70.0, 63.0, 52.0, 59.0, 72.0, 55.0, 46.0, 51.0, 47.0, 38.0, 34.0, 27.0, 20.0, 20.0, 15.0, 6.0, 7.0, 6.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.030563354492188, -23.214033126831055, -22.397502899169922, -21.580974578857422, -20.76444435119629, -19.947914123535156, -19.131383895874023, -18.31485366821289, -17.49832534790039, -16.681795120239258, -15.865265846252441, -15.048735618591309, -14.232206344604492, -13.41567611694336, -12.599145889282227, -11.782615661621094, -10.966085433959961, -10.149555206298828, -9.333025932312012, -8.516495704650879, -7.699965953826904, -6.88343620300293, -6.066905975341797, -5.250376224517822, -4.433846473693848, -3.617316722869873, -2.8007867336273193, -1.9842567443847656, -1.167726993560791, -0.3511972427368164, 0.4653329849243164, 1.281862735748291, 2.0983943939208984, 2.914924144744873, 3.7314541339874268, 4.5479841232299805, 5.364513874053955, 6.18104362487793, 6.9975738525390625, 7.814103603363037, 8.630633354187012, 9.447163581848145, 10.263692855834961, 11.080223083496094, 11.896753311157227, 12.713282585144043, 13.529812812805176, 14.346342086791992, 15.162872314453125, 15.979402542114258, 16.79593276977539, 17.61246109008789, 18.428991317749023, 19.245521545410156, 20.06205177307129, 20.878582000732422, 21.695110321044922, 22.511640548706055, 23.328170776367188, 24.144699096679688, 24.96122932434082, 25.777759552001953, 26.594289779663086, 27.41082000732422, 28.22735023498535]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 4.0, 6.0, 6.0, 4.0, 4.0, 11.0, 13.0, 10.0, 15.0, 18.0, 22.0, 17.0, 23.0, 26.0, 32.0, 29.0, 26.0, 28.0, 36.0, 33.0, 37.0, 54.0, 46.0, 57.0, 50.0, 30.0, 36.0, 32.0, 34.0, 47.0, 34.0, 29.0, 24.0, 34.0, 14.0, 6.0, 15.0, 19.0, 9.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.910043716430664, -13.482439041137695, -13.054834365844727, -12.627229690551758, -12.199624061584473, -11.772019386291504, -11.344414710998535, -10.916810035705566, -10.489204406738281, -10.061599731445312, -9.633995056152344, -9.206390380859375, -8.77878475189209, -8.351180076599121, -7.923575401306152, -7.495970726013184, -7.068366050720215, -6.640761375427246, -6.213156223297119, -5.78555154800415, -5.357946395874023, -4.930341720581055, -4.502737045288086, -4.075132369995117, -3.6475272178649902, -3.2199223041534424, -2.7923173904418945, -2.364712715148926, -1.937107801437378, -1.50950288772583, -1.0818982124328613, -0.6542932987213135, -0.22668743133544922, 0.20091742277145386, 0.6285222768783569, 1.0561270713806152, 1.483731985092163, 1.911336898803711, 2.3389415740966797, 2.7665464878082275, 3.1941514015197754, 3.6217563152313232, 4.049361228942871, 4.47696590423584, 4.904570579528809, 5.3321757316589355, 5.759780406951904, 6.187385559082031, 6.614990234375, 7.042594909667969, 7.470200061798096, 7.8978047370910645, 8.325409889221191, 8.75301456451416, 9.180619239807129, 9.608223915100098, 10.035829544067383, 10.463434219360352, 10.89103889465332, 11.318643569946289, 11.746249198913574, 12.173853874206543, 12.601458549499512, 13.02906322479248, 13.45666790008545]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 7.0, 10.0, 15.0, 15.0, 29.0, 41.0, 51.0, 66.0, 110.0, 145.0, 218.0, 281.0, 401.0, 584.0, 879.0, 1407.0, 2390.0, 4755.0, 10112.0, 24230.0, 58902.0, 137670.0, 252460.0, 268970.0, 160655.0, 70718.0, 28511.0, 12007.0, 5427.0, 2797.0, 1613.0, 992.0, 624.0, 437.0, 295.0, 207.0, 138.0, 113.0, 80.0, 39.0, 35.0, 30.0, 34.0, 16.0, 12.0, 3.0, 13.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.084716796875, -18.45068359375, -17.816650390625, -17.1826171875, -16.548583984375, -15.91455078125, -15.280517578125, -14.646484375, -14.012451171875, -13.37841796875, -12.744384765625, -12.1103515625, -11.476318359375, -10.84228515625, -10.208251953125, -9.57421875, -8.940185546875, -8.30615234375, -7.672119140625, -7.0380859375, -6.404052734375, -5.77001953125, -5.135986328125, -4.501953125, -3.867919921875, -3.23388671875, -2.599853515625, -1.9658203125, -1.331787109375, -0.69775390625, -0.063720703125, 0.5703125, 1.204345703125, 1.83837890625, 2.472412109375, 3.1064453125, 3.740478515625, 4.37451171875, 5.008544921875, 5.642578125, 6.276611328125, 6.91064453125, 7.544677734375, 8.1787109375, 8.812744140625, 9.44677734375, 10.080810546875, 10.71484375, 11.348876953125, 11.98291015625, 12.616943359375, 13.2509765625, 13.885009765625, 14.51904296875, 15.153076171875, 15.787109375, 16.421142578125, 17.05517578125, 17.689208984375, 18.3232421875, 18.957275390625, 19.59130859375, 20.225341796875, 20.859375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 9.0, 2.0, 4.0, 8.0, 7.0, 11.0, 14.0, 15.0, 20.0, 12.0, 10.0, 25.0, 28.0, 27.0, 22.0, 24.0, 28.0, 42.0, 35.0, 47.0, 42.0, 39.0, 49.0, 47.0, 51.0, 35.0, 33.0, 42.0, 38.0, 33.0, 28.0, 35.0, 20.0, 20.0, 14.0, 17.0, 11.0, 10.0, 10.0, 6.0, 9.0, 7.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-14.1171875, -13.6663818359375, -13.215576171875, -12.7647705078125, -12.31396484375, -11.8631591796875, -11.412353515625, -10.9615478515625, -10.5107421875, -10.0599365234375, -9.609130859375, -9.1583251953125, -8.70751953125, -8.2567138671875, -7.805908203125, -7.3551025390625, -6.904296875, -6.4534912109375, -6.002685546875, -5.5518798828125, -5.10107421875, -4.6502685546875, -4.199462890625, -3.7486572265625, -3.2978515625, -2.8470458984375, -2.396240234375, -1.9454345703125, -1.49462890625, -1.0438232421875, -0.593017578125, -0.1422119140625, 0.30859375, 0.7593994140625, 1.210205078125, 1.6610107421875, 2.11181640625, 2.5626220703125, 3.013427734375, 3.4642333984375, 3.9150390625, 4.3658447265625, 4.816650390625, 5.2674560546875, 5.71826171875, 6.1690673828125, 6.619873046875, 7.0706787109375, 7.521484375, 7.9722900390625, 8.423095703125, 8.8739013671875, 9.32470703125, 9.7755126953125, 10.226318359375, 10.6771240234375, 11.1279296875, 11.5787353515625, 12.029541015625, 12.4803466796875, 12.93115234375, 13.3819580078125, 13.832763671875, 14.2835693359375, 14.734375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 6.0, 14.0, 11.0, 9.0, 14.0, 29.0, 35.0, 55.0, 75.0, 100.0, 116.0, 158.0, 218.0, 307.0, 441.0, 642.0, 924.0, 1612.0, 3275.0, 7983.0, 24496.0, 88112.0, 276177.0, 385076.0, 180332.0, 51890.0, 14883.0, 5256.0, 2344.0, 1214.0, 815.0, 535.0, 380.0, 273.0, 217.0, 159.0, 98.0, 70.0, 47.0, 47.0, 27.0, 26.0, 16.0, 21.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.609375, -29.598876953125, -28.58837890625, -27.577880859375, -26.5673828125, -25.556884765625, -24.54638671875, -23.535888671875, -22.525390625, -21.514892578125, -20.50439453125, -19.493896484375, -18.4833984375, -17.472900390625, -16.46240234375, -15.451904296875, -14.44140625, -13.430908203125, -12.42041015625, -11.409912109375, -10.3994140625, -9.388916015625, -8.37841796875, -7.367919921875, -6.357421875, -5.346923828125, -4.33642578125, -3.325927734375, -2.3154296875, -1.304931640625, -0.29443359375, 0.716064453125, 1.7265625, 2.737060546875, 3.74755859375, 4.758056640625, 5.7685546875, 6.779052734375, 7.78955078125, 8.800048828125, 9.810546875, 10.821044921875, 11.83154296875, 12.842041015625, 13.8525390625, 14.863037109375, 15.87353515625, 16.884033203125, 17.89453125, 18.905029296875, 19.91552734375, 20.926025390625, 21.9365234375, 22.947021484375, 23.95751953125, 24.968017578125, 25.978515625, 26.989013671875, 27.99951171875, 29.010009765625, 30.0205078125, 31.031005859375, 32.04150390625, 33.052001953125, 34.0625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 5.0, 13.0, 11.0, 13.0, 17.0, 27.0, 22.0, 21.0, 24.0, 15.0, 23.0, 22.0, 32.0, 38.0, 34.0, 39.0, 39.0, 34.0, 35.0, 44.0, 33.0, 48.0, 42.0, 37.0, 46.0, 34.0, 38.0, 32.0, 24.0, 28.0, 18.0, 15.0, 14.0, 12.0, 10.0, 10.0, 8.0, 7.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.0390625, -8.7491455078125, -8.459228515625, -8.1693115234375, -7.87939453125, -7.5894775390625, -7.299560546875, -7.0096435546875, -6.7197265625, -6.4298095703125, -6.139892578125, -5.8499755859375, -5.56005859375, -5.2701416015625, -4.980224609375, -4.6903076171875, -4.400390625, -4.1104736328125, -3.820556640625, -3.5306396484375, -3.24072265625, -2.9508056640625, -2.660888671875, -2.3709716796875, -2.0810546875, -1.7911376953125, -1.501220703125, -1.2113037109375, -0.92138671875, -0.6314697265625, -0.341552734375, -0.0516357421875, 0.23828125, 0.5281982421875, 0.818115234375, 1.1080322265625, 1.39794921875, 1.6878662109375, 1.977783203125, 2.2677001953125, 2.5576171875, 2.8475341796875, 3.137451171875, 3.4273681640625, 3.71728515625, 4.0072021484375, 4.297119140625, 4.5870361328125, 4.876953125, 5.1668701171875, 5.456787109375, 5.7467041015625, 6.03662109375, 6.3265380859375, 6.616455078125, 6.9063720703125, 7.1962890625, 7.4862060546875, 7.776123046875, 8.0660400390625, 8.35595703125, 8.6458740234375, 8.935791015625, 9.2257080078125, 9.515625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 9.0, 3.0, 13.0, 10.0, 22.0, 32.0, 43.0, 68.0, 97.0, 157.0, 260.0, 378.0, 491.0, 743.0, 1174.0, 1709.0, 2770.0, 4517.0, 8036.0, 16660.0, 40474.0, 101668.0, 222223.0, 293501.0, 198566.0, 87248.0, 34253.0, 14537.0, 7286.0, 4142.0, 2547.0, 1638.0, 1056.0, 733.0, 517.0, 316.0, 208.0, 136.0, 103.0, 73.0, 39.0, 30.0, 25.0, 20.0, 12.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.71875, -9.376708984375, -9.03466796875, -8.692626953125, -8.3505859375, -8.008544921875, -7.66650390625, -7.324462890625, -6.982421875, -6.640380859375, -6.29833984375, -5.956298828125, -5.6142578125, -5.272216796875, -4.93017578125, -4.588134765625, -4.24609375, -3.904052734375, -3.56201171875, -3.219970703125, -2.8779296875, -2.535888671875, -2.19384765625, -1.851806640625, -1.509765625, -1.167724609375, -0.82568359375, -0.483642578125, -0.1416015625, 0.200439453125, 0.54248046875, 0.884521484375, 1.2265625, 1.568603515625, 1.91064453125, 2.252685546875, 2.5947265625, 2.936767578125, 3.27880859375, 3.620849609375, 3.962890625, 4.304931640625, 4.64697265625, 4.989013671875, 5.3310546875, 5.673095703125, 6.01513671875, 6.357177734375, 6.69921875, 7.041259765625, 7.38330078125, 7.725341796875, 8.0673828125, 8.409423828125, 8.75146484375, 9.093505859375, 9.435546875, 9.777587890625, 10.11962890625, 10.461669921875, 10.8037109375, 11.145751953125, 11.48779296875, 11.829833984375, 12.171875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 2.0, 3.0, 4.0, 6.0, 4.0, 9.0, 7.0, 13.0, 16.0, 19.0, 31.0, 26.0, 55.0, 69.0, 67.0, 63.0, 107.0, 89.0, 73.0, 68.0, 66.0, 59.0, 33.0, 22.0, 16.0, 18.0, 17.0, 14.0, 7.0, 6.0, 7.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007643699645996094, -0.0007371082901954651, -0.0007098466157913208, -0.0006825849413871765, -0.0006553232669830322, -0.0006280615925788879, -0.0006007999181747437, -0.0005735382437705994, -0.0005462765693664551, -0.0005190148949623108, -0.0004917532205581665, -0.0004644915461540222, -0.00043722987174987793, -0.00040996819734573364, -0.00038270652294158936, -0.00035544484853744507, -0.0003281831741333008, -0.0003009214997291565, -0.0002736598253250122, -0.0002463981509208679, -0.00021913647651672363, -0.00019187480211257935, -0.00016461312770843506, -0.00013735145330429077, -0.00011008977890014648, -8.28281044960022e-05, -5.556643009185791e-05, -2.8304755687713623e-05, -1.043081283569336e-06, 2.621859312057495e-05, 5.348026752471924e-05, 8.074194192886353e-05, 0.00010800361633300781, 0.0001352652907371521, 0.0001625269651412964, 0.00018978863954544067, 0.00021705031394958496, 0.00024431198835372925, 0.00027157366275787354, 0.0002988353371620178, 0.0003260970115661621, 0.0003533586859703064, 0.0003806203603744507, 0.00040788203477859497, 0.00043514370918273926, 0.00046240538358688354, 0.0004896670579910278, 0.0005169287323951721, 0.0005441904067993164, 0.0005714520812034607, 0.000598713755607605, 0.0006259754300117493, 0.0006532371044158936, 0.0006804987788200378, 0.0007077604532241821, 0.0007350221276283264, 0.0007622838020324707, 0.000789545476436615, 0.0008168071508407593, 0.0008440688252449036, 0.0008713304996490479, 0.0008985921740531921, 0.0009258538484573364, 0.0009531155228614807, 0.000980377197265625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 10.0, 7.0, 16.0, 24.0, 39.0, 44.0, 77.0, 126.0, 169.0, 290.0, 466.0, 805.0, 1319.0, 2457.0, 4849.0, 10333.0, 27546.0, 93489.0, 291335.0, 378064.0, 161703.0, 45774.0, 15454.0, 6571.0, 3323.0, 1689.0, 951.0, 576.0, 373.0, 203.0, 142.0, 97.0, 64.0, 44.0, 35.0, 24.0, 22.0, 10.0, 12.0, 5.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.296875, -12.808349609375, -12.31982421875, -11.831298828125, -11.3427734375, -10.854248046875, -10.36572265625, -9.877197265625, -9.388671875, -8.900146484375, -8.41162109375, -7.923095703125, -7.4345703125, -6.946044921875, -6.45751953125, -5.968994140625, -5.48046875, -4.991943359375, -4.50341796875, -4.014892578125, -3.5263671875, -3.037841796875, -2.54931640625, -2.060791015625, -1.572265625, -1.083740234375, -0.59521484375, -0.106689453125, 0.3818359375, 0.870361328125, 1.35888671875, 1.847412109375, 2.3359375, 2.824462890625, 3.31298828125, 3.801513671875, 4.2900390625, 4.778564453125, 5.26708984375, 5.755615234375, 6.244140625, 6.732666015625, 7.22119140625, 7.709716796875, 8.1982421875, 8.686767578125, 9.17529296875, 9.663818359375, 10.15234375, 10.640869140625, 11.12939453125, 11.617919921875, 12.1064453125, 12.594970703125, 13.08349609375, 13.572021484375, 14.060546875, 14.549072265625, 15.03759765625, 15.526123046875, 16.0146484375, 16.503173828125, 16.99169921875, 17.480224609375, 17.96875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 8.0, 6.0, 8.0, 12.0, 19.0, 26.0, 32.0, 41.0, 51.0, 75.0, 61.0, 66.0, 80.0, 94.0, 78.0, 66.0, 66.0, 45.0, 46.0, 35.0, 26.0, 11.0, 6.0, 11.0, 10.0, 2.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8984375, -2.808074951171875, -2.71771240234375, -2.627349853515625, -2.5369873046875, -2.446624755859375, -2.35626220703125, -2.265899658203125, -2.175537109375, -2.085174560546875, -1.99481201171875, -1.904449462890625, -1.8140869140625, -1.723724365234375, -1.63336181640625, -1.542999267578125, -1.45263671875, -1.362274169921875, -1.27191162109375, -1.181549072265625, -1.0911865234375, -1.000823974609375, -0.91046142578125, -0.820098876953125, -0.729736328125, -0.639373779296875, -0.54901123046875, -0.458648681640625, -0.3682861328125, -0.277923583984375, -0.18756103515625, -0.097198486328125, -0.0068359375, 0.083526611328125, 0.17388916015625, 0.264251708984375, 0.3546142578125, 0.444976806640625, 0.53533935546875, 0.625701904296875, 0.716064453125, 0.806427001953125, 0.89678955078125, 0.987152099609375, 1.0775146484375, 1.167877197265625, 1.25823974609375, 1.348602294921875, 1.43896484375, 1.529327392578125, 1.61968994140625, 1.710052490234375, 1.8004150390625, 1.890777587890625, 1.98114013671875, 2.071502685546875, 2.161865234375, 2.252227783203125, 2.34259033203125, 2.432952880859375, 2.5233154296875, 2.613677978515625, 2.70404052734375, 2.794403076171875, 2.884765625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 5.0, 9.0, 12.0, 14.0, 9.0, 20.0, 26.0, 28.0, 44.0, 30.0, 59.0, 50.0, 63.0, 49.0, 61.0, 59.0, 73.0, 52.0, 40.0, 46.0, 44.0, 40.0, 38.0, 24.0, 19.0, 12.0, 15.0, 16.0, 6.0, 6.0, 5.0, 2.0, 7.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.312686920166016, -21.490901947021484, -20.66911506652832, -19.84733009338379, -19.025543212890625, -18.203758239746094, -17.381973266601562, -16.5601863861084, -15.73840045928955, -14.916614532470703, -14.094828605651855, -13.273042678833008, -12.451257705688477, -11.629470825195312, -10.807685852050781, -9.985899925231934, -9.164113998413086, -8.342328071594238, -7.520542144775391, -6.698756694793701, -5.8769707679748535, -5.055184841156006, -4.233399391174316, -3.4116134643554688, -2.589827537536621, -1.768041729927063, -0.9462559223175049, -0.12447023391723633, 0.6973156929016113, 1.519101619720459, 2.3408870697021484, 3.162672996520996, 3.9844589233398438, 4.806244850158691, 5.628030776977539, 6.4498162269592285, 7.271602153778076, 8.093387603759766, 8.915173530578613, 9.736959457397461, 10.558745384216309, 11.380531311035156, 12.202317237854004, 13.024103164672852, 13.845888137817383, 14.667675018310547, 15.489459991455078, 16.31124496459961, 17.133031845092773, 17.954816818237305, 18.77660369873047, 19.598388671875, 20.420175552368164, 21.241960525512695, 22.06374740600586, 22.88553237915039, 23.707317352294922, 24.529102325439453, 25.350889205932617, 26.17267417907715, 26.994461059570312, 27.816246032714844, 28.638031005859375, 29.45981788635254, 30.281604766845703]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 7.0, 6.0, 6.0, 8.0, 10.0, 10.0, 17.0, 20.0, 20.0, 17.0, 37.0, 20.0, 23.0, 33.0, 38.0, 40.0, 48.0, 39.0, 50.0, 40.0, 53.0, 39.0, 51.0, 36.0, 36.0, 31.0, 29.0, 34.0, 35.0, 31.0, 22.0, 16.0, 22.0, 12.0, 17.0, 13.0, 8.0, 5.0, 6.0, 3.0, 0.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.957361221313477, -16.446117401123047, -15.934871673583984, -15.423626899719238, -14.912382125854492, -14.401137351989746, -13.889892578125, -13.37864875793457, -12.867403030395508, -12.356158256530762, -11.844913482666016, -11.33366870880127, -10.822423934936523, -10.311179161071777, -9.799934387207031, -9.288690567016602, -8.777445793151855, -8.26620101928711, -7.754956245422363, -7.243711471557617, -6.732466697692871, -6.221221923828125, -5.709977626800537, -5.198732852935791, -4.687488079071045, -4.176243305206299, -3.6649985313415527, -3.1537539958953857, -2.6425092220306396, -2.1312644481658936, -1.6200199127197266, -1.1087751388549805, -0.5975313186645508, -0.08628660440444946, 0.42495810985565186, 0.9362027645111084, 1.4474475383758545, 1.9586923122406006, 2.4699368476867676, 2.9811816215515137, 3.4924263954162598, 4.003671169281006, 4.514915943145752, 5.02616024017334, 5.537405014038086, 6.048649787902832, 6.559894561767578, 7.071139335632324, 7.58238410949707, 8.093628883361816, 8.604873657226562, 9.116118431091309, 9.627363204956055, 10.1386079788208, 10.649852752685547, 11.161096572875977, 11.672342300415039, 12.183587074279785, 12.694831848144531, 13.206076622009277, 13.717321395874023, 14.22856616973877, 14.739810943603516, 15.251054763793945, 15.762299537658691]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 16.0, 14.0, 26.0, 33.0, 57.0, 83.0, 138.0, 260.0, 370.0, 649.0, 1196.0, 2262.0, 4414.0, 8551.0, 18965.0, 46038.0, 126947.0, 407608.0, 1227535.0, 1491336.0, 576063.0, 174162.0, 60209.0, 24070.0, 11067.0, 5476.0, 2821.0, 1582.0, 894.0, 520.0, 341.0, 208.0, 139.0, 67.0, 58.0, 40.0, 15.0, 12.0, 12.0, 8.0, 7.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.1875, -41.80078125, -40.4140625, -39.02734375, -37.640625, -36.25390625, -34.8671875, -33.48046875, -32.09375, -30.70703125, -29.3203125, -27.93359375, -26.546875, -25.16015625, -23.7734375, -22.38671875, -21.0, -19.61328125, -18.2265625, -16.83984375, -15.453125, -14.06640625, -12.6796875, -11.29296875, -9.90625, -8.51953125, -7.1328125, -5.74609375, -4.359375, -2.97265625, -1.5859375, -0.19921875, 1.1875, 2.57421875, 3.9609375, 5.34765625, 6.734375, 8.12109375, 9.5078125, 10.89453125, 12.28125, 13.66796875, 15.0546875, 16.44140625, 17.828125, 19.21484375, 20.6015625, 21.98828125, 23.375, 24.76171875, 26.1484375, 27.53515625, 28.921875, 30.30859375, 31.6953125, 33.08203125, 34.46875, 35.85546875, 37.2421875, 38.62890625, 40.015625, 41.40234375, 42.7890625, 44.17578125, 45.5625]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 4.0, 3.0, 9.0, 7.0, 11.0, 8.0, 8.0, 14.0, 17.0, 18.0, 18.0, 27.0, 19.0, 33.0, 36.0, 27.0, 37.0, 48.0, 50.0, 44.0, 58.0, 40.0, 48.0, 38.0, 40.0, 54.0, 27.0, 39.0, 25.0, 17.0, 30.0, 32.0, 10.0, 23.0, 15.0, 16.0, 12.0, 7.0, 7.0, 4.0, 3.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.296875, -15.77392578125, -15.2509765625, -14.72802734375, -14.205078125, -13.68212890625, -13.1591796875, -12.63623046875, -12.11328125, -11.59033203125, -11.0673828125, -10.54443359375, -10.021484375, -9.49853515625, -8.9755859375, -8.45263671875, -7.9296875, -7.40673828125, -6.8837890625, -6.36083984375, -5.837890625, -5.31494140625, -4.7919921875, -4.26904296875, -3.74609375, -3.22314453125, -2.7001953125, -2.17724609375, -1.654296875, -1.13134765625, -0.6083984375, -0.08544921875, 0.4375, 0.96044921875, 1.4833984375, 2.00634765625, 2.529296875, 3.05224609375, 3.5751953125, 4.09814453125, 4.62109375, 5.14404296875, 5.6669921875, 6.18994140625, 6.712890625, 7.23583984375, 7.7587890625, 8.28173828125, 8.8046875, 9.32763671875, 9.8505859375, 10.37353515625, 10.896484375, 11.41943359375, 11.9423828125, 12.46533203125, 12.98828125, 13.51123046875, 14.0341796875, 14.55712890625, 15.080078125, 15.60302734375, 16.1259765625, 16.64892578125, 17.171875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 12.0, 13.0, 24.0, 46.0, 48.0, 99.0, 167.0, 240.0, 385.0, 648.0, 968.0, 1573.0, 2479.0, 4277.0, 7340.0, 12860.0, 23348.0, 44071.0, 86189.0, 178233.0, 380332.0, 777814.0, 1109075.0, 795358.0, 394644.0, 184388.0, 88447.0, 44999.0, 24063.0, 13267.0, 7614.0, 4431.0, 2598.0, 1552.0, 951.0, 623.0, 388.0, 247.0, 186.0, 105.0, 66.0, 37.0, 23.0, 17.0, 13.0, 8.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.15625, -38.88232421875, -37.6083984375, -36.33447265625, -35.060546875, -33.78662109375, -32.5126953125, -31.23876953125, -29.96484375, -28.69091796875, -27.4169921875, -26.14306640625, -24.869140625, -23.59521484375, -22.3212890625, -21.04736328125, -19.7734375, -18.49951171875, -17.2255859375, -15.95166015625, -14.677734375, -13.40380859375, -12.1298828125, -10.85595703125, -9.58203125, -8.30810546875, -7.0341796875, -5.76025390625, -4.486328125, -3.21240234375, -1.9384765625, -0.66455078125, 0.609375, 1.88330078125, 3.1572265625, 4.43115234375, 5.705078125, 6.97900390625, 8.2529296875, 9.52685546875, 10.80078125, 12.07470703125, 13.3486328125, 14.62255859375, 15.896484375, 17.17041015625, 18.4443359375, 19.71826171875, 20.9921875, 22.26611328125, 23.5400390625, 24.81396484375, 26.087890625, 27.36181640625, 28.6357421875, 29.90966796875, 31.18359375, 32.45751953125, 33.7314453125, 35.00537109375, 36.279296875, 37.55322265625, 38.8271484375, 40.10107421875, 41.375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 10.0, 4.0, 13.0, 14.0, 19.0, 25.0, 41.0, 42.0, 49.0, 65.0, 89.0, 101.0, 119.0, 135.0, 152.0, 193.0, 230.0, 237.0, 251.0, 257.0, 286.0, 279.0, 241.0, 233.0, 167.0, 161.0, 129.0, 116.0, 81.0, 71.0, 66.0, 40.0, 26.0, 29.0, 22.0, 22.0, 11.0, 13.0, 10.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.443603515625, -9.11376953125, -8.783935546875, -8.4541015625, -8.124267578125, -7.79443359375, -7.464599609375, -7.134765625, -6.804931640625, -6.47509765625, -6.145263671875, -5.8154296875, -5.485595703125, -5.15576171875, -4.825927734375, -4.49609375, -4.166259765625, -3.83642578125, -3.506591796875, -3.1767578125, -2.846923828125, -2.51708984375, -2.187255859375, -1.857421875, -1.527587890625, -1.19775390625, -0.867919921875, -0.5380859375, -0.208251953125, 0.12158203125, 0.451416015625, 0.78125, 1.111083984375, 1.44091796875, 1.770751953125, 2.1005859375, 2.430419921875, 2.76025390625, 3.090087890625, 3.419921875, 3.749755859375, 4.07958984375, 4.409423828125, 4.7392578125, 5.069091796875, 5.39892578125, 5.728759765625, 6.05859375, 6.388427734375, 6.71826171875, 7.048095703125, 7.3779296875, 7.707763671875, 8.03759765625, 8.367431640625, 8.697265625, 9.027099609375, 9.35693359375, 9.686767578125, 10.0166015625, 10.346435546875, 10.67626953125, 11.006103515625, 11.3359375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 3.0, 4.0, 4.0, 10.0, 13.0, 16.0, 24.0, 31.0, 21.0, 33.0, 44.0, 59.0, 78.0, 85.0, 73.0, 76.0, 79.0, 72.0, 58.0, 36.0, 46.0, 32.0, 20.0, 13.0, 18.0, 14.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.13146209716797, -44.4886589050293, -42.84585189819336, -41.20304870605469, -39.56024169921875, -37.91743850708008, -36.274635314941406, -34.63182830810547, -32.98902130126953, -31.346216201782227, -29.703411102294922, -28.06060791015625, -26.417800903320312, -24.77499771118164, -23.132192611694336, -21.48938751220703, -19.84658432006836, -18.203779220581055, -16.56097412109375, -14.918169975280762, -13.275364875793457, -11.632559776306152, -9.989755630493164, -8.34695053100586, -6.704145431518555, -5.06134033203125, -3.4185357093811035, -1.775731086730957, -0.13292598724365234, 1.5098791122436523, 3.1526832580566406, 4.795488357543945, 6.438289642333984, 8.081094741821289, 9.723899841308594, 11.366703987121582, 13.009509086608887, 14.652314186096191, 16.29511833190918, 17.937923431396484, 19.58072853088379, 21.223533630371094, 22.8663387298584, 24.509143829345703, 26.151947021484375, 27.794754028320312, 29.437557220458984, 31.08036231994629, 32.723167419433594, 34.365970611572266, 36.0087776184082, 37.651580810546875, 39.29438781738281, 40.937191009521484, 42.579994201660156, 44.222801208496094, 45.86560821533203, 47.5084114074707, 49.15121841430664, 50.79402160644531, 52.43682861328125, 54.07963180541992, 55.722434997558594, 57.36524200439453, 59.0080451965332]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 7.0, 9.0, 10.0, 11.0, 15.0, 28.0, 29.0, 21.0, 29.0, 29.0, 37.0, 44.0, 44.0, 40.0, 50.0, 40.0, 35.0, 59.0, 41.0, 48.0, 47.0, 49.0, 37.0, 32.0, 26.0, 19.0, 26.0, 20.0, 16.0, 21.0, 6.0, 14.0, 9.0, 10.0, 10.0, 3.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.20033836364746, -23.439237594604492, -22.67813491821289, -21.917034149169922, -21.155933380126953, -20.394832611083984, -19.633731842041016, -18.872629165649414, -18.111528396606445, -17.350427627563477, -16.589324951171875, -15.828224182128906, -15.067123413085938, -14.306022644042969, -13.544920921325684, -12.783819198608398, -12.02271842956543, -11.261617660522461, -10.500515937805176, -9.73941421508789, -8.978313446044922, -8.217212677001953, -7.456110954284668, -6.695009708404541, -5.933908462524414, -5.172807216644287, -4.41170597076416, -3.650604724884033, -2.8895034790039062, -2.1284022331237793, -1.3673009872436523, -0.6061997413635254, 0.15489959716796875, 0.9160008430480957, 1.6771020889282227, 2.4382033348083496, 3.1993045806884766, 3.9604058265686035, 4.7215070724487305, 5.482608318328857, 6.243709564208984, 7.004810810089111, 7.765912055969238, 8.527013778686523, 9.288114547729492, 10.049215316772461, 10.810317039489746, 11.571418762207031, 12.33251953125, 13.093620300292969, 13.854722023010254, 14.615823745727539, 15.376924514770508, 16.138025283813477, 16.899127960205078, 17.660228729248047, 18.421329498291016, 19.182430267333984, 19.943531036376953, 20.704633712768555, 21.465734481811523, 22.226835250854492, 22.987937927246094, 23.749038696289062, 24.51013946533203]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 14.0, 6.0, 17.0, 35.0, 46.0, 73.0, 121.0, 195.0, 303.0, 482.0, 793.0, 1258.0, 2049.0, 3299.0, 5425.0, 9223.0, 15195.0, 25505.0, 43007.0, 70647.0, 111380.0, 156347.0, 177733.0, 151480.0, 105377.0, 67288.0, 40828.0, 24234.0, 14553.0, 8452.0, 5090.0, 3100.0, 1872.0, 1193.0, 708.0, 460.0, 286.0, 175.0, 117.0, 70.0, 51.0, 29.0, 14.0, 12.0, 3.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.671875, -12.303955078125, -11.93603515625, -11.568115234375, -11.2001953125, -10.832275390625, -10.46435546875, -10.096435546875, -9.728515625, -9.360595703125, -8.99267578125, -8.624755859375, -8.2568359375, -7.888916015625, -7.52099609375, -7.153076171875, -6.78515625, -6.417236328125, -6.04931640625, -5.681396484375, -5.3134765625, -4.945556640625, -4.57763671875, -4.209716796875, -3.841796875, -3.473876953125, -3.10595703125, -2.738037109375, -2.3701171875, -2.002197265625, -1.63427734375, -1.266357421875, -0.8984375, -0.530517578125, -0.16259765625, 0.205322265625, 0.5732421875, 0.941162109375, 1.30908203125, 1.677001953125, 2.044921875, 2.412841796875, 2.78076171875, 3.148681640625, 3.5166015625, 3.884521484375, 4.25244140625, 4.620361328125, 4.98828125, 5.356201171875, 5.72412109375, 6.092041015625, 6.4599609375, 6.827880859375, 7.19580078125, 7.563720703125, 7.931640625, 8.299560546875, 8.66748046875, 9.035400390625, 9.4033203125, 9.771240234375, 10.13916015625, 10.507080078125, 10.875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 13.0, 3.0, 10.0, 8.0, 8.0, 15.0, 23.0, 22.0, 29.0, 26.0, 29.0, 38.0, 39.0, 39.0, 37.0, 36.0, 57.0, 47.0, 40.0, 51.0, 48.0, 47.0, 43.0, 53.0, 30.0, 29.0, 28.0, 22.0, 26.0, 23.0, 8.0, 17.0, 18.0, 6.0, 10.0, 7.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.90625, -29.03662109375, -28.1669921875, -27.29736328125, -26.427734375, -25.55810546875, -24.6884765625, -23.81884765625, -22.94921875, -22.07958984375, -21.2099609375, -20.34033203125, -19.470703125, -18.60107421875, -17.7314453125, -16.86181640625, -15.9921875, -15.12255859375, -14.2529296875, -13.38330078125, -12.513671875, -11.64404296875, -10.7744140625, -9.90478515625, -9.03515625, -8.16552734375, -7.2958984375, -6.42626953125, -5.556640625, -4.68701171875, -3.8173828125, -2.94775390625, -2.078125, -1.20849609375, -0.3388671875, 0.53076171875, 1.400390625, 2.27001953125, 3.1396484375, 4.00927734375, 4.87890625, 5.74853515625, 6.6181640625, 7.48779296875, 8.357421875, 9.22705078125, 10.0966796875, 10.96630859375, 11.8359375, 12.70556640625, 13.5751953125, 14.44482421875, 15.314453125, 16.18408203125, 17.0537109375, 17.92333984375, 18.79296875, 19.66259765625, 20.5322265625, 21.40185546875, 22.271484375, 23.14111328125, 24.0107421875, 24.88037109375, 25.75]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 7.0, 11.0, 10.0, 27.0, 42.0, 54.0, 58.0, 107.0, 148.0, 211.0, 335.0, 472.0, 692.0, 1157.0, 1574.0, 2516.0, 4096.0, 6577.0, 10978.0, 18558.0, 31409.0, 55874.0, 95678.0, 153777.0, 201669.0, 178595.0, 116642.0, 69103.0, 39902.0, 22928.0, 13408.0, 8262.0, 4821.0, 3121.0, 1935.0, 1248.0, 846.0, 529.0, 388.0, 225.0, 165.0, 114.0, 92.0, 61.0, 37.0, 20.0, 21.0, 15.0, 5.0, 8.0, 8.0, 2.0, 2.0, 4.0, 3.0], "bins": [-13.640625, -13.23583984375, -12.8310546875, -12.42626953125, -12.021484375, -11.61669921875, -11.2119140625, -10.80712890625, -10.40234375, -9.99755859375, -9.5927734375, -9.18798828125, -8.783203125, -8.37841796875, -7.9736328125, -7.56884765625, -7.1640625, -6.75927734375, -6.3544921875, -5.94970703125, -5.544921875, -5.14013671875, -4.7353515625, -4.33056640625, -3.92578125, -3.52099609375, -3.1162109375, -2.71142578125, -2.306640625, -1.90185546875, -1.4970703125, -1.09228515625, -0.6875, -0.28271484375, 0.1220703125, 0.52685546875, 0.931640625, 1.33642578125, 1.7412109375, 2.14599609375, 2.55078125, 2.95556640625, 3.3603515625, 3.76513671875, 4.169921875, 4.57470703125, 4.9794921875, 5.38427734375, 5.7890625, 6.19384765625, 6.5986328125, 7.00341796875, 7.408203125, 7.81298828125, 8.2177734375, 8.62255859375, 9.02734375, 9.43212890625, 9.8369140625, 10.24169921875, 10.646484375, 11.05126953125, 11.4560546875, 11.86083984375, 12.265625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 0.0, 5.0, 4.0, 4.0, 9.0, 7.0, 10.0, 14.0, 5.0, 9.0, 12.0, 7.0, 11.0, 21.0, 17.0, 26.0, 31.0, 26.0, 26.0, 24.0, 37.0, 19.0, 36.0, 42.0, 29.0, 40.0, 36.0, 32.0, 48.0, 39.0, 38.0, 30.0, 30.0, 32.0, 27.0, 31.0, 25.0, 22.0, 11.0, 15.0, 29.0, 17.0, 14.0, 12.0, 6.0, 12.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.0546875, -12.6634521484375, -12.272216796875, -11.8809814453125, -11.48974609375, -11.0985107421875, -10.707275390625, -10.3160400390625, -9.9248046875, -9.5335693359375, -9.142333984375, -8.7510986328125, -8.35986328125, -7.9686279296875, -7.577392578125, -7.1861572265625, -6.794921875, -6.4036865234375, -6.012451171875, -5.6212158203125, -5.22998046875, -4.8387451171875, -4.447509765625, -4.0562744140625, -3.6650390625, -3.2738037109375, -2.882568359375, -2.4913330078125, -2.10009765625, -1.7088623046875, -1.317626953125, -0.9263916015625, -0.53515625, -0.1439208984375, 0.247314453125, 0.6385498046875, 1.02978515625, 1.4210205078125, 1.812255859375, 2.2034912109375, 2.5947265625, 2.9859619140625, 3.377197265625, 3.7684326171875, 4.15966796875, 4.5509033203125, 4.942138671875, 5.3333740234375, 5.724609375, 6.1158447265625, 6.507080078125, 6.8983154296875, 7.28955078125, 7.6807861328125, 8.072021484375, 8.4632568359375, 8.8544921875, 9.2457275390625, 9.636962890625, 10.0281982421875, 10.41943359375, 10.8106689453125, 11.201904296875, 11.5931396484375, 11.984375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 1.0, 6.0, 9.0, 14.0, 19.0, 32.0, 36.0, 69.0, 67.0, 96.0, 192.0, 257.0, 388.0, 607.0, 961.0, 1467.0, 2269.0, 3671.0, 6106.0, 10475.0, 18559.0, 33853.0, 65014.0, 123691.0, 209028.0, 233622.0, 155084.0, 83230.0, 43791.0, 23270.0, 13000.0, 7484.0, 4512.0, 2768.0, 1763.0, 1075.0, 674.0, 471.0, 288.0, 193.0, 144.0, 92.0, 67.0, 44.0, 27.0, 21.0, 16.0, 13.0, 6.0, 1.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-6.5390625, -6.32940673828125, -6.1197509765625, -5.91009521484375, -5.700439453125, -5.49078369140625, -5.2811279296875, -5.07147216796875, -4.86181640625, -4.65216064453125, -4.4425048828125, -4.23284912109375, -4.023193359375, -3.81353759765625, -3.6038818359375, -3.39422607421875, -3.1845703125, -2.97491455078125, -2.7652587890625, -2.55560302734375, -2.345947265625, -2.13629150390625, -1.9266357421875, -1.71697998046875, -1.50732421875, -1.29766845703125, -1.0880126953125, -0.87835693359375, -0.668701171875, -0.45904541015625, -0.2493896484375, -0.03973388671875, 0.169921875, 0.37957763671875, 0.5892333984375, 0.79888916015625, 1.008544921875, 1.21820068359375, 1.4278564453125, 1.63751220703125, 1.84716796875, 2.05682373046875, 2.2664794921875, 2.47613525390625, 2.685791015625, 2.89544677734375, 3.1051025390625, 3.31475830078125, 3.5244140625, 3.73406982421875, 3.9437255859375, 4.15338134765625, 4.363037109375, 4.57269287109375, 4.7823486328125, 4.99200439453125, 5.20166015625, 5.41131591796875, 5.6209716796875, 5.83062744140625, 6.040283203125, 6.24993896484375, 6.4595947265625, 6.66925048828125, 6.87890625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 13.0, 13.0, 10.0, 18.0, 23.0, 17.0, 33.0, 41.0, 46.0, 61.0, 62.0, 64.0, 62.0, 63.0, 72.0, 76.0, 65.0, 48.0, 28.0, 42.0, 32.0, 27.0, 16.0, 15.0, 17.0, 4.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003056526184082031, -0.00029353052377700806, -0.000281408429145813, -0.0002692863345146179, -0.00025716423988342285, -0.0002450421452522278, -0.00023292005062103271, -0.00022079795598983765, -0.00020867586135864258, -0.0001965537667274475, -0.00018443167209625244, -0.00017230957746505737, -0.0001601874828338623, -0.00014806538820266724, -0.00013594329357147217, -0.0001238211989402771, -0.00011169910430908203, -9.957700967788696e-05, -8.74549150466919e-05, -7.533282041549683e-05, -6.321072578430176e-05, -5.108863115310669e-05, -3.896653652191162e-05, -2.6844441890716553e-05, -1.4722347259521484e-05, -2.600252628326416e-06, 9.521842002868652e-06, 2.164393663406372e-05, 3.376603126525879e-05, 4.588812589645386e-05, 5.8010220527648926e-05, 7.0132315158844e-05, 8.225440979003906e-05, 9.437650442123413e-05, 0.0001064985990524292, 0.00011862069368362427, 0.00013074278831481934, 0.0001428648829460144, 0.00015498697757720947, 0.00016710907220840454, 0.0001792311668395996, 0.00019135326147079468, 0.00020347535610198975, 0.00021559745073318481, 0.00022771954536437988, 0.00023984163999557495, 0.00025196373462677, 0.0002640858292579651, 0.00027620792388916016, 0.0002883300185203552, 0.0003004521131515503, 0.00031257420778274536, 0.00032469630241394043, 0.0003368183970451355, 0.00034894049167633057, 0.00036106258630752563, 0.0003731846809387207, 0.00038530677556991577, 0.00039742887020111084, 0.0004095509648323059, 0.000421673059463501, 0.00043379515409469604, 0.0004459172487258911, 0.0004580393433570862, 0.00047016143798828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 10.0, 11.0, 16.0, 25.0, 40.0, 65.0, 76.0, 140.0, 176.0, 282.0, 359.0, 519.0, 844.0, 1180.0, 1820.0, 2567.0, 3877.0, 6211.0, 9707.0, 15499.0, 24421.0, 39734.0, 64272.0, 99759.0, 144216.0, 172115.0, 155357.0, 111346.0, 72703.0, 44825.0, 27838.0, 17123.0, 10846.0, 6982.0, 4487.0, 3048.0, 1979.0, 1247.0, 878.0, 602.0, 437.0, 286.0, 174.0, 143.0, 88.0, 79.0, 43.0, 34.0, 17.0, 19.0, 11.0, 13.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0], "bins": [-6.203125, -6.00701904296875, -5.8109130859375, -5.61480712890625, -5.418701171875, -5.22259521484375, -5.0264892578125, -4.83038330078125, -4.63427734375, -4.43817138671875, -4.2420654296875, -4.04595947265625, -3.849853515625, -3.65374755859375, -3.4576416015625, -3.26153564453125, -3.0654296875, -2.86932373046875, -2.6732177734375, -2.47711181640625, -2.281005859375, -2.08489990234375, -1.8887939453125, -1.69268798828125, -1.49658203125, -1.30047607421875, -1.1043701171875, -0.90826416015625, -0.712158203125, -0.51605224609375, -0.3199462890625, -0.12384033203125, 0.072265625, 0.26837158203125, 0.4644775390625, 0.66058349609375, 0.856689453125, 1.05279541015625, 1.2489013671875, 1.44500732421875, 1.64111328125, 1.83721923828125, 2.0333251953125, 2.22943115234375, 2.425537109375, 2.62164306640625, 2.8177490234375, 3.01385498046875, 3.2099609375, 3.40606689453125, 3.6021728515625, 3.79827880859375, 3.994384765625, 4.19049072265625, 4.3865966796875, 4.58270263671875, 4.77880859375, 4.97491455078125, 5.1710205078125, 5.36712646484375, 5.563232421875, 5.75933837890625, 5.9554443359375, 6.15155029296875, 6.34765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 7.0, 9.0, 9.0, 16.0, 12.0, 19.0, 27.0, 26.0, 30.0, 36.0, 42.0, 50.0, 56.0, 59.0, 65.0, 69.0, 55.0, 69.0, 51.0, 62.0, 55.0, 36.0, 24.0, 24.0, 23.0, 18.0, 6.0, 18.0, 6.0, 7.0, 4.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9228515625, -1.8580169677734375, -1.793182373046875, -1.7283477783203125, -1.66351318359375, -1.5986785888671875, -1.533843994140625, -1.4690093994140625, -1.4041748046875, -1.3393402099609375, -1.274505615234375, -1.2096710205078125, -1.14483642578125, -1.0800018310546875, -1.015167236328125, -0.9503326416015625, -0.885498046875, -0.8206634521484375, -0.755828857421875, -0.6909942626953125, -0.62615966796875, -0.5613250732421875, -0.496490478515625, -0.4316558837890625, -0.3668212890625, -0.3019866943359375, -0.237152099609375, -0.1723175048828125, -0.10748291015625, -0.0426483154296875, 0.022186279296875, 0.0870208740234375, 0.15185546875, 0.2166900634765625, 0.281524658203125, 0.3463592529296875, 0.41119384765625, 0.4760284423828125, 0.540863037109375, 0.6056976318359375, 0.6705322265625, 0.7353668212890625, 0.800201416015625, 0.8650360107421875, 0.92987060546875, 0.9947052001953125, 1.059539794921875, 1.1243743896484375, 1.189208984375, 1.2540435791015625, 1.318878173828125, 1.3837127685546875, 1.44854736328125, 1.5133819580078125, 1.578216552734375, 1.6430511474609375, 1.7078857421875, 1.7727203369140625, 1.837554931640625, 1.9023895263671875, 1.96722412109375, 2.0320587158203125, 2.096893310546875, 2.1617279052734375, 2.2265625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 6.0, 5.0, 13.0, 18.0, 14.0, 27.0, 30.0, 22.0, 39.0, 46.0, 71.0, 72.0, 70.0, 76.0, 74.0, 88.0, 60.0, 53.0, 42.0, 38.0, 26.0, 22.0, 16.0, 18.0, 11.0, 6.0, 9.0, 5.0, 7.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.864013671875, -43.24891662597656, -41.63382339477539, -40.01872634887695, -38.40363311767578, -36.788536071777344, -35.173439025878906, -33.558345794677734, -31.94325065612793, -30.328155517578125, -28.71306037902832, -27.097965240478516, -25.482868194580078, -23.867774963378906, -22.25267791748047, -20.637582778930664, -19.02248764038086, -17.407392501831055, -15.79229736328125, -14.177201271057129, -12.562106132507324, -10.94701099395752, -9.331914901733398, -7.716819763183594, -6.101724624633789, -4.486629486083984, -2.8715338706970215, -1.2564382553100586, 0.3586568832397461, 1.9737520217895508, 3.588848114013672, 5.203943252563477, 6.819042205810547, 8.434137344360352, 10.049232482910156, 11.664328575134277, 13.279423713684082, 14.894518852233887, 16.509614944458008, 18.124710083007812, 19.739805221557617, 21.354900360107422, 22.969995498657227, 24.58509063720703, 26.20018768310547, 27.81528091430664, 29.430377960205078, 31.045473098754883, 32.66056823730469, 34.275665283203125, 35.8907585144043, 37.505855560302734, 39.120948791503906, 40.736045837402344, 42.35114288330078, 43.96623611450195, 45.581329345703125, 47.19642639160156, 48.811519622802734, 50.42661666870117, 52.041709899902344, 53.65680694580078, 55.27190399169922, 56.88699722290039, 58.50209426879883]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 10.0, 6.0, 8.0, 9.0, 13.0, 15.0, 23.0, 23.0, 22.0, 30.0, 30.0, 38.0, 32.0, 53.0, 39.0, 45.0, 46.0, 40.0, 43.0, 43.0, 53.0, 50.0, 53.0, 38.0, 31.0, 23.0, 35.0, 18.0, 22.0, 20.0, 13.0, 13.0, 12.0, 12.0, 9.0, 11.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.110742568969727, -23.335065841674805, -22.559389114379883, -21.78371238708496, -21.00803565979004, -20.232358932495117, -19.456684112548828, -18.681007385253906, -17.905330657958984, -17.129653930664062, -16.35397720336914, -15.578300476074219, -14.802623748779297, -14.026947021484375, -13.25127124786377, -12.475594520568848, -11.69991683959961, -10.924240112304688, -10.148563385009766, -9.372886657714844, -8.597209930419922, -7.821533679962158, -7.0458574295043945, -6.270180702209473, -5.494503974914551, -4.718827247619629, -3.943150758743286, -3.1674742698669434, -2.3917975425720215, -1.6161208152770996, -0.8404445648193359, -0.06476783752441406, 0.7109088897705078, 1.4865854978561401, 2.2622621059417725, 3.0379385948181152, 3.813615322113037, 4.589292049407959, 5.364968299865723, 6.1406450271606445, 6.916321754455566, 7.691998481750488, 8.46767520904541, 9.243350982666016, 10.019027709960938, 10.79470443725586, 11.570381164550781, 12.346057891845703, 13.121734619140625, 13.897411346435547, 14.673088073730469, 15.44876480102539, 16.224441528320312, 17.000118255615234, 17.775794982910156, 18.551471710205078, 19.3271484375, 20.102825164794922, 20.878501892089844, 21.654178619384766, 22.429855346679688, 23.20553207397461, 23.98120880126953, 24.756885528564453, 25.532560348510742]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 9.0, 5.0, 9.0, 16.0, 29.0, 29.0, 52.0, 69.0, 95.0, 131.0, 231.0, 348.0, 478.0, 847.0, 1372.0, 2251.0, 3959.0, 7105.0, 13813.0, 25747.0, 50346.0, 96637.0, 171220.0, 228868.0, 195814.0, 118230.0, 61782.0, 31944.0, 16502.0, 8936.0, 4743.0, 2741.0, 1577.0, 941.0, 617.0, 350.0, 226.0, 163.0, 105.0, 70.0, 51.0, 37.0, 20.0, 13.0, 13.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.796875, -24.896728515625, -23.99658203125, -23.096435546875, -22.1962890625, -21.296142578125, -20.39599609375, -19.495849609375, -18.595703125, -17.695556640625, -16.79541015625, -15.895263671875, -14.9951171875, -14.094970703125, -13.19482421875, -12.294677734375, -11.39453125, -10.494384765625, -9.59423828125, -8.694091796875, -7.7939453125, -6.893798828125, -5.99365234375, -5.093505859375, -4.193359375, -3.293212890625, -2.39306640625, -1.492919921875, -0.5927734375, 0.307373046875, 1.20751953125, 2.107666015625, 3.0078125, 3.907958984375, 4.80810546875, 5.708251953125, 6.6083984375, 7.508544921875, 8.40869140625, 9.308837890625, 10.208984375, 11.109130859375, 12.00927734375, 12.909423828125, 13.8095703125, 14.709716796875, 15.60986328125, 16.510009765625, 17.41015625, 18.310302734375, 19.21044921875, 20.110595703125, 21.0107421875, 21.910888671875, 22.81103515625, 23.711181640625, 24.611328125, 25.511474609375, 26.41162109375, 27.311767578125, 28.2119140625, 29.112060546875, 30.01220703125, 30.912353515625, 31.8125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 3.0, 12.0, 9.0, 14.0, 17.0, 26.0, 34.0, 30.0, 33.0, 36.0, 46.0, 30.0, 48.0, 34.0, 41.0, 47.0, 53.0, 43.0, 48.0, 55.0, 48.0, 35.0, 34.0, 22.0, 24.0, 23.0, 25.0, 19.0, 11.0, 5.0, 24.0, 13.0, 7.0, 9.0, 2.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.21875, -26.36767578125, -25.5166015625, -24.66552734375, -23.814453125, -22.96337890625, -22.1123046875, -21.26123046875, -20.41015625, -19.55908203125, -18.7080078125, -17.85693359375, -17.005859375, -16.15478515625, -15.3037109375, -14.45263671875, -13.6015625, -12.75048828125, -11.8994140625, -11.04833984375, -10.197265625, -9.34619140625, -8.4951171875, -7.64404296875, -6.79296875, -5.94189453125, -5.0908203125, -4.23974609375, -3.388671875, -2.53759765625, -1.6865234375, -0.83544921875, 0.015625, 0.86669921875, 1.7177734375, 2.56884765625, 3.419921875, 4.27099609375, 5.1220703125, 5.97314453125, 6.82421875, 7.67529296875, 8.5263671875, 9.37744140625, 10.228515625, 11.07958984375, 11.9306640625, 12.78173828125, 13.6328125, 14.48388671875, 15.3349609375, 16.18603515625, 17.037109375, 17.88818359375, 18.7392578125, 19.59033203125, 20.44140625, 21.29248046875, 22.1435546875, 22.99462890625, 23.845703125, 24.69677734375, 25.5478515625, 26.39892578125, 27.25]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 6.0, 3.0, 12.0, 23.0, 25.0, 33.0, 53.0, 86.0, 124.0, 195.0, 245.0, 402.0, 655.0, 933.0, 1411.0, 2251.0, 3514.0, 5687.0, 9314.0, 15940.0, 26994.0, 46817.0, 82358.0, 137563.0, 196647.0, 194190.0, 133377.0, 79101.0, 45430.0, 25578.0, 15156.0, 9098.0, 5619.0, 3359.0, 2199.0, 1446.0, 934.0, 600.0, 376.0, 260.0, 187.0, 139.0, 73.0, 41.0, 39.0, 13.0, 16.0, 10.0, 14.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.25732421875, -30.1396484375, -29.02197265625, -27.904296875, -26.78662109375, -25.6689453125, -24.55126953125, -23.43359375, -22.31591796875, -21.1982421875, -20.08056640625, -18.962890625, -17.84521484375, -16.7275390625, -15.60986328125, -14.4921875, -13.37451171875, -12.2568359375, -11.13916015625, -10.021484375, -8.90380859375, -7.7861328125, -6.66845703125, -5.55078125, -4.43310546875, -3.3154296875, -2.19775390625, -1.080078125, 0.03759765625, 1.1552734375, 2.27294921875, 3.390625, 4.50830078125, 5.6259765625, 6.74365234375, 7.861328125, 8.97900390625, 10.0966796875, 11.21435546875, 12.33203125, 13.44970703125, 14.5673828125, 15.68505859375, 16.802734375, 17.92041015625, 19.0380859375, 20.15576171875, 21.2734375, 22.39111328125, 23.5087890625, 24.62646484375, 25.744140625, 26.86181640625, 27.9794921875, 29.09716796875, 30.21484375, 31.33251953125, 32.4501953125, 33.56787109375, 34.685546875, 35.80322265625, 36.9208984375, 38.03857421875, 39.15625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 9.0, 13.0, 11.0, 10.0, 16.0, 19.0, 27.0, 30.0, 31.0, 34.0, 29.0, 28.0, 33.0, 38.0, 29.0, 34.0, 43.0, 44.0, 48.0, 41.0, 37.0, 27.0, 31.0, 35.0, 34.0, 39.0, 34.0, 28.0, 22.0, 15.0, 21.0, 18.0, 14.0, 12.0, 8.0, 11.0, 8.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.8984375, -14.4100341796875, -13.921630859375, -13.4332275390625, -12.94482421875, -12.4564208984375, -11.968017578125, -11.4796142578125, -10.9912109375, -10.5028076171875, -10.014404296875, -9.5260009765625, -9.03759765625, -8.5491943359375, -8.060791015625, -7.5723876953125, -7.083984375, -6.5955810546875, -6.107177734375, -5.6187744140625, -5.13037109375, -4.6419677734375, -4.153564453125, -3.6651611328125, -3.1767578125, -2.6883544921875, -2.199951171875, -1.7115478515625, -1.22314453125, -0.7347412109375, -0.246337890625, 0.2420654296875, 0.73046875, 1.2188720703125, 1.707275390625, 2.1956787109375, 2.68408203125, 3.1724853515625, 3.660888671875, 4.1492919921875, 4.6376953125, 5.1260986328125, 5.614501953125, 6.1029052734375, 6.59130859375, 7.0797119140625, 7.568115234375, 8.0565185546875, 8.544921875, 9.0333251953125, 9.521728515625, 10.0101318359375, 10.49853515625, 10.9869384765625, 11.475341796875, 11.9637451171875, 12.4521484375, 12.9405517578125, 13.428955078125, 13.9173583984375, 14.40576171875, 14.8941650390625, 15.382568359375, 15.8709716796875, 16.359375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 5.0, 9.0, 10.0, 16.0, 24.0, 46.0, 68.0, 97.0, 139.0, 248.0, 334.0, 616.0, 1026.0, 2013.0, 4352.0, 10522.0, 27846.0, 77723.0, 197642.0, 320983.0, 240492.0, 102394.0, 37139.0, 13823.0, 5480.0, 2446.0, 1179.0, 679.0, 412.0, 262.0, 186.0, 105.0, 72.0, 56.0, 23.0, 32.0, 20.0, 11.0, 7.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.421875, -22.7255859375, -22.029296875, -21.3330078125, -20.63671875, -19.9404296875, -19.244140625, -18.5478515625, -17.8515625, -17.1552734375, -16.458984375, -15.7626953125, -15.06640625, -14.3701171875, -13.673828125, -12.9775390625, -12.28125, -11.5849609375, -10.888671875, -10.1923828125, -9.49609375, -8.7998046875, -8.103515625, -7.4072265625, -6.7109375, -6.0146484375, -5.318359375, -4.6220703125, -3.92578125, -3.2294921875, -2.533203125, -1.8369140625, -1.140625, -0.4443359375, 0.251953125, 0.9482421875, 1.64453125, 2.3408203125, 3.037109375, 3.7333984375, 4.4296875, 5.1259765625, 5.822265625, 6.5185546875, 7.21484375, 7.9111328125, 8.607421875, 9.3037109375, 10.0, 10.6962890625, 11.392578125, 12.0888671875, 12.78515625, 13.4814453125, 14.177734375, 14.8740234375, 15.5703125, 16.2666015625, 16.962890625, 17.6591796875, 18.35546875, 19.0517578125, 19.748046875, 20.4443359375, 21.140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 5.0, 3.0, 5.0, 8.0, 9.0, 15.0, 21.0, 25.0, 27.0, 30.0, 41.0, 52.0, 78.0, 74.0, 96.0, 82.0, 83.0, 69.0, 66.0, 46.0, 39.0, 32.0, 20.0, 19.0, 8.0, 9.0, 7.0, 4.0, 4.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002193450927734375, -0.0021353960037231445, -0.002077341079711914, -0.0020192861557006836, -0.001961231231689453, -0.0019031763076782227, -0.0018451213836669922, -0.0017870664596557617, -0.0017290115356445312, -0.0016709566116333008, -0.0016129016876220703, -0.0015548467636108398, -0.0014967918395996094, -0.001438736915588379, -0.0013806819915771484, -0.001322627067565918, -0.0012645721435546875, -0.001206517219543457, -0.0011484622955322266, -0.001090407371520996, -0.0010323524475097656, -0.0009742975234985352, -0.0009162425994873047, -0.0008581876754760742, -0.0008001327514648438, -0.0007420778274536133, -0.0006840229034423828, -0.0006259679794311523, -0.0005679130554199219, -0.0005098581314086914, -0.00045180320739746094, -0.00039374828338623047, -0.000335693359375, -0.00027763843536376953, -0.00021958351135253906, -0.0001615285873413086, -0.00010347366333007812, -4.5418739318847656e-05, 1.2636184692382812e-05, 7.069110870361328e-05, 0.00012874603271484375, 0.00018680095672607422, 0.0002448558807373047, 0.00030291080474853516, 0.0003609657287597656, 0.0004190206527709961, 0.00047707557678222656, 0.000535130500793457, 0.0005931854248046875, 0.000651240348815918, 0.0007092952728271484, 0.0007673501968383789, 0.0008254051208496094, 0.0008834600448608398, 0.0009415149688720703, 0.0009995698928833008, 0.0010576248168945312, 0.0011156797409057617, 0.0011737346649169922, 0.0012317895889282227, 0.0012898445129394531, 0.0013478994369506836, 0.001405954360961914, 0.0014640092849731445, 0.001522064208984375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 10.0, 22.0, 32.0, 35.0, 57.0, 78.0, 137.0, 237.0, 366.0, 574.0, 870.0, 1438.0, 2468.0, 4233.0, 8086.0, 14993.0, 29194.0, 56448.0, 106427.0, 175558.0, 218944.0, 184485.0, 114148.0, 61612.0, 31657.0, 16245.0, 8589.0, 4764.0, 2668.0, 1552.0, 1013.0, 563.0, 367.0, 236.0, 141.0, 102.0, 69.0, 46.0, 33.0, 15.0, 13.0, 11.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-12.9453125, -12.5074462890625, -12.069580078125, -11.6317138671875, -11.19384765625, -10.7559814453125, -10.318115234375, -9.8802490234375, -9.4423828125, -9.0045166015625, -8.566650390625, -8.1287841796875, -7.69091796875, -7.2530517578125, -6.815185546875, -6.3773193359375, -5.939453125, -5.5015869140625, -5.063720703125, -4.6258544921875, -4.18798828125, -3.7501220703125, -3.312255859375, -2.8743896484375, -2.4365234375, -1.9986572265625, -1.560791015625, -1.1229248046875, -0.68505859375, -0.2471923828125, 0.190673828125, 0.6285400390625, 1.06640625, 1.5042724609375, 1.942138671875, 2.3800048828125, 2.81787109375, 3.2557373046875, 3.693603515625, 4.1314697265625, 4.5693359375, 5.0072021484375, 5.445068359375, 5.8829345703125, 6.32080078125, 6.7586669921875, 7.196533203125, 7.6343994140625, 8.072265625, 8.5101318359375, 8.947998046875, 9.3858642578125, 9.82373046875, 10.2615966796875, 10.699462890625, 11.1373291015625, 11.5751953125, 12.0130615234375, 12.450927734375, 12.8887939453125, 13.32666015625, 13.7645263671875, 14.202392578125, 14.6402587890625, 15.078125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 8.0, 17.0, 16.0, 19.0, 17.0, 22.0, 29.0, 33.0, 52.0, 43.0, 54.0, 72.0, 69.0, 61.0, 61.0, 62.0, 51.0, 34.0, 38.0, 41.0, 45.0, 28.0, 24.0, 17.0, 12.0, 20.0, 8.0, 6.0, 8.0, 1.0, 4.0, 2.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.080078125, -2.9742431640625, -2.868408203125, -2.7625732421875, -2.65673828125, -2.5509033203125, -2.445068359375, -2.3392333984375, -2.2333984375, -2.1275634765625, -2.021728515625, -1.9158935546875, -1.81005859375, -1.7042236328125, -1.598388671875, -1.4925537109375, -1.38671875, -1.2808837890625, -1.175048828125, -1.0692138671875, -0.96337890625, -0.8575439453125, -0.751708984375, -0.6458740234375, -0.5400390625, -0.4342041015625, -0.328369140625, -0.2225341796875, -0.11669921875, -0.0108642578125, 0.094970703125, 0.2008056640625, 0.306640625, 0.4124755859375, 0.518310546875, 0.6241455078125, 0.72998046875, 0.8358154296875, 0.941650390625, 1.0474853515625, 1.1533203125, 1.2591552734375, 1.364990234375, 1.4708251953125, 1.57666015625, 1.6824951171875, 1.788330078125, 1.8941650390625, 2.0, 2.1058349609375, 2.211669921875, 2.3175048828125, 2.42333984375, 2.5291748046875, 2.635009765625, 2.7408447265625, 2.8466796875, 2.9525146484375, 3.058349609375, 3.1641845703125, 3.27001953125, 3.3758544921875, 3.481689453125, 3.5875244140625, 3.693359375]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 3.0, 10.0, 13.0, 11.0, 27.0, 24.0, 26.0, 37.0, 46.0, 46.0, 76.0, 60.0, 71.0, 77.0, 72.0, 72.0, 53.0, 41.0, 42.0, 42.0, 28.0, 20.0, 18.0, 19.0, 12.0, 15.0, 6.0, 6.0, 4.0, 0.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.69246292114258, -41.01814270019531, -39.34382629394531, -37.66950988769531, -35.99518966674805, -34.32086944580078, -32.64655303955078, -30.97223472595215, -29.297916412353516, -27.623598098754883, -25.94927978515625, -24.274961471557617, -22.600643157958984, -20.92632484436035, -19.25200653076172, -17.577688217163086, -15.903369903564453, -14.22905158996582, -12.554733276367188, -10.880414962768555, -9.206096649169922, -7.531778335571289, -5.857460021972656, -4.183141708374023, -2.5088233947753906, -0.8345050811767578, 0.839813232421875, 2.514131546020508, 4.188449859619141, 5.862768173217773, 7.537086486816406, 9.211404800415039, 10.885726928710938, 12.56004524230957, 14.234363555908203, 15.908681869506836, 17.58300018310547, 19.2573184967041, 20.931636810302734, 22.605955123901367, 24.2802734375, 25.954591751098633, 27.628910064697266, 29.3032283782959, 30.97754669189453, 32.65186309814453, 34.3261833190918, 36.00050354003906, 37.67481994628906, 39.34913635253906, 41.02345657348633, 42.697776794433594, 44.372093200683594, 46.046409606933594, 47.72072982788086, 49.395050048828125, 51.069366455078125, 52.743682861328125, 54.41800308227539, 56.092323303222656, 57.766639709472656, 59.440956115722656, 61.11527633666992, 62.78959655761719, 64.46391296386719]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 9.0, 1.0, 12.0, 15.0, 8.0, 18.0, 18.0, 24.0, 31.0, 32.0, 35.0, 46.0, 46.0, 49.0, 40.0, 39.0, 60.0, 43.0, 50.0, 61.0, 50.0, 43.0, 44.0, 34.0, 38.0, 29.0, 22.0, 26.0, 9.0, 14.0, 13.0, 9.0, 11.0, 4.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.47378158569336, -34.3286018371582, -33.18342208862305, -32.03824234008789, -30.893062591552734, -29.747882843017578, -28.60270118713379, -27.457521438598633, -26.312341690063477, -25.16716194152832, -24.021982192993164, -22.876802444458008, -21.73162078857422, -20.586441040039062, -19.441261291503906, -18.29608154296875, -17.150901794433594, -16.005722045898438, -14.860542297363281, -13.715361595153809, -12.570181846618652, -11.425002098083496, -10.279821395874023, -9.134641647338867, -7.989461898803711, -6.844282150268555, -5.69910192489624, -4.553921699523926, -3.4087419509887695, -2.2635622024536133, -1.1183819770812988, 0.026798248291015625, 1.1719818115234375, 2.317161798477173, 3.462341785430908, 4.607522010803223, 5.752701759338379, 6.897881507873535, 8.043062210083008, 9.188241958618164, 10.33342170715332, 11.478601455688477, 12.623781204223633, 13.768961906433105, 14.914141654968262, 16.059322357177734, 17.20450210571289, 18.349681854248047, 19.494861602783203, 20.64004135131836, 21.785221099853516, 22.930400848388672, 24.075580596923828, 25.220760345458984, 26.365942001342773, 27.51112174987793, 28.656301498413086, 29.801481246948242, 30.9466609954834, 32.09184265136719, 33.237022399902344, 34.3822021484375, 35.527381896972656, 36.67256164550781, 37.81774139404297]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 8.0, 7.0, 14.0, 12.0, 18.0, 23.0, 39.0, 51.0, 56.0, 47.0, 86.0, 111.0, 181.0, 229.0, 385.0, 588.0, 1023.0, 2112.0, 5848.0, 499078.0, 8256.0, 2775.0, 1200.0, 698.0, 420.0, 256.0, 170.0, 141.0, 94.0, 75.0, 54.0, 41.0, 37.0, 26.0, 22.0, 14.0, 12.0, 13.0, 7.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-657.5618286132812, -635.3809204101562, -613.199951171875, -591.01904296875, -568.838134765625, -546.6572265625, -524.4762573242188, -502.29534912109375, -480.1144104003906, -457.9334716796875, -435.7525634765625, -413.5716247558594, -391.39068603515625, -369.20977783203125, -347.0288391113281, -324.847900390625, -302.6669921875, -280.4860534667969, -258.3051452636719, -236.12420654296875, -213.9432830810547, -191.76235961914062, -169.5814208984375, -147.40049743652344, -125.21957397460938, -103.03865051269531, -80.85771942138672, -58.676788330078125, -36.49586486816406, -14.31494140625, 7.865997314453125, 30.046920776367188, 52.22784423828125, 74.40876770019531, 96.5896987915039, 118.7706298828125, 140.95155334472656, 163.13247680664062, 185.31341552734375, 207.4943389892578, 229.67526245117188, 251.85618591308594, 274.037109375, 296.2180480957031, 318.39898681640625, 340.57989501953125, 362.7608337402344, 384.9417724609375, 407.1226806640625, 429.3036193847656, 451.4845275878906, 473.66546630859375, 495.84637451171875, 518.02734375, 540.208251953125, 562.38916015625, 584.570068359375, 606.7509765625, 628.9319458007812, 651.1128540039062, 673.2937622070312, 695.4747314453125, 717.6556396484375, 739.8365478515625, 762.0175170898438]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 6.0, 5.0, 15.0, 11.0, 8.0, 23.0, 15.0, 23.0, 33.0, 37.0, 32.0, 45.0, 60.0, 36.0, 40.0, 48.0, 1080.0, 45.0, 41.0, 62.0, 52.0, 46.0, 40.0, 30.0, 40.0, 29.0, 20.0, 21.0, 12.0, 12.0, 18.0, 4.0, 12.0, 4.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1096.271728515625, -1060.7425537109375, -1025.21337890625, -989.6842041015625, -954.1550903320312, -918.6259155273438, -883.0967407226562, -847.5675659179688, -812.0384521484375, -776.50927734375, -740.9801025390625, -705.450927734375, -669.9218139648438, -634.3926391601562, -598.8634643554688, -563.3342895507812, -527.8051147460938, -492.27593994140625, -456.7467956542969, -421.2176208496094, -385.6884765625, -350.1593017578125, -314.630126953125, -279.1009521484375, -243.57180786132812, -208.0426483154297, -172.51348876953125, -136.98431396484375, -101.45515441894531, -65.92599487304688, -30.396820068359375, 5.1323394775390625, 40.6614990234375, 76.19065856933594, 111.7198257446289, 147.24899291992188, 182.7781524658203, 218.30731201171875, 253.83648681640625, 289.36566162109375, 324.8948059082031, 360.4239807128906, 395.953125, 431.4822998046875, 467.011474609375, 502.5406188964844, 538.06982421875, 573.5989379882812, 609.1281127929688, 644.6572875976562, 680.1864624023438, 715.715576171875, 751.2447509765625, 786.77392578125, 822.3031005859375, 857.832275390625, 893.3614501953125, 928.890625, 964.4197998046875, 999.948974609375, 1035.4781494140625, 1071.00732421875, 1106.536376953125, 1142.0655517578125, 1177.5947265625]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 2.0, 9.0, 13.0, 7.0, 13.0, 13.0, 15.0, 32.0, 44.0, 66.0, 56.0, 66.0, 117.0, 157.0, 237.0, 458.0, 1001.0, 2305.0, 5516.0, 11046.0, 20476.0, 31079760.0, 99038.0, 27229.0, 3810.0, 1166.0, 606.0, 372.0, 223.0, 161.0, 113.0, 86.0, 57.0, 43.0, 44.0, 22.0, 29.0, 19.0, 22.0, 5.0, 10.0, 6.0, 11.0, 3.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-708.4880981445312, -685.5228271484375, -662.5575561523438, -639.59228515625, -616.6270141601562, -593.6617431640625, -570.6964721679688, -547.731201171875, -524.7659301757812, -501.8006591796875, -478.83538818359375, -455.8701171875, -432.90484619140625, -409.9395751953125, -386.97430419921875, -364.009033203125, -341.0437927246094, -318.0785217285156, -295.1132507324219, -272.1479797363281, -249.18270874023438, -226.21743774414062, -203.25218200683594, -180.2869110107422, -157.32164001464844, -134.3563690185547, -111.39109802246094, -88.42583465576172, -65.46056365966797, -42.49529266357422, -19.530029296875, 3.43524169921875, 26.4005126953125, 49.36578369140625, 72.3310546875, 95.29631805419922, 118.26158905029297, 141.22686767578125, 164.19212341308594, 187.1573944091797, 210.12266540527344, 233.0879364013672, 256.0531921386719, 279.0184631347656, 301.9837341308594, 324.9490051269531, 347.9142761230469, 370.8795471191406, 393.8448181152344, 416.8100891113281, 439.7753601074219, 462.7406311035156, 485.7059020996094, 508.6711730957031, 531.6364135742188, 554.6016845703125, 577.5669555664062, 600.5322265625, 623.4974975585938, 646.4627685546875, 669.4280395507812, 692.393310546875, 715.3585815429688, 738.3238525390625, 761.2891235351562]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 6.0, 12.0, 18.0, 40.0, 47.0, 59.0, 98.0, 158.0, 210.0, 329.0, 515.0, 860.0, 1310.0, 2168.0, 3581.0, 6264.0, 10968.0, 20173.0, 38774.0, 79661.0, 174501.0, 430603.0, 1210587.0, 2462732.0, 1124170.0, 404186.0, 164573.0, 74661.0, 36170.0, 19091.0, 10264.0, 5843.0, 3394.0, 2002.0, 1246.0, 737.0, 508.0, 337.0, 186.0, 123.0, 91.0, 55.0, 39.0, 27.0, 17.0, 14.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-62.625, -60.75341796875, -58.8818359375, -57.01025390625, -55.138671875, -53.26708984375, -51.3955078125, -49.52392578125, -47.65234375, -45.78076171875, -43.9091796875, -42.03759765625, -40.166015625, -38.29443359375, -36.4228515625, -34.55126953125, -32.6796875, -30.80810546875, -28.9365234375, -27.06494140625, -25.193359375, -23.32177734375, -21.4501953125, -19.57861328125, -17.70703125, -15.83544921875, -13.9638671875, -12.09228515625, -10.220703125, -8.34912109375, -6.4775390625, -4.60595703125, -2.734375, -0.86279296875, 1.0087890625, 2.88037109375, 4.751953125, 6.62353515625, 8.4951171875, 10.36669921875, 12.23828125, 14.10986328125, 15.9814453125, 17.85302734375, 19.724609375, 21.59619140625, 23.4677734375, 25.33935546875, 27.2109375, 29.08251953125, 30.9541015625, 32.82568359375, 34.697265625, 36.56884765625, 38.4404296875, 40.31201171875, 42.18359375, 44.05517578125, 45.9267578125, 47.79833984375, 49.669921875, 51.54150390625, 53.4130859375, 55.28466796875, 57.15625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 10.0, 4.0, 11.0, 15.0, 15.0, 20.0, 17.0, 32.0, 34.0, 33.0, 56.0, 49.0, 63.0, 63.0, 87.0, 121.0, 125.0, 147.0, 134.0, 141.0, 109.0, 108.0, 82.0, 93.0, 61.0, 66.0, 67.0, 47.0, 27.0, 28.0, 19.0, 22.0, 30.0, 14.0, 11.0, 12.0, 11.0, 5.0, 9.0, 5.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.265625, -17.69189453125, -17.1181640625, -16.54443359375, -15.970703125, -15.39697265625, -14.8232421875, -14.24951171875, -13.67578125, -13.10205078125, -12.5283203125, -11.95458984375, -11.380859375, -10.80712890625, -10.2333984375, -9.65966796875, -9.0859375, -8.51220703125, -7.9384765625, -7.36474609375, -6.791015625, -6.21728515625, -5.6435546875, -5.06982421875, -4.49609375, -3.92236328125, -3.3486328125, -2.77490234375, -2.201171875, -1.62744140625, -1.0537109375, -0.47998046875, 0.09375, 0.66748046875, 1.2412109375, 1.81494140625, 2.388671875, 2.96240234375, 3.5361328125, 4.10986328125, 4.68359375, 5.25732421875, 5.8310546875, 6.40478515625, 6.978515625, 7.55224609375, 8.1259765625, 8.69970703125, 9.2734375, 9.84716796875, 10.4208984375, 10.99462890625, 11.568359375, 12.14208984375, 12.7158203125, 13.28955078125, 13.86328125, 14.43701171875, 15.0107421875, 15.58447265625, 16.158203125, 16.73193359375, 17.3056640625, 17.87939453125, 18.453125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 13.0, 18.0, 28.0, 39.0, 43.0, 86.0, 126.0, 210.0, 325.0, 533.0, 785.0, 1276.0, 2041.0, 3355.0, 5410.0, 8656.0, 14526.0, 24435.0, 41532.0, 69397.0, 116905.0, 193796.0, 326586.0, 589135.0, 1200580.0, 1632651.0, 922947.0, 467526.0, 266899.0, 160622.0, 96176.0, 57655.0, 34537.0, 20410.0, 12493.0, 7486.0, 4571.0, 2812.0, 1695.0, 1109.0, 699.0, 477.0, 307.0, 171.0, 131.0, 72.0, 54.0, 33.0, 29.0, 17.0, 9.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.265625, -19.61865234375, -18.9716796875, -18.32470703125, -17.677734375, -17.03076171875, -16.3837890625, -15.73681640625, -15.08984375, -14.44287109375, -13.7958984375, -13.14892578125, -12.501953125, -11.85498046875, -11.2080078125, -10.56103515625, -9.9140625, -9.26708984375, -8.6201171875, -7.97314453125, -7.326171875, -6.67919921875, -6.0322265625, -5.38525390625, -4.73828125, -4.09130859375, -3.4443359375, -2.79736328125, -2.150390625, -1.50341796875, -0.8564453125, -0.20947265625, 0.4375, 1.08447265625, 1.7314453125, 2.37841796875, 3.025390625, 3.67236328125, 4.3193359375, 4.96630859375, 5.61328125, 6.26025390625, 6.9072265625, 7.55419921875, 8.201171875, 8.84814453125, 9.4951171875, 10.14208984375, 10.7890625, 11.43603515625, 12.0830078125, 12.72998046875, 13.376953125, 14.02392578125, 14.6708984375, 15.31787109375, 15.96484375, 16.61181640625, 17.2587890625, 17.90576171875, 18.552734375, 19.19970703125, 19.8466796875, 20.49365234375, 21.140625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 5.0, 10.0, 11.0, 12.0, 9.0, 19.0, 19.0, 38.0, 24.0, 37.0, 56.0, 71.0, 66.0, 103.0, 142.0, 149.0, 195.0, 173.0, 164.0, 131.0, 100.0, 101.0, 76.0, 55.0, 61.0, 34.0, 34.0, 24.0, 23.0, 16.0, 15.0, 16.0, 4.0, 10.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.33740234375, -20.5185546875, -19.69970703125, -18.880859375, -18.06201171875, -17.2431640625, -16.42431640625, -15.60546875, -14.78662109375, -13.9677734375, -13.14892578125, -12.330078125, -11.51123046875, -10.6923828125, -9.87353515625, -9.0546875, -8.23583984375, -7.4169921875, -6.59814453125, -5.779296875, -4.96044921875, -4.1416015625, -3.32275390625, -2.50390625, -1.68505859375, -0.8662109375, -0.04736328125, 0.771484375, 1.59033203125, 2.4091796875, 3.22802734375, 4.046875, 4.86572265625, 5.6845703125, 6.50341796875, 7.322265625, 8.14111328125, 8.9599609375, 9.77880859375, 10.59765625, 11.41650390625, 12.2353515625, 13.05419921875, 13.873046875, 14.69189453125, 15.5107421875, 16.32958984375, 17.1484375, 17.96728515625, 18.7861328125, 19.60498046875, 20.423828125, 21.24267578125, 22.0615234375, 22.88037109375, 23.69921875, 24.51806640625, 25.3369140625, 26.15576171875, 26.974609375, 27.79345703125, 28.6123046875, 29.43115234375, 30.25]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 5.0, 14.0, 10.0, 18.0, 45.0, 55.0, 96.0, 143.0, 235.0, 319.0, 445.0, 693.0, 1071.0, 1596.0, 2353.0, 3725.0, 5685.0, 9229.0, 14846.0, 24145.0, 41164.0, 79397.0, 235142.0, 5508615.0, 192854.0, 71799.0, 37762.0, 22115.0, 13343.0, 8472.0, 5426.0, 3527.0, 2301.0, 1611.0, 928.0, 689.0, 497.0, 344.0, 234.0, 168.0, 107.0, 72.0, 57.0, 32.0, 22.0, 10.0, 11.0, 9.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.47705078125, -45.6103515625, -43.74365234375, -41.876953125, -40.01025390625, -38.1435546875, -36.27685546875, -34.41015625, -32.54345703125, -30.6767578125, -28.81005859375, -26.943359375, -25.07666015625, -23.2099609375, -21.34326171875, -19.4765625, -17.60986328125, -15.7431640625, -13.87646484375, -12.009765625, -10.14306640625, -8.2763671875, -6.40966796875, -4.54296875, -2.67626953125, -0.8095703125, 1.05712890625, 2.923828125, 4.79052734375, 6.6572265625, 8.52392578125, 10.390625, 12.25732421875, 14.1240234375, 15.99072265625, 17.857421875, 19.72412109375, 21.5908203125, 23.45751953125, 25.32421875, 27.19091796875, 29.0576171875, 30.92431640625, 32.791015625, 34.65771484375, 36.5244140625, 38.39111328125, 40.2578125, 42.12451171875, 43.9912109375, 45.85791015625, 47.724609375, 49.59130859375, 51.4580078125, 53.32470703125, 55.19140625, 57.05810546875, 58.9248046875, 60.79150390625, 62.658203125, 64.52490234375, 66.3916015625, 68.25830078125, 70.125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 6.0, 9.0, 8.0, 17.0, 17.0, 17.0, 20.0, 18.0, 21.0, 24.0, 30.0, 32.0, 44.0, 46.0, 63.0, 94.0, 153.0, 201.0, 221.0, 213.0, 158.0, 137.0, 89.0, 54.0, 64.0, 43.0, 31.0, 28.0, 20.0, 28.0, 23.0, 15.0, 14.0, 9.0, 5.0, 8.0, 7.0, 4.0, 3.0, 6.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.53125, -34.46630859375, -33.4013671875, -32.33642578125, -31.271484375, -30.20654296875, -29.1416015625, -28.07666015625, -27.01171875, -25.94677734375, -24.8818359375, -23.81689453125, -22.751953125, -21.68701171875, -20.6220703125, -19.55712890625, -18.4921875, -17.42724609375, -16.3623046875, -15.29736328125, -14.232421875, -13.16748046875, -12.1025390625, -11.03759765625, -9.97265625, -8.90771484375, -7.8427734375, -6.77783203125, -5.712890625, -4.64794921875, -3.5830078125, -2.51806640625, -1.453125, -0.38818359375, 0.6767578125, 1.74169921875, 2.806640625, 3.87158203125, 4.9365234375, 6.00146484375, 7.06640625, 8.13134765625, 9.1962890625, 10.26123046875, 11.326171875, 12.39111328125, 13.4560546875, 14.52099609375, 15.5859375, 16.65087890625, 17.7158203125, 18.78076171875, 19.845703125, 20.91064453125, 21.9755859375, 23.04052734375, 24.10546875, 25.17041015625, 26.2353515625, 27.30029296875, 28.365234375, 29.43017578125, 30.4951171875, 31.56005859375, 32.625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 14.0, 20.0, 47.0, 95.0, 490.0, 189.0, 60.0, 27.0, 21.0, 7.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4114.9453125, -3985.138427734375, -3855.33154296875, -3725.5244140625, -3595.717529296875, -3465.91064453125, -3336.103515625, -3206.296630859375, -3076.48974609375, -2946.682861328125, -2816.8759765625, -2687.06884765625, -2557.261962890625, -2427.455078125, -2297.64794921875, -2167.841064453125, -2038.0341796875, -1908.227294921875, -1778.4202880859375, -1648.61328125, -1518.806396484375, -1388.99951171875, -1259.1925048828125, -1129.385498046875, -999.57861328125, -869.7716674804688, -739.9647216796875, -610.1577758789062, -480.350830078125, -350.54388427734375, -220.7369384765625, -90.92999267578125, 38.87646484375, 168.68341064453125, 298.4903564453125, 428.29730224609375, 558.104248046875, 687.9111938476562, 817.7181396484375, 947.5250854492188, 1077.33203125, 1207.138916015625, 1336.9459228515625, 1466.7529296875, 1596.559814453125, 1726.36669921875, 1856.1737060546875, 1985.980712890625, 2115.78759765625, 2245.594482421875, 2375.4013671875, 2505.20849609375, 2635.015380859375, 2764.822265625, 2894.62939453125, 3024.436279296875, 3154.2431640625, 3284.050048828125, 3413.85693359375, 3543.6640625, 3673.470947265625, 3803.27783203125, 3933.0849609375, 4062.891845703125, 4192.69873046875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 7.0, 7.0, 10.0, 6.0, 5.0, 11.0, 5.0, 10.0, 8.0, 11.0, 13.0, 21.0, 16.0, 20.0, 43.0, 58.0, 102.0, 279.0, 114.0, 48.0, 30.0, 27.0, 22.0, 16.0, 21.0, 12.0, 7.0, 8.0, 14.0, 9.0, 7.0, 6.0, 6.0, 5.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-948.9963989257812, -918.8461303710938, -888.6958618164062, -858.5455322265625, -828.395263671875, -798.2449951171875, -768.0947265625, -737.9444580078125, -707.794189453125, -677.6439208984375, -647.49365234375, -617.3433837890625, -587.1930541992188, -557.0427856445312, -526.8925170898438, -496.74224853515625, -466.5919189453125, -436.441650390625, -406.2913513183594, -376.1410827636719, -345.99078369140625, -315.84051513671875, -285.69024658203125, -255.5399627685547, -225.38967895507812, -195.23939514160156, -165.089111328125, -134.9388427734375, -104.78855895996094, -74.63827514648438, -44.488006591796875, -14.337722778320312, 15.8126220703125, 45.9629020690918, 76.1131820678711, 106.26345825195312, 136.4137420654297, 166.56402587890625, 196.71429443359375, 226.8645782470703, 257.0148620605469, 287.1651306152344, 317.3154296875, 347.4656982421875, 377.615966796875, 407.7662658691406, 437.9165344238281, 468.06683349609375, 498.21710205078125, 528.3673706054688, 558.5176391601562, 588.66796875, 618.8182373046875, 648.968505859375, 679.1187744140625, 709.26904296875, 739.4193115234375, 769.569580078125, 799.7198486328125, 829.8701171875, 860.0204467773438, 890.1707153320312, 920.3209838867188, 950.4712524414062, 980.62158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 7.0, 11.0, 14.0, 18.0, 21.0, 24.0, 44.0, 81.0, 116.0, 142.0, 195.0, 328.0, 477.0, 777.0, 1177.0, 2027.0, 3293.0, 5508.0, 10284.0, 20106.0, 44471.0, 137221.0, 2326453.0, 1425456.0, 128088.0, 43830.0, 19737.0, 10094.0, 5495.0, 3254.0, 1990.0, 1211.0, 781.0, 561.0, 323.0, 213.0, 155.0, 84.0, 56.0, 53.0, 35.0, 20.0, 17.0, 12.0, 6.0, 8.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.7861328125, -10.400390625, -10.0146484375, -9.62890625, -9.2431640625, -8.857421875, -8.4716796875, -8.0859375, -7.7001953125, -7.314453125, -6.9287109375, -6.54296875, -6.1572265625, -5.771484375, -5.3857421875, -5.0, -4.6142578125, -4.228515625, -3.8427734375, -3.45703125, -3.0712890625, -2.685546875, -2.2998046875, -1.9140625, -1.5283203125, -1.142578125, -0.7568359375, -0.37109375, 0.0146484375, 0.400390625, 0.7861328125, 1.171875, 1.5576171875, 1.943359375, 2.3291015625, 2.71484375, 3.1005859375, 3.486328125, 3.8720703125, 4.2578125, 4.6435546875, 5.029296875, 5.4150390625, 5.80078125, 6.1865234375, 6.572265625, 6.9580078125, 7.34375, 7.7294921875, 8.115234375, 8.5009765625, 8.88671875, 9.2724609375, 9.658203125, 10.0439453125, 10.4296875, 10.8154296875, 11.201171875, 11.5869140625, 11.97265625, 12.3583984375, 12.744140625, 13.1298828125, 13.515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 10.0, 10.0, 10.0, 23.0, 25.0, 69.0, 93.0, 167.0, 179.0, 143.0, 94.0, 42.0, 29.0, 15.0, 11.0, 13.0, 10.0, 8.0, 6.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.173828125, -1.1352081298828125, -1.096588134765625, -1.0579681396484375, -1.01934814453125, -0.9807281494140625, -0.942108154296875, -0.9034881591796875, -0.8648681640625, -0.8262481689453125, -0.787628173828125, -0.7490081787109375, -0.71038818359375, -0.6717681884765625, -0.633148193359375, -0.5945281982421875, -0.555908203125, -0.5172882080078125, -0.478668212890625, -0.4400482177734375, -0.40142822265625, -0.3628082275390625, -0.324188232421875, -0.2855682373046875, -0.2469482421875, -0.2083282470703125, -0.169708251953125, -0.1310882568359375, -0.09246826171875, -0.0538482666015625, -0.015228271484375, 0.0233917236328125, 0.06201171875, 0.1006317138671875, 0.139251708984375, 0.1778717041015625, 0.21649169921875, 0.2551116943359375, 0.293731689453125, 0.3323516845703125, 0.3709716796875, 0.4095916748046875, 0.448211669921875, 0.4868316650390625, 0.52545166015625, 0.5640716552734375, 0.602691650390625, 0.6413116455078125, 0.679931640625, 0.7185516357421875, 0.757171630859375, 0.7957916259765625, 0.83441162109375, 0.8730316162109375, 0.911651611328125, 0.9502716064453125, 0.9888916015625, 1.0275115966796875, 1.066131591796875, 1.1047515869140625, 1.14337158203125, 1.1819915771484375, 1.220611572265625, 1.2592315673828125, 1.2978515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 7.0, 10.0, 23.0, 31.0, 41.0, 84.0, 70.0, 160.0, 253.0, 436.0, 764.0, 1411.0, 2812.0, 5616.0, 12034.0, 28885.0, 78273.0, 243477.0, 950784.0, 2099949.0, 530714.0, 151094.0, 50820.0, 19911.0, 8365.0, 3900.0, 1850.0, 1002.0, 606.0, 307.0, 188.0, 125.0, 76.0, 63.0, 40.0, 34.0, 11.0, 16.0, 14.0, 8.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.9654541015625, -11.594970703125, -11.2244873046875, -10.85400390625, -10.4835205078125, -10.113037109375, -9.7425537109375, -9.3720703125, -9.0015869140625, -8.631103515625, -8.2606201171875, -7.89013671875, -7.5196533203125, -7.149169921875, -6.7786865234375, -6.408203125, -6.0377197265625, -5.667236328125, -5.2967529296875, -4.92626953125, -4.5557861328125, -4.185302734375, -3.8148193359375, -3.4443359375, -3.0738525390625, -2.703369140625, -2.3328857421875, -1.96240234375, -1.5919189453125, -1.221435546875, -0.8509521484375, -0.48046875, -0.1099853515625, 0.260498046875, 0.6309814453125, 1.00146484375, 1.3719482421875, 1.742431640625, 2.1129150390625, 2.4833984375, 2.8538818359375, 3.224365234375, 3.5948486328125, 3.96533203125, 4.3358154296875, 4.706298828125, 5.0767822265625, 5.447265625, 5.8177490234375, 6.188232421875, 6.5587158203125, 6.92919921875, 7.2996826171875, 7.670166015625, 8.0406494140625, 8.4111328125, 8.7816162109375, 9.152099609375, 9.5225830078125, 9.89306640625, 10.2635498046875, 10.634033203125, 11.0045166015625, 11.375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 9.0, 10.0, 11.0, 11.0, 23.0, 20.0, 31.0, 27.0, 40.0, 29.0, 53.0, 57.0, 92.0, 100.0, 107.0, 114.0, 165.0, 181.0, 258.0, 266.0, 340.0, 399.0, 276.0, 258.0, 209.0, 169.0, 131.0, 125.0, 90.0, 73.0, 77.0, 51.0, 53.0, 42.0, 25.0, 24.0, 31.0, 14.0, 16.0, 8.0, 6.0, 5.0, 9.0, 6.0, 3.0, 3.0, 4.0, 6.0, 0.0, 2.0], "bins": [-2.751953125, -2.673614501953125, -2.59527587890625, -2.516937255859375, -2.4385986328125, -2.360260009765625, -2.28192138671875, -2.203582763671875, -2.125244140625, -2.046905517578125, -1.96856689453125, -1.890228271484375, -1.8118896484375, -1.733551025390625, -1.65521240234375, -1.576873779296875, -1.49853515625, -1.420196533203125, -1.34185791015625, -1.263519287109375, -1.1851806640625, -1.106842041015625, -1.02850341796875, -0.950164794921875, -0.871826171875, -0.793487548828125, -0.71514892578125, -0.636810302734375, -0.5584716796875, -0.480133056640625, -0.40179443359375, -0.323455810546875, -0.2451171875, -0.166778564453125, -0.08843994140625, -0.010101318359375, 0.0682373046875, 0.146575927734375, 0.22491455078125, 0.303253173828125, 0.381591796875, 0.459930419921875, 0.53826904296875, 0.616607666015625, 0.6949462890625, 0.773284912109375, 0.85162353515625, 0.929962158203125, 1.00830078125, 1.086639404296875, 1.16497802734375, 1.243316650390625, 1.3216552734375, 1.399993896484375, 1.47833251953125, 1.556671142578125, 1.635009765625, 1.713348388671875, 1.79168701171875, 1.870025634765625, 1.9483642578125, 2.026702880859375, 2.10504150390625, 2.183380126953125, 2.26171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 13.0, 26.0, 59.0, 80.0, 116.0, 188.0, 193.0, 161.0, 79.0, 36.0, 17.0, 16.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-88.87611389160156, -86.59979248046875, -84.32347106933594, -82.04714965820312, -79.77082824707031, -77.4945068359375, -75.21818542480469, -72.9418716430664, -70.6655502319336, -68.38922882080078, -66.11290740966797, -63.836585998535156, -61.56026840209961, -59.2839469909668, -57.007625579833984, -54.73130416870117, -52.45498275756836, -50.17866134643555, -47.902339935302734, -45.62602233886719, -43.349700927734375, -41.07337951660156, -38.79705810546875, -36.52073669433594, -34.244415283203125, -31.968093872070312, -29.691774368286133, -27.41545295715332, -25.13913345336914, -22.862812042236328, -20.586490631103516, -18.310169219970703, -16.033851623535156, -13.75753116607666, -11.481210708618164, -9.204889297485352, -6.9285688400268555, -4.652248382568359, -2.375926971435547, -0.09960651397705078, 2.1767139434814453, 4.453034400939941, 6.729355335235596, 9.00567626953125, 11.281996726989746, 13.558317184448242, 15.834638595581055, 18.110958099365234, 20.387279510498047, 22.66360092163086, 24.93992042541504, 27.21624183654785, 29.49256134033203, 31.768882751464844, 34.045204162597656, 36.32152557373047, 38.59784698486328, 40.874168395996094, 43.150489807128906, 45.42681121826172, 47.703128814697266, 49.97945022583008, 52.25577163696289, 54.5320930480957, 56.80841064453125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 5.0, 7.0, 13.0, 10.0, 31.0, 21.0, 38.0, 44.0, 48.0, 42.0, 50.0, 61.0, 50.0, 47.0, 52.0, 48.0, 72.0, 47.0, 54.0, 35.0, 40.0, 28.0, 25.0, 28.0, 26.0, 16.0, 20.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-29.659461975097656, -28.878816604614258, -28.098173141479492, -27.317527770996094, -26.536882400512695, -25.756237030029297, -24.97559356689453, -24.194948196411133, -23.414302825927734, -22.633657455444336, -21.85301399230957, -21.072368621826172, -20.291723251342773, -19.511077880859375, -18.73043441772461, -17.94978904724121, -17.169145584106445, -16.388500213623047, -15.607855796813965, -14.827211380004883, -14.046566009521484, -13.265921592712402, -12.48527717590332, -11.704631805419922, -10.92398738861084, -10.143342971801758, -9.36269760131836, -8.582053184509277, -7.801408290863037, -7.020763397216797, -6.240118980407715, -5.459474086761475, -4.678831100463867, -3.898186206817627, -3.117541551589966, -2.3368968963623047, -1.5562520027160645, -0.7756071090698242, 0.0050373077392578125, 0.785682201385498, 1.5663270950317383, 2.3469719886779785, 3.1276166439056396, 3.908261299133301, 4.688906192779541, 5.469551086425781, 6.250195503234863, 7.0308403968811035, 7.811485290527344, 8.592129707336426, 9.372775077819824, 10.153419494628906, 10.934064865112305, 11.714709281921387, 12.495353698730469, 13.275999069213867, 14.05664348602295, 14.837287902832031, 15.61793327331543, 16.398578643798828, 17.179222106933594, 17.959867477416992, 18.74051284790039, 19.521156311035156, 20.301801681518555]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 9.0, 10.0, 24.0, 31.0, 49.0, 80.0, 92.0, 164.0, 254.0, 382.0, 682.0, 1149.0, 1864.0, 3700.0, 7424.0, 17842.0, 52885.0, 227400.0, 536797.0, 135087.0, 36270.0, 13213.0, 5961.0, 3064.0, 1580.0, 940.0, 540.0, 346.0, 229.0, 146.0, 104.0, 63.0, 47.0, 27.0, 20.0, 17.0, 17.0, 9.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.1640625, -7.92633056640625, -7.6885986328125, -7.45086669921875, -7.213134765625, -6.97540283203125, -6.7376708984375, -6.49993896484375, -6.26220703125, -6.02447509765625, -5.7867431640625, -5.54901123046875, -5.311279296875, -5.07354736328125, -4.8358154296875, -4.59808349609375, -4.3603515625, -4.12261962890625, -3.8848876953125, -3.64715576171875, -3.409423828125, -3.17169189453125, -2.9339599609375, -2.69622802734375, -2.45849609375, -2.22076416015625, -1.9830322265625, -1.74530029296875, -1.507568359375, -1.26983642578125, -1.0321044921875, -0.79437255859375, -0.556640625, -0.31890869140625, -0.0811767578125, 0.15655517578125, 0.394287109375, 0.63201904296875, 0.8697509765625, 1.10748291015625, 1.34521484375, 1.58294677734375, 1.8206787109375, 2.05841064453125, 2.296142578125, 2.53387451171875, 2.7716064453125, 3.00933837890625, 3.2470703125, 3.48480224609375, 3.7225341796875, 3.96026611328125, 4.197998046875, 4.43572998046875, 4.6734619140625, 4.91119384765625, 5.14892578125, 5.38665771484375, 5.6243896484375, 5.86212158203125, 6.099853515625, 6.33758544921875, 6.5753173828125, 6.81304931640625, 7.05078125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 11.0, 13.0, 17.0, 23.0, 33.0, 74.0, 85.0, 90.0, 105.0, 87.0, 127.0, 90.0, 59.0, 52.0, 37.0, 24.0, 16.0, 11.0, 8.0, 3.0, 5.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.1623382568359375, -1.112762451171875, -1.0631866455078125, -1.01361083984375, -0.9640350341796875, -0.914459228515625, -0.8648834228515625, -0.8153076171875, -0.7657318115234375, -0.716156005859375, -0.6665802001953125, -0.61700439453125, -0.5674285888671875, -0.517852783203125, -0.4682769775390625, -0.418701171875, -0.3691253662109375, -0.319549560546875, -0.2699737548828125, -0.22039794921875, -0.1708221435546875, -0.121246337890625, -0.0716705322265625, -0.0220947265625, 0.0274810791015625, 0.077056884765625, 0.1266326904296875, 0.17620849609375, 0.2257843017578125, 0.275360107421875, 0.3249359130859375, 0.37451171875, 0.4240875244140625, 0.473663330078125, 0.5232391357421875, 0.57281494140625, 0.6223907470703125, 0.671966552734375, 0.7215423583984375, 0.7711181640625, 0.8206939697265625, 0.870269775390625, 0.9198455810546875, 0.96942138671875, 1.0189971923828125, 1.068572998046875, 1.1181488037109375, 1.167724609375, 1.2173004150390625, 1.266876220703125, 1.3164520263671875, 1.36602783203125, 1.4156036376953125, 1.465179443359375, 1.5147552490234375, 1.5643310546875, 1.6139068603515625, 1.663482666015625, 1.7130584716796875, 1.76263427734375, 1.8122100830078125, 1.861785888671875, 1.9113616943359375, 1.9609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 5.0, 9.0, 12.0, 9.0, 14.0, 23.0, 25.0, 46.0, 58.0, 76.0, 115.0, 200.0, 275.0, 389.0, 634.0, 986.0, 1646.0, 2846.0, 5288.0, 9717.0, 19221.0, 40968.0, 99352.0, 262071.0, 350337.0, 143967.0, 56635.0, 25654.0, 12350.0, 6491.0, 3677.0, 2041.0, 1241.0, 724.0, 503.0, 316.0, 180.0, 119.0, 115.0, 67.0, 35.0, 40.0, 20.0, 19.0, 13.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.046875, -4.88507080078125, -4.7232666015625, -4.56146240234375, -4.399658203125, -4.23785400390625, -4.0760498046875, -3.91424560546875, -3.75244140625, -3.59063720703125, -3.4288330078125, -3.26702880859375, -3.105224609375, -2.94342041015625, -2.7816162109375, -2.61981201171875, -2.4580078125, -2.29620361328125, -2.1343994140625, -1.97259521484375, -1.810791015625, -1.64898681640625, -1.4871826171875, -1.32537841796875, -1.16357421875, -1.00177001953125, -0.8399658203125, -0.67816162109375, -0.516357421875, -0.35455322265625, -0.1927490234375, -0.03094482421875, 0.130859375, 0.29266357421875, 0.4544677734375, 0.61627197265625, 0.778076171875, 0.93988037109375, 1.1016845703125, 1.26348876953125, 1.42529296875, 1.58709716796875, 1.7489013671875, 1.91070556640625, 2.072509765625, 2.23431396484375, 2.3961181640625, 2.55792236328125, 2.7197265625, 2.88153076171875, 3.0433349609375, 3.20513916015625, 3.366943359375, 3.52874755859375, 3.6905517578125, 3.85235595703125, 4.01416015625, 4.17596435546875, 4.3377685546875, 4.49957275390625, 4.661376953125, 4.82318115234375, 4.9849853515625, 5.14678955078125, 5.30859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 5.0, 2.0, 7.0, 5.0, 7.0, 8.0, 10.0, 15.0, 14.0, 22.0, 23.0, 20.0, 21.0, 21.0, 24.0, 42.0, 37.0, 27.0, 28.0, 36.0, 31.0, 41.0, 37.0, 42.0, 38.0, 37.0, 39.0, 32.0, 34.0, 24.0, 25.0, 22.0, 28.0, 27.0, 25.0, 25.0, 15.0, 14.0, 13.0, 12.0, 10.0, 9.0, 9.0, 9.0, 13.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.6953125, -4.5338134765625, -4.372314453125, -4.2108154296875, -4.04931640625, -3.8878173828125, -3.726318359375, -3.5648193359375, -3.4033203125, -3.2418212890625, -3.080322265625, -2.9188232421875, -2.75732421875, -2.5958251953125, -2.434326171875, -2.2728271484375, -2.111328125, -1.9498291015625, -1.788330078125, -1.6268310546875, -1.46533203125, -1.3038330078125, -1.142333984375, -0.9808349609375, -0.8193359375, -0.6578369140625, -0.496337890625, -0.3348388671875, -0.17333984375, -0.0118408203125, 0.149658203125, 0.3111572265625, 0.47265625, 0.6341552734375, 0.795654296875, 0.9571533203125, 1.11865234375, 1.2801513671875, 1.441650390625, 1.6031494140625, 1.7646484375, 1.9261474609375, 2.087646484375, 2.2491455078125, 2.41064453125, 2.5721435546875, 2.733642578125, 2.8951416015625, 3.056640625, 3.2181396484375, 3.379638671875, 3.5411376953125, 3.70263671875, 3.8641357421875, 4.025634765625, 4.1871337890625, 4.3486328125, 4.5101318359375, 4.671630859375, 4.8331298828125, 4.99462890625, 5.1561279296875, 5.317626953125, 5.4791259765625, 5.640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 3.0, 13.0, 27.0, 25.0, 50.0, 58.0, 109.0, 176.0, 278.0, 522.0, 1069.0, 2262.0, 5683.0, 17705.0, 83540.0, 614545.0, 267782.0, 37446.0, 10191.0, 3656.0, 1570.0, 775.0, 422.0, 223.0, 162.0, 99.0, 38.0, 31.0, 26.0, 16.0, 19.0, 7.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1953125, -12.8157958984375, -12.436279296875, -12.0567626953125, -11.67724609375, -11.2977294921875, -10.918212890625, -10.5386962890625, -10.1591796875, -9.7796630859375, -9.400146484375, -9.0206298828125, -8.64111328125, -8.2615966796875, -7.882080078125, -7.5025634765625, -7.123046875, -6.7435302734375, -6.364013671875, -5.9844970703125, -5.60498046875, -5.2254638671875, -4.845947265625, -4.4664306640625, -4.0869140625, -3.7073974609375, -3.327880859375, -2.9483642578125, -2.56884765625, -2.1893310546875, -1.809814453125, -1.4302978515625, -1.05078125, -0.6712646484375, -0.291748046875, 0.0877685546875, 0.46728515625, 0.8468017578125, 1.226318359375, 1.6058349609375, 1.9853515625, 2.3648681640625, 2.744384765625, 3.1239013671875, 3.50341796875, 3.8829345703125, 4.262451171875, 4.6419677734375, 5.021484375, 5.4010009765625, 5.780517578125, 6.1600341796875, 6.53955078125, 6.9190673828125, 7.298583984375, 7.6781005859375, 8.0576171875, 8.4371337890625, 8.816650390625, 9.1961669921875, 9.57568359375, 9.9552001953125, 10.334716796875, 10.7142333984375, 11.09375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 8.0, 8.0, 10.0, 12.0, 18.0, 31.0, 54.0, 61.0, 74.0, 100.0, 93.0, 129.0, 93.0, 67.0, 60.0, 63.0, 39.0, 18.0, 17.0, 11.0, 7.0, 6.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00044727325439453125, -0.0004345551133155823, -0.0004218369722366333, -0.0004091188311576843, -0.00039640069007873535, -0.0003836825489997864, -0.0003709644079208374, -0.00035824626684188843, -0.00034552812576293945, -0.0003328099846839905, -0.0003200918436050415, -0.00030737370252609253, -0.00029465556144714355, -0.0002819374203681946, -0.0002692192792892456, -0.00025650113821029663, -0.00024378299713134766, -0.00023106485605239868, -0.0002183467149734497, -0.00020562857389450073, -0.00019291043281555176, -0.00018019229173660278, -0.0001674741506576538, -0.00015475600957870483, -0.00014203786849975586, -0.00012931972742080688, -0.00011660158634185791, -0.00010388344526290894, -9.116530418395996e-05, -7.844716310501099e-05, -6.572902202606201e-05, -5.301088094711304e-05, -4.029273986816406e-05, -2.7574598789215088e-05, -1.4856457710266113e-05, -2.1383166313171387e-06, 1.0579824447631836e-05, 2.329796552658081e-05, 3.6016106605529785e-05, 4.873424768447876e-05, 6.145238876342773e-05, 7.417052984237671e-05, 8.688867092132568e-05, 9.960681200027466e-05, 0.00011232495307922363, 0.0001250430941581726, 0.00013776123523712158, 0.00015047937631607056, 0.00016319751739501953, 0.0001759156584739685, 0.00018863379955291748, 0.00020135194063186646, 0.00021407008171081543, 0.0002267882227897644, 0.00023950636386871338, 0.00025222450494766235, 0.00026494264602661133, 0.0002776607871055603, 0.0002903789281845093, 0.00030309706926345825, 0.0003158152103424072, 0.0003285333514213562, 0.0003412514925003052, 0.00035396963357925415, 0.0003666877746582031]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 13.0, 17.0, 25.0, 36.0, 60.0, 65.0, 132.0, 216.0, 393.0, 762.0, 1630.0, 3767.0, 9880.0, 32453.0, 159182.0, 610948.0, 176374.0, 34871.0, 10371.0, 3940.0, 1626.0, 773.0, 383.0, 241.0, 145.0, 107.0, 54.0, 27.0, 18.0, 12.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.3203125, -10.982666015625, -10.64501953125, -10.307373046875, -9.9697265625, -9.632080078125, -9.29443359375, -8.956787109375, -8.619140625, -8.281494140625, -7.94384765625, -7.606201171875, -7.2685546875, -6.930908203125, -6.59326171875, -6.255615234375, -5.91796875, -5.580322265625, -5.24267578125, -4.905029296875, -4.5673828125, -4.229736328125, -3.89208984375, -3.554443359375, -3.216796875, -2.879150390625, -2.54150390625, -2.203857421875, -1.8662109375, -1.528564453125, -1.19091796875, -0.853271484375, -0.515625, -0.177978515625, 0.15966796875, 0.497314453125, 0.8349609375, 1.172607421875, 1.51025390625, 1.847900390625, 2.185546875, 2.523193359375, 2.86083984375, 3.198486328125, 3.5361328125, 3.873779296875, 4.21142578125, 4.549072265625, 4.88671875, 5.224365234375, 5.56201171875, 5.899658203125, 6.2373046875, 6.574951171875, 6.91259765625, 7.250244140625, 7.587890625, 7.925537109375, 8.26318359375, 8.600830078125, 8.9384765625, 9.276123046875, 9.61376953125, 9.951416015625, 10.2890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 10.0, 13.0, 13.0, 19.0, 18.0, 37.0, 35.0, 43.0, 40.0, 53.0, 78.0, 81.0, 70.0, 82.0, 74.0, 60.0, 54.0, 38.0, 40.0, 24.0, 20.0, 15.0, 13.0, 19.0, 12.0, 9.0, 9.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0546875, -4.86639404296875, -4.6781005859375, -4.48980712890625, -4.301513671875, -4.11322021484375, -3.9249267578125, -3.73663330078125, -3.54833984375, -3.36004638671875, -3.1717529296875, -2.98345947265625, -2.795166015625, -2.60687255859375, -2.4185791015625, -2.23028564453125, -2.0419921875, -1.85369873046875, -1.6654052734375, -1.47711181640625, -1.288818359375, -1.10052490234375, -0.9122314453125, -0.72393798828125, -0.53564453125, -0.34735107421875, -0.1590576171875, 0.02923583984375, 0.217529296875, 0.40582275390625, 0.5941162109375, 0.78240966796875, 0.970703125, 1.15899658203125, 1.3472900390625, 1.53558349609375, 1.723876953125, 1.91217041015625, 2.1004638671875, 2.28875732421875, 2.47705078125, 2.66534423828125, 2.8536376953125, 3.04193115234375, 3.230224609375, 3.41851806640625, 3.6068115234375, 3.79510498046875, 3.9833984375, 4.17169189453125, 4.3599853515625, 4.54827880859375, 4.736572265625, 4.92486572265625, 5.1131591796875, 5.30145263671875, 5.48974609375, 5.67803955078125, 5.8663330078125, 6.05462646484375, 6.242919921875, 6.43121337890625, 6.6195068359375, 6.80780029296875, 6.99609375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 8.0, 12.0, 32.0, 59.0, 194.0, 312.0, 218.0, 80.0, 31.0, 15.0, 13.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.64065551757812, -134.39913940429688, -130.15762329101562, -125.9161148071289, -121.67460632324219, -117.43309020996094, -113.19157409667969, -108.95005798339844, -104.70854949951172, -100.46703338623047, -96.22552490234375, -91.9840087890625, -87.74249267578125, -83.50098419189453, -79.25946807861328, -75.01795959472656, -70.77644348144531, -66.53492736816406, -62.293418884277344, -58.051902770996094, -53.81039047241211, -49.568878173828125, -45.327362060546875, -41.08584976196289, -36.844337463378906, -32.60282516479492, -28.361310958862305, -24.119796752929688, -19.878284454345703, -15.636772155761719, -11.395257949829102, -7.153743743896484, -2.9122314453125, 1.3292818069458008, 5.570795059204102, 9.812308311462402, 14.053821563720703, 18.295333862304688, 22.536848068237305, 26.778362274169922, 31.019874572753906, 35.26138687133789, 39.502899169921875, 43.744415283203125, 47.98592758178711, 52.227439880371094, 56.468955993652344, 60.71046829223633, 64.95198059082031, 69.19349670410156, 73.43500518798828, 77.67652130126953, 81.91802978515625, 86.1595458984375, 90.40106201171875, 94.642578125, 98.88408660888672, 103.12560272216797, 107.36711120605469, 111.60862731933594, 115.85014343261719, 120.0916519165039, 124.33316802978516, 128.57467651367188, 132.81619262695312]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 6.0, 5.0, 5.0, 17.0, 12.0, 24.0, 37.0, 78.0, 131.0, 188.0, 154.0, 126.0, 79.0, 46.0, 33.0, 10.0, 12.0, 8.0, 5.0, 4.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.78155517578125, -139.55946350097656, -135.33738708496094, -131.11529541015625, -126.89320373535156, -122.6711196899414, -118.44903564453125, -114.22694396972656, -110.0048599243164, -105.78277587890625, -101.56068420410156, -97.3386001586914, -93.11651611328125, -88.89442443847656, -84.6723403930664, -80.45025634765625, -76.22816467285156, -72.0060806274414, -67.78398895263672, -63.56190490722656, -59.33981704711914, -55.11772918701172, -50.89564514160156, -46.67355728149414, -42.45146942138672, -38.2293815612793, -34.007293701171875, -29.78520965576172, -25.563121795654297, -21.341033935546875, -17.118947982788086, -12.896862030029297, -8.674789428710938, -4.452702522277832, -0.23061561584472656, 3.991471290588379, 8.213558197021484, 12.435646057128906, 16.657732009887695, 20.879817962646484, 25.101905822753906, 29.323993682861328, 33.54608154296875, 37.768165588378906, 41.99025344848633, 46.21234130859375, 50.434425354003906, 54.65651321411133, 58.87860107421875, 63.10068893432617, 67.3227767944336, 71.54486083984375, 75.76695251464844, 79.9890365600586, 84.21112060546875, 88.43321228027344, 92.6552963256836, 96.87738037109375, 101.09947204589844, 105.3215560913086, 109.54364013671875, 113.76573181152344, 117.9878158569336, 122.20989990234375, 126.43199157714844]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 7.0, 14.0, 15.0, 39.0, 46.0, 82.0, 108.0, 176.0, 302.0, 462.0, 861.0, 1494.0, 3088.0, 6604.0, 16966.0, 59366.0, 564421.0, 3381351.0, 114517.0, 26177.0, 9377.0, 4099.0, 2041.0, 1094.0, 583.0, 343.0, 223.0, 135.0, 97.0, 51.0, 37.0, 26.0, 19.0, 11.0, 19.0, 4.0, 1.0, 3.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.421875, -20.634033203125, -19.84619140625, -19.058349609375, -18.2705078125, -17.482666015625, -16.69482421875, -15.906982421875, -15.119140625, -14.331298828125, -13.54345703125, -12.755615234375, -11.9677734375, -11.179931640625, -10.39208984375, -9.604248046875, -8.81640625, -8.028564453125, -7.24072265625, -6.452880859375, -5.6650390625, -4.877197265625, -4.08935546875, -3.301513671875, -2.513671875, -1.725830078125, -0.93798828125, -0.150146484375, 0.6376953125, 1.425537109375, 2.21337890625, 3.001220703125, 3.7890625, 4.576904296875, 5.36474609375, 6.152587890625, 6.9404296875, 7.728271484375, 8.51611328125, 9.303955078125, 10.091796875, 10.879638671875, 11.66748046875, 12.455322265625, 13.2431640625, 14.031005859375, 14.81884765625, 15.606689453125, 16.39453125, 17.182373046875, 17.97021484375, 18.758056640625, 19.5458984375, 20.333740234375, 21.12158203125, 21.909423828125, 22.697265625, 23.485107421875, 24.27294921875, 25.060791015625, 25.8486328125, 26.636474609375, 27.42431640625, 28.212158203125, 29.0]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 21.0, 16.0, 25.0, 38.0, 50.0, 76.0, 86.0, 113.0, 100.0, 91.0, 107.0, 73.0, 45.0, 31.0, 35.0, 17.0, 10.0, 19.0, 6.0, 4.0, 3.0, 9.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.3835296630859375, -1.331512451171875, -1.2794952392578125, -1.22747802734375, -1.1754608154296875, -1.123443603515625, -1.0714263916015625, -1.0194091796875, -0.9673919677734375, -0.915374755859375, -0.8633575439453125, -0.81134033203125, -0.7593231201171875, -0.707305908203125, -0.6552886962890625, -0.603271484375, -0.5512542724609375, -0.499237060546875, -0.4472198486328125, -0.39520263671875, -0.3431854248046875, -0.291168212890625, -0.2391510009765625, -0.1871337890625, -0.1351165771484375, -0.083099365234375, -0.0310821533203125, 0.02093505859375, 0.0729522705078125, 0.124969482421875, 0.1769866943359375, 0.22900390625, 0.2810211181640625, 0.333038330078125, 0.3850555419921875, 0.43707275390625, 0.4890899658203125, 0.541107177734375, 0.5931243896484375, 0.6451416015625, 0.6971588134765625, 0.749176025390625, 0.8011932373046875, 0.85321044921875, 0.9052276611328125, 0.957244873046875, 1.0092620849609375, 1.061279296875, 1.1132965087890625, 1.165313720703125, 1.2173309326171875, 1.26934814453125, 1.3213653564453125, 1.373382568359375, 1.4253997802734375, 1.4774169921875, 1.5294342041015625, 1.581451416015625, 1.6334686279296875, 1.68548583984375, 1.7375030517578125, 1.789520263671875, 1.8415374755859375, 1.8935546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 11.0, 14.0, 16.0, 22.0, 45.0, 59.0, 71.0, 124.0, 209.0, 321.0, 509.0, 811.0, 1438.0, 2533.0, 4581.0, 8796.0, 18435.0, 41620.0, 109276.0, 388045.0, 2684178.0, 675498.0, 155870.0, 54884.0, 22998.0, 10996.0, 5551.0, 3070.0, 1721.0, 1009.0, 583.0, 345.0, 215.0, 144.0, 104.0, 57.0, 39.0, 25.0, 16.0, 12.0, 5.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4765625, -14.9718017578125, -14.467041015625, -13.9622802734375, -13.45751953125, -12.9527587890625, -12.447998046875, -11.9432373046875, -11.4384765625, -10.9337158203125, -10.428955078125, -9.9241943359375, -9.41943359375, -8.9146728515625, -8.409912109375, -7.9051513671875, -7.400390625, -6.8956298828125, -6.390869140625, -5.8861083984375, -5.38134765625, -4.8765869140625, -4.371826171875, -3.8670654296875, -3.3623046875, -2.8575439453125, -2.352783203125, -1.8480224609375, -1.34326171875, -0.8385009765625, -0.333740234375, 0.1710205078125, 0.67578125, 1.1805419921875, 1.685302734375, 2.1900634765625, 2.69482421875, 3.1995849609375, 3.704345703125, 4.2091064453125, 4.7138671875, 5.2186279296875, 5.723388671875, 6.2281494140625, 6.73291015625, 7.2376708984375, 7.742431640625, 8.2471923828125, 8.751953125, 9.2567138671875, 9.761474609375, 10.2662353515625, 10.77099609375, 11.2757568359375, 11.780517578125, 12.2852783203125, 12.7900390625, 13.2947998046875, 13.799560546875, 14.3043212890625, 14.80908203125, 15.3138427734375, 15.818603515625, 16.3233642578125, 16.828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 11.0, 10.0, 13.0, 22.0, 27.0, 27.0, 32.0, 39.0, 62.0, 90.0, 113.0, 175.0, 254.0, 460.0, 1185.0, 570.0, 309.0, 213.0, 119.0, 92.0, 67.0, 41.0, 43.0, 22.0, 14.0, 11.0, 11.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.4552001953125, -2.359619140625, -2.2640380859375, -2.16845703125, -2.0728759765625, -1.977294921875, -1.8817138671875, -1.7861328125, -1.6905517578125, -1.594970703125, -1.4993896484375, -1.40380859375, -1.3082275390625, -1.212646484375, -1.1170654296875, -1.021484375, -0.9259033203125, -0.830322265625, -0.7347412109375, -0.63916015625, -0.5435791015625, -0.447998046875, -0.3524169921875, -0.2568359375, -0.1612548828125, -0.065673828125, 0.0299072265625, 0.12548828125, 0.2210693359375, 0.316650390625, 0.4122314453125, 0.5078125, 0.6033935546875, 0.698974609375, 0.7945556640625, 0.89013671875, 0.9857177734375, 1.081298828125, 1.1768798828125, 1.2724609375, 1.3680419921875, 1.463623046875, 1.5592041015625, 1.65478515625, 1.7503662109375, 1.845947265625, 1.9415283203125, 2.037109375, 2.1326904296875, 2.228271484375, 2.3238525390625, 2.41943359375, 2.5150146484375, 2.610595703125, 2.7061767578125, 2.8017578125, 2.8973388671875, 2.992919921875, 3.0885009765625, 3.18408203125, 3.2796630859375, 3.375244140625, 3.4708251953125, 3.56640625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 12.0, 19.0, 42.0, 68.0, 138.0, 191.0, 215.0, 152.0, 79.0, 41.0, 22.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.28657531738281, -61.82771682739258, -60.36885452270508, -58.909996032714844, -57.451133728027344, -55.99227523803711, -54.533416748046875, -53.074554443359375, -51.61569595336914, -50.156837463378906, -48.697975158691406, -47.23911666870117, -45.78025436401367, -44.32139587402344, -42.86253356933594, -41.4036750793457, -39.94481658935547, -38.485958099365234, -37.027095794677734, -35.5682373046875, -34.109375, -32.650516510009766, -31.1916561126709, -29.73279571533203, -28.27393341064453, -26.815073013305664, -25.356212615966797, -23.897354125976562, -22.438493728637695, -20.979633331298828, -19.52077293395996, -18.061912536621094, -16.60305404663086, -15.144193649291992, -13.685334205627441, -12.226473808288574, -10.767614364624023, -9.308753967285156, -7.849893569946289, -6.391034126281738, -4.932173728942871, -3.473313808441162, -2.014453649520874, -0.5555934906005859, 0.903266429901123, 2.362126350402832, 3.820986747741699, 5.27984619140625, 6.738706588745117, 8.197566986083984, 9.656426429748535, 11.115286827087402, 12.574146270751953, 14.03300666809082, 15.491867065429688, 16.950725555419922, 18.409587860107422, 19.86844825744629, 21.327308654785156, 22.78616714477539, 24.245027542114258, 25.703887939453125, 27.162748336791992, 28.62160873413086, 30.080467224121094]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 2.0, 2.0, 4.0, 10.0, 8.0, 13.0, 24.0, 22.0, 25.0, 33.0, 47.0, 52.0, 52.0, 44.0, 70.0, 64.0, 81.0, 54.0, 59.0, 65.0, 46.0, 47.0, 41.0, 44.0, 27.0, 14.0, 17.0, 10.0, 12.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.258581161499023, -25.616727828979492, -24.974876403808594, -24.333023071289062, -23.69116973876953, -23.04931640625, -22.4074649810791, -21.76561164855957, -21.123760223388672, -20.48190689086914, -19.840055465698242, -19.19820213317871, -18.55634880065918, -17.91449737548828, -17.27264404296875, -16.63079071044922, -15.988937377929688, -15.347084999084473, -14.705231666564941, -14.063379287719727, -13.421525955200195, -12.77967357635498, -12.137821197509766, -11.495967864990234, -10.85411548614502, -10.212263107299805, -9.570409774780273, -8.928557395935059, -8.286705017089844, -7.6448516845703125, -7.002999305725098, -6.361146450042725, -5.719295501708984, -5.077442646026611, -4.435589790344238, -3.7937374114990234, -3.1518845558166504, -2.5100317001342773, -1.8681790828704834, -1.2263264656066895, -0.5844736099243164, 0.05737912654876709, 0.6992318630218506, 1.341084599494934, 1.9829373359680176, 2.6247901916503906, 3.2666428089141846, 3.9084954261779785, 4.550348281860352, 5.192201137542725, 5.834053993225098, 6.4759063720703125, 7.1177592277526855, 7.759612083435059, 8.401464462280273, 9.043317794799805, 9.68517017364502, 10.327022552490234, 10.968875885009766, 11.61072826385498, 12.252580642700195, 12.894433975219727, 13.536286354064941, 14.178138732910156, 14.819992065429688]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 6.0, 8.0, 5.0, 13.0, 21.0, 28.0, 39.0, 73.0, 299.0, 1467.0, 16729.0, 833914.0, 188932.0, 5804.0, 805.0, 186.0, 75.0, 47.0, 25.0, 20.0, 11.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.125, -45.3671875, -43.609375, -41.8515625, -40.09375, -38.3359375, -36.578125, -34.8203125, -33.0625, -31.3046875, -29.546875, -27.7890625, -26.03125, -24.2734375, -22.515625, -20.7578125, -19.0, -17.2421875, -15.484375, -13.7265625, -11.96875, -10.2109375, -8.453125, -6.6953125, -4.9375, -3.1796875, -1.421875, 0.3359375, 2.09375, 3.8515625, 5.609375, 7.3671875, 9.125, 10.8828125, 12.640625, 14.3984375, 16.15625, 17.9140625, 19.671875, 21.4296875, 23.1875, 24.9453125, 26.703125, 28.4609375, 30.21875, 31.9765625, 33.734375, 35.4921875, 37.25, 39.0078125, 40.765625, 42.5234375, 44.28125, 46.0390625, 47.796875, 49.5546875, 51.3125, 53.0703125, 54.828125, 56.5859375, 58.34375, 60.1015625, 61.859375, 63.6171875, 65.375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 10.0, 22.0, 31.0, 55.0, 75.0, 121.0, 153.0, 147.0, 129.0, 99.0, 64.0, 47.0, 21.0, 11.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.66796875, -4.576690673828125, -4.48541259765625, -4.394134521484375, -4.3028564453125, -4.211578369140625, -4.12030029296875, -4.029022216796875, -3.937744140625, -3.846466064453125, -3.75518798828125, -3.663909912109375, -3.5726318359375, -3.481353759765625, -3.39007568359375, -3.298797607421875, -3.20751953125, -3.116241455078125, -3.02496337890625, -2.933685302734375, -2.8424072265625, -2.751129150390625, -2.65985107421875, -2.568572998046875, -2.477294921875, -2.386016845703125, -2.29473876953125, -2.203460693359375, -2.1121826171875, -2.020904541015625, -1.92962646484375, -1.838348388671875, -1.7470703125, -1.655792236328125, -1.56451416015625, -1.473236083984375, -1.3819580078125, -1.290679931640625, -1.19940185546875, -1.108123779296875, -1.016845703125, -0.925567626953125, -0.83428955078125, -0.743011474609375, -0.6517333984375, -0.560455322265625, -0.46917724609375, -0.377899169921875, -0.28662109375, -0.195343017578125, -0.10406494140625, -0.012786865234375, 0.0784912109375, 0.169769287109375, 0.26104736328125, 0.352325439453125, 0.443603515625, 0.534881591796875, 0.62615966796875, 0.717437744140625, 0.8087158203125, 0.899993896484375, 0.99127197265625, 1.082550048828125, 1.173828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 16.0, 14.0, 26.0, 44.0, 59.0, 103.0, 158.0, 297.0, 560.0, 1083.0, 2075.0, 4706.0, 11608.0, 32771.0, 109503.0, 389548.0, 350134.0, 96682.0, 29717.0, 10757.0, 4466.0, 2019.0, 976.0, 523.0, 304.0, 152.0, 74.0, 59.0, 41.0, 18.0, 14.0, 8.0, 7.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.765625, -11.3973388671875, -11.029052734375, -10.6607666015625, -10.29248046875, -9.9241943359375, -9.555908203125, -9.1876220703125, -8.8193359375, -8.4510498046875, -8.082763671875, -7.7144775390625, -7.34619140625, -6.9779052734375, -6.609619140625, -6.2413330078125, -5.873046875, -5.5047607421875, -5.136474609375, -4.7681884765625, -4.39990234375, -4.0316162109375, -3.663330078125, -3.2950439453125, -2.9267578125, -2.5584716796875, -2.190185546875, -1.8218994140625, -1.45361328125, -1.0853271484375, -0.717041015625, -0.3487548828125, 0.01953125, 0.3878173828125, 0.756103515625, 1.1243896484375, 1.49267578125, 1.8609619140625, 2.229248046875, 2.5975341796875, 2.9658203125, 3.3341064453125, 3.702392578125, 4.0706787109375, 4.43896484375, 4.8072509765625, 5.175537109375, 5.5438232421875, 5.912109375, 6.2803955078125, 6.648681640625, 7.0169677734375, 7.38525390625, 7.7535400390625, 8.121826171875, 8.4901123046875, 8.8583984375, 9.2266845703125, 9.594970703125, 9.9632568359375, 10.33154296875, 10.6998291015625, 11.068115234375, 11.4364013671875, 11.8046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 5.0, 8.0, 11.0, 12.0, 13.0, 14.0, 16.0, 19.0, 24.0, 20.0, 25.0, 29.0, 38.0, 36.0, 36.0, 41.0, 50.0, 37.0, 52.0, 43.0, 47.0, 38.0, 45.0, 34.0, 36.0, 28.0, 29.0, 32.0, 26.0, 25.0, 20.0, 18.0, 23.0, 11.0, 10.0, 11.0, 5.0, 12.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.30230712890625, -5.1358642578125, -4.96942138671875, -4.802978515625, -4.63653564453125, -4.4700927734375, -4.30364990234375, -4.13720703125, -3.97076416015625, -3.8043212890625, -3.63787841796875, -3.471435546875, -3.30499267578125, -3.1385498046875, -2.97210693359375, -2.8056640625, -2.63922119140625, -2.4727783203125, -2.30633544921875, -2.139892578125, -1.97344970703125, -1.8070068359375, -1.64056396484375, -1.47412109375, -1.30767822265625, -1.1412353515625, -0.97479248046875, -0.808349609375, -0.64190673828125, -0.4754638671875, -0.30902099609375, -0.142578125, 0.02386474609375, 0.1903076171875, 0.35675048828125, 0.523193359375, 0.68963623046875, 0.8560791015625, 1.02252197265625, 1.18896484375, 1.35540771484375, 1.5218505859375, 1.68829345703125, 1.854736328125, 2.02117919921875, 2.1876220703125, 2.35406494140625, 2.5205078125, 2.68695068359375, 2.8533935546875, 3.01983642578125, 3.186279296875, 3.35272216796875, 3.5191650390625, 3.68560791015625, 3.85205078125, 4.01849365234375, 4.1849365234375, 4.35137939453125, 4.517822265625, 4.68426513671875, 4.8507080078125, 5.01715087890625, 5.18359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 15.0, 24.0, 51.0, 130.0, 393.0, 1281.0, 4884.0, 28871.0, 278891.0, 633766.0, 85636.0, 11174.0, 2410.0, 654.0, 225.0, 81.0, 30.0, 21.0, 10.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -15.909912109375, -15.19482421875, -14.479736328125, -13.7646484375, -13.049560546875, -12.33447265625, -11.619384765625, -10.904296875, -10.189208984375, -9.47412109375, -8.759033203125, -8.0439453125, -7.328857421875, -6.61376953125, -5.898681640625, -5.18359375, -4.468505859375, -3.75341796875, -3.038330078125, -2.3232421875, -1.608154296875, -0.89306640625, -0.177978515625, 0.537109375, 1.252197265625, 1.96728515625, 2.682373046875, 3.3974609375, 4.112548828125, 4.82763671875, 5.542724609375, 6.2578125, 6.972900390625, 7.68798828125, 8.403076171875, 9.1181640625, 9.833251953125, 10.54833984375, 11.263427734375, 11.978515625, 12.693603515625, 13.40869140625, 14.123779296875, 14.8388671875, 15.553955078125, 16.26904296875, 16.984130859375, 17.69921875, 18.414306640625, 19.12939453125, 19.844482421875, 20.5595703125, 21.274658203125, 21.98974609375, 22.704833984375, 23.419921875, 24.135009765625, 24.85009765625, 25.565185546875, 26.2802734375, 26.995361328125, 27.71044921875, 28.425537109375, 29.140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 8.0, 10.0, 11.0, 30.0, 64.0, 108.0, 212.0, 227.0, 143.0, 65.0, 30.0, 31.0, 16.0, 14.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001377105712890625, -0.001331329345703125, -0.001285552978515625, -0.001239776611328125, -0.001194000244140625, -0.001148223876953125, -0.001102447509765625, -0.001056671142578125, -0.001010894775390625, -0.000965118408203125, -0.000919342041015625, -0.000873565673828125, -0.000827789306640625, -0.000782012939453125, -0.000736236572265625, -0.000690460205078125, -0.000644683837890625, -0.000598907470703125, -0.000553131103515625, -0.000507354736328125, -0.000461578369140625, -0.000415802001953125, -0.000370025634765625, -0.000324249267578125, -0.000278472900390625, -0.000232696533203125, -0.000186920166015625, -0.000141143798828125, -9.5367431640625e-05, -4.9591064453125e-05, -3.814697265625e-06, 4.1961669921875e-05, 8.7738037109375e-05, 0.000133514404296875, 0.000179290771484375, 0.000225067138671875, 0.000270843505859375, 0.000316619873046875, 0.000362396240234375, 0.000408172607421875, 0.000453948974609375, 0.000499725341796875, 0.000545501708984375, 0.000591278076171875, 0.000637054443359375, 0.000682830810546875, 0.000728607177734375, 0.000774383544921875, 0.000820159912109375, 0.000865936279296875, 0.000911712646484375, 0.000957489013671875, 0.001003265380859375, 0.001049041748046875, 0.001094818115234375, 0.001140594482421875, 0.001186370849609375, 0.001232147216796875, 0.001277923583984375, 0.001323699951171875, 0.001369476318359375, 0.001415252685546875, 0.001461029052734375, 0.001506805419921875, 0.001552581787109375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 9.0, 18.0, 20.0, 48.0, 66.0, 96.0, 181.0, 308.0, 518.0, 937.0, 1780.0, 3207.0, 6472.0, 14050.0, 32179.0, 76121.0, 175795.0, 296560.0, 238996.0, 113636.0, 47679.0, 20488.0, 9390.0, 4633.0, 2386.0, 1270.0, 697.0, 413.0, 230.0, 136.0, 82.0, 46.0, 42.0, 19.0, 10.0, 12.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5390625, -9.2720947265625, -9.005126953125, -8.7381591796875, -8.47119140625, -8.2042236328125, -7.937255859375, -7.6702880859375, -7.4033203125, -7.1363525390625, -6.869384765625, -6.6024169921875, -6.33544921875, -6.0684814453125, -5.801513671875, -5.5345458984375, -5.267578125, -5.0006103515625, -4.733642578125, -4.4666748046875, -4.19970703125, -3.9327392578125, -3.665771484375, -3.3988037109375, -3.1318359375, -2.8648681640625, -2.597900390625, -2.3309326171875, -2.06396484375, -1.7969970703125, -1.530029296875, -1.2630615234375, -0.99609375, -0.7291259765625, -0.462158203125, -0.1951904296875, 0.07177734375, 0.3387451171875, 0.605712890625, 0.8726806640625, 1.1396484375, 1.4066162109375, 1.673583984375, 1.9405517578125, 2.20751953125, 2.4744873046875, 2.741455078125, 3.0084228515625, 3.275390625, 3.5423583984375, 3.809326171875, 4.0762939453125, 4.34326171875, 4.6102294921875, 4.877197265625, 5.1441650390625, 5.4111328125, 5.6781005859375, 5.945068359375, 6.2120361328125, 6.47900390625, 6.7459716796875, 7.012939453125, 7.2799072265625, 7.546875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 5.0, 5.0, 12.0, 10.0, 22.0, 17.0, 23.0, 29.0, 29.0, 36.0, 30.0, 39.0, 35.0, 37.0, 36.0, 53.0, 37.0, 50.0, 57.0, 49.0, 47.0, 37.0, 34.0, 36.0, 25.0, 23.0, 21.0, 32.0, 24.0, 23.0, 8.0, 14.0, 10.0, 9.0, 6.0, 4.0, 8.0, 5.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.12890625, -3.99749755859375, -3.8660888671875, -3.73468017578125, -3.603271484375, -3.47186279296875, -3.3404541015625, -3.20904541015625, -3.07763671875, -2.94622802734375, -2.8148193359375, -2.68341064453125, -2.552001953125, -2.42059326171875, -2.2891845703125, -2.15777587890625, -2.0263671875, -1.89495849609375, -1.7635498046875, -1.63214111328125, -1.500732421875, -1.36932373046875, -1.2379150390625, -1.10650634765625, -0.97509765625, -0.84368896484375, -0.7122802734375, -0.58087158203125, -0.449462890625, -0.31805419921875, -0.1866455078125, -0.05523681640625, 0.076171875, 0.20758056640625, 0.3389892578125, 0.47039794921875, 0.601806640625, 0.73321533203125, 0.8646240234375, 0.99603271484375, 1.12744140625, 1.25885009765625, 1.3902587890625, 1.52166748046875, 1.653076171875, 1.78448486328125, 1.9158935546875, 2.04730224609375, 2.1787109375, 2.31011962890625, 2.4415283203125, 2.57293701171875, 2.704345703125, 2.83575439453125, 2.9671630859375, 3.09857177734375, 3.22998046875, 3.36138916015625, 3.4927978515625, 3.62420654296875, 3.755615234375, 3.88702392578125, 4.0184326171875, 4.14984130859375, 4.28125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 12.0, 9.0, 29.0, 36.0, 54.0, 91.0, 132.0, 195.0, 148.0, 113.0, 85.0, 39.0, 26.0, 13.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-123.0362548828125, -120.19639587402344, -117.35653686523438, -114.51667785644531, -111.67681884765625, -108.83695983886719, -105.99710083007812, -103.15724182128906, -100.3173828125, -97.47752380371094, -94.63766479492188, -91.79780578613281, -88.95794677734375, -86.11808776855469, -83.27822875976562, -80.43836975097656, -77.59851837158203, -74.75865936279297, -71.9188003540039, -69.07894134521484, -66.23908233642578, -63.39922332763672, -60.55936813354492, -57.71950912475586, -54.8796501159668, -52.039791107177734, -49.19993209838867, -46.360076904296875, -43.52021789550781, -40.68035888671875, -37.84049987792969, -35.000640869140625, -32.16078186035156, -29.3209228515625, -26.481063842773438, -23.641206741333008, -20.801347732543945, -17.961488723754883, -15.121631622314453, -12.28177261352539, -9.441913604736328, -6.602055072784424, -3.7621965408325195, -0.9223384857177734, 1.917520523071289, 4.757379531860352, 7.597236633300781, 10.437095642089844, 13.276954650878906, 16.11681365966797, 18.95667266845703, 21.79652976989746, 24.636388778686523, 27.476247787475586, 30.316104888916016, 33.15596389770508, 35.99582290649414, 38.8356819152832, 41.675540924072266, 44.51539611816406, 47.355255126953125, 50.19511413574219, 53.03497314453125, 55.87483215332031, 58.714691162109375]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 7.0, 16.0, 14.0, 35.0, 47.0, 71.0, 88.0, 97.0, 123.0, 108.0, 103.0, 81.0, 64.0, 58.0, 32.0, 28.0, 13.0, 9.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.49119567871094, -69.84510803222656, -67.19901275634766, -64.55292510986328, -61.906837463378906, -59.260746002197266, -56.614654541015625, -53.96856689453125, -51.322479248046875, -48.676387786865234, -46.03030014038086, -43.38420867919922, -40.738121032714844, -38.0920295715332, -35.44593811035156, -32.79985046386719, -30.153759002685547, -27.50766944885254, -24.86157989501953, -22.21548843383789, -19.569400787353516, -16.923309326171875, -14.277219772338867, -11.63113021850586, -8.985040664672852, -6.338951110839844, -3.6928610801696777, -1.0467710494995117, 1.599318504333496, 4.245408058166504, 6.891498565673828, 9.537588119506836, 12.183677673339844, 14.829767227172852, 17.47585678100586, 20.1219482421875, 22.768035888671875, 25.414127349853516, 28.060216903686523, 30.70630645751953, 33.352394104003906, 35.99848556518555, 38.64457321166992, 41.29066467285156, 43.93675231933594, 46.58284378051758, 49.22893524169922, 51.875022888183594, 54.521114349365234, 57.167205810546875, 59.81329345703125, 62.45938491821289, 65.10547637939453, 67.7515640258789, 70.39765167236328, 73.04374694824219, 75.68983459472656, 78.33592224121094, 80.98201751708984, 83.62810516357422, 86.2741928100586, 88.92028045654297, 91.56637573242188, 94.21246337890625, 96.85855102539062]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 7.0, 10.0, 9.0, 6.0, 13.0, 15.0, 11.0, 16.0, 29.0, 30.0, 46.0, 72.0, 162.0, 385.0, 905.0, 2910.0, 12490.0, 115480.0, 3945689.0, 100393.0, 11708.0, 2649.0, 785.0, 268.0, 77.0, 46.0, 20.0, 15.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-100.9375, -98.7177734375, -96.498046875, -94.2783203125, -92.05859375, -89.8388671875, -87.619140625, -85.3994140625, -83.1796875, -80.9599609375, -78.740234375, -76.5205078125, -74.30078125, -72.0810546875, -69.861328125, -67.6416015625, -65.421875, -63.2021484375, -60.982421875, -58.7626953125, -56.54296875, -54.3232421875, -52.103515625, -49.8837890625, -47.6640625, -45.4443359375, -43.224609375, -41.0048828125, -38.78515625, -36.5654296875, -34.345703125, -32.1259765625, -29.90625, -27.6865234375, -25.466796875, -23.2470703125, -21.02734375, -18.8076171875, -16.587890625, -14.3681640625, -12.1484375, -9.9287109375, -7.708984375, -5.4892578125, -3.26953125, -1.0498046875, 1.169921875, 3.3896484375, 5.609375, 7.8291015625, 10.048828125, 12.2685546875, 14.48828125, 16.7080078125, 18.927734375, 21.1474609375, 23.3671875, 25.5869140625, 27.806640625, 30.0263671875, 32.24609375, 34.4658203125, 36.685546875, 38.9052734375, 41.125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 4.0, 9.0, 13.0, 11.0, 10.0, 20.0, 19.0, 24.0, 29.0, 33.0, 35.0, 46.0, 43.0, 42.0, 62.0, 50.0, 45.0, 53.0, 50.0, 49.0, 44.0, 47.0, 35.0, 35.0, 25.0, 30.0, 22.0, 15.0, 16.0, 15.0, 12.0, 12.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9345703125, -0.9020538330078125, -0.869537353515625, -0.8370208740234375, -0.80450439453125, -0.7719879150390625, -0.739471435546875, -0.7069549560546875, -0.6744384765625, -0.6419219970703125, -0.609405517578125, -0.5768890380859375, -0.54437255859375, -0.5118560791015625, -0.479339599609375, -0.4468231201171875, -0.414306640625, -0.3817901611328125, -0.349273681640625, -0.3167572021484375, -0.28424072265625, -0.2517242431640625, -0.219207763671875, -0.1866912841796875, -0.1541748046875, -0.1216583251953125, -0.089141845703125, -0.0566253662109375, -0.02410888671875, 0.0084075927734375, 0.040924072265625, 0.0734405517578125, 0.10595703125, 0.1384735107421875, 0.170989990234375, 0.2035064697265625, 0.23602294921875, 0.2685394287109375, 0.301055908203125, 0.3335723876953125, 0.3660888671875, 0.3986053466796875, 0.431121826171875, 0.4636383056640625, 0.49615478515625, 0.5286712646484375, 0.561187744140625, 0.5937042236328125, 0.626220703125, 0.6587371826171875, 0.691253662109375, 0.7237701416015625, 0.75628662109375, 0.7888031005859375, 0.821319580078125, 0.8538360595703125, 0.8863525390625, 0.9188690185546875, 0.951385498046875, 0.9839019775390625, 1.01641845703125, 1.0489349365234375, 1.081451416015625, 1.1139678955078125, 1.146484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 11.0, 11.0, 17.0, 18.0, 32.0, 39.0, 94.0, 141.0, 350.0, 1395.0, 15823.0, 3539656.0, 626797.0, 8273.0, 959.0, 288.0, 124.0, 89.0, 52.0, 24.0, 24.0, 16.0, 15.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.0, -122.3896484375, -118.779296875, -115.1689453125, -111.55859375, -107.9482421875, -104.337890625, -100.7275390625, -97.1171875, -93.5068359375, -89.896484375, -86.2861328125, -82.67578125, -79.0654296875, -75.455078125, -71.8447265625, -68.234375, -64.6240234375, -61.013671875, -57.4033203125, -53.79296875, -50.1826171875, -46.572265625, -42.9619140625, -39.3515625, -35.7412109375, -32.130859375, -28.5205078125, -24.91015625, -21.2998046875, -17.689453125, -14.0791015625, -10.46875, -6.8583984375, -3.248046875, 0.3623046875, 3.97265625, 7.5830078125, 11.193359375, 14.8037109375, 18.4140625, 22.0244140625, 25.634765625, 29.2451171875, 32.85546875, 36.4658203125, 40.076171875, 43.6865234375, 47.296875, 50.9072265625, 54.517578125, 58.1279296875, 61.73828125, 65.3486328125, 68.958984375, 72.5693359375, 76.1796875, 79.7900390625, 83.400390625, 87.0107421875, 90.62109375, 94.2314453125, 97.841796875, 101.4521484375, 105.0625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 6.0, 12.0, 20.0, 23.0, 20.0, 29.0, 63.0, 61.0, 90.0, 147.0, 231.0, 416.0, 1345.0, 690.0, 336.0, 187.0, 122.0, 86.0, 51.0, 24.0, 24.0, 14.0, 12.0, 16.0, 6.0, 10.0, 8.0, 4.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.97943115234375, -3.8455810546875, -3.71173095703125, -3.577880859375, -3.44403076171875, -3.3101806640625, -3.17633056640625, -3.04248046875, -2.90863037109375, -2.7747802734375, -2.64093017578125, -2.507080078125, -2.37322998046875, -2.2393798828125, -2.10552978515625, -1.9716796875, -1.83782958984375, -1.7039794921875, -1.57012939453125, -1.436279296875, -1.30242919921875, -1.1685791015625, -1.03472900390625, -0.90087890625, -0.76702880859375, -0.6331787109375, -0.49932861328125, -0.365478515625, -0.23162841796875, -0.0977783203125, 0.03607177734375, 0.169921875, 0.30377197265625, 0.4376220703125, 0.57147216796875, 0.705322265625, 0.83917236328125, 0.9730224609375, 1.10687255859375, 1.24072265625, 1.37457275390625, 1.5084228515625, 1.64227294921875, 1.776123046875, 1.90997314453125, 2.0438232421875, 2.17767333984375, 2.3115234375, 2.44537353515625, 2.5792236328125, 2.71307373046875, 2.846923828125, 2.98077392578125, 3.1146240234375, 3.24847412109375, 3.38232421875, 3.51617431640625, 3.6500244140625, 3.78387451171875, 3.917724609375, 4.05157470703125, 4.1854248046875, 4.31927490234375, 4.453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 3.0, 8.0, 11.0, 17.0, 13.0, 22.0, 26.0, 37.0, 38.0, 52.0, 68.0, 79.0, 87.0, 79.0, 79.0, 82.0, 85.0, 46.0, 40.0, 31.0, 24.0, 13.0, 14.0, 12.0, 5.0, 4.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.251728057861328, -15.519047737121582, -14.786367416381836, -14.053686141967773, -13.321006774902344, -12.588325500488281, -11.855645179748535, -11.122964859008789, -10.390284538269043, -9.657604217529297, -8.92492389678955, -8.192243576049805, -7.4595627784729, -6.726882457733154, -5.99420166015625, -5.261521339416504, -4.528841018676758, -3.7961606979370117, -3.0634801387786865, -2.3307995796203613, -1.5981192588806152, -0.8654389381408691, -0.13275814056396484, 0.5999221801757812, 1.3326025009155273, 2.0652828216552734, 2.7979633808135986, 3.530643939971924, 4.26332426071167, 4.996004581451416, 5.72868537902832, 6.461365699768066, 7.194047927856445, 7.926728248596191, 8.659408569335938, 9.39208984375, 10.12476921081543, 10.857450485229492, 11.590130805969238, 12.322811126708984, 13.05549144744873, 13.788171768188477, 14.520852088928223, 15.253532409667969, 15.986213684082031, 16.71889305114746, 17.451574325561523, 18.184253692626953, 18.916934967041016, 19.649616241455078, 20.382295608520508, 21.11497688293457, 21.84765625, 22.580337524414062, 23.313018798828125, 24.045698165893555, 24.778377532958984, 25.511058807373047, 26.243738174438477, 26.97641944885254, 27.70909881591797, 28.44178009033203, 29.174461364746094, 29.907140731811523, 30.639822006225586]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 12.0, 4.0, 10.0, 12.0, 19.0, 27.0, 22.0, 31.0, 26.0, 26.0, 37.0, 33.0, 35.0, 32.0, 47.0, 58.0, 58.0, 41.0, 43.0, 44.0, 44.0, 37.0, 36.0, 31.0, 24.0, 31.0, 25.0, 19.0, 20.0, 22.0, 16.0, 12.0, 17.0, 13.0, 6.0, 9.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.285501480102539, -12.823211669921875, -12.360921859741211, -11.898632049560547, -11.436342239379883, -10.974052429199219, -10.511762619018555, -10.049471855163574, -9.58718204498291, -9.124892234802246, -8.662602424621582, -8.200312614440918, -7.738022327423096, -7.275732517242432, -6.813442707061768, -6.351152420043945, -5.8888630867004395, -5.426573276519775, -4.964283466339111, -4.501993179321289, -4.039703369140625, -3.577413558959961, -3.115123748779297, -2.6528337001800537, -2.1905438899993896, -1.728253960609436, -1.2659640312194824, -0.8036742210388184, -0.34138429164886475, 0.12090563774108887, 0.5831954479217529, 1.045485496520996, 1.5077753067016602, 1.9700652360916138, 2.4323551654815674, 2.8946449756622314, 3.3569350242614746, 3.8192248344421387, 4.281514644622803, 4.743804931640625, 5.206094741821289, 5.668384552001953, 6.130674362182617, 6.592964172363281, 7.0552544593811035, 7.517544269561768, 7.979834079742432, 8.442124366760254, 8.904413223266602, 9.366703033447266, 9.82899284362793, 10.291282653808594, 10.753572463989258, 11.215862274169922, 11.678152084350586, 12.140442848205566, 12.60273265838623, 13.065022468566895, 13.527312278747559, 13.989602088928223, 14.451891899108887, 14.914182662963867, 15.376472473144531, 15.838762283325195, 16.30105209350586]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 9.0, 4.0, 6.0, 4.0, 15.0, 21.0, 23.0, 28.0, 49.0, 81.0, 110.0, 163.0, 315.0, 512.0, 888.0, 1508.0, 2829.0, 5354.0, 10768.0, 21689.0, 44064.0, 89099.0, 166830.0, 243063.0, 211792.0, 123830.0, 62996.0, 30561.0, 15218.0, 7732.0, 3857.0, 2137.0, 1209.0, 674.0, 406.0, 212.0, 154.0, 102.0, 78.0, 46.0, 39.0, 27.0, 12.0, 18.0, 9.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.9609375, -11.584228515625, -11.20751953125, -10.830810546875, -10.4541015625, -10.077392578125, -9.70068359375, -9.323974609375, -8.947265625, -8.570556640625, -8.19384765625, -7.817138671875, -7.4404296875, -7.063720703125, -6.68701171875, -6.310302734375, -5.93359375, -5.556884765625, -5.18017578125, -4.803466796875, -4.4267578125, -4.050048828125, -3.67333984375, -3.296630859375, -2.919921875, -2.543212890625, -2.16650390625, -1.789794921875, -1.4130859375, -1.036376953125, -0.65966796875, -0.282958984375, 0.09375, 0.470458984375, 0.84716796875, 1.223876953125, 1.6005859375, 1.977294921875, 2.35400390625, 2.730712890625, 3.107421875, 3.484130859375, 3.86083984375, 4.237548828125, 4.6142578125, 4.990966796875, 5.36767578125, 5.744384765625, 6.12109375, 6.497802734375, 6.87451171875, 7.251220703125, 7.6279296875, 8.004638671875, 8.38134765625, 8.758056640625, 9.134765625, 9.511474609375, 9.88818359375, 10.264892578125, 10.6416015625, 11.018310546875, 11.39501953125, 11.771728515625, 12.1484375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 10.0, 12.0, 13.0, 19.0, 18.0, 34.0, 37.0, 41.0, 45.0, 75.0, 69.0, 76.0, 59.0, 65.0, 64.0, 54.0, 42.0, 50.0, 46.0, 27.0, 33.0, 22.0, 20.0, 19.0, 12.0, 9.0, 4.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.7763671875, -1.7316741943359375, -1.686981201171875, -1.6422882080078125, -1.59759521484375, -1.5529022216796875, -1.508209228515625, -1.4635162353515625, -1.4188232421875, -1.3741302490234375, -1.329437255859375, -1.2847442626953125, -1.24005126953125, -1.1953582763671875, -1.150665283203125, -1.1059722900390625, -1.061279296875, -1.0165863037109375, -0.971893310546875, -0.9272003173828125, -0.88250732421875, -0.8378143310546875, -0.793121337890625, -0.7484283447265625, -0.7037353515625, -0.6590423583984375, -0.614349365234375, -0.5696563720703125, -0.52496337890625, -0.4802703857421875, -0.435577392578125, -0.3908843994140625, -0.34619140625, -0.3014984130859375, -0.256805419921875, -0.2121124267578125, -0.16741943359375, -0.1227264404296875, -0.078033447265625, -0.0333404541015625, 0.0113525390625, 0.0560455322265625, 0.100738525390625, 0.1454315185546875, 0.19012451171875, 0.2348175048828125, 0.279510498046875, 0.3242034912109375, 0.368896484375, 0.4135894775390625, 0.458282470703125, 0.5029754638671875, 0.54766845703125, 0.5923614501953125, 0.637054443359375, 0.6817474365234375, 0.7264404296875, 0.7711334228515625, 0.815826416015625, 0.8605194091796875, 0.90521240234375, 0.9499053955078125, 0.994598388671875, 1.0392913818359375, 1.083984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 12.0, 20.0, 24.0, 35.0, 49.0, 58.0, 100.0, 128.0, 198.0, 273.0, 432.0, 677.0, 1086.0, 2051.0, 4229.0, 10064.0, 27076.0, 77830.0, 202458.0, 341179.0, 233457.0, 92812.0, 32236.0, 11692.0, 4828.0, 2279.0, 1183.0, 729.0, 434.0, 277.0, 199.0, 130.0, 95.0, 72.0, 46.0, 21.0, 27.0, 18.0, 14.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.799560546875, -18.23974609375, -17.679931640625, -17.1201171875, -16.560302734375, -16.00048828125, -15.440673828125, -14.880859375, -14.321044921875, -13.76123046875, -13.201416015625, -12.6416015625, -12.081787109375, -11.52197265625, -10.962158203125, -10.40234375, -9.842529296875, -9.28271484375, -8.722900390625, -8.1630859375, -7.603271484375, -7.04345703125, -6.483642578125, -5.923828125, -5.364013671875, -4.80419921875, -4.244384765625, -3.6845703125, -3.124755859375, -2.56494140625, -2.005126953125, -1.4453125, -0.885498046875, -0.32568359375, 0.234130859375, 0.7939453125, 1.353759765625, 1.91357421875, 2.473388671875, 3.033203125, 3.593017578125, 4.15283203125, 4.712646484375, 5.2724609375, 5.832275390625, 6.39208984375, 6.951904296875, 7.51171875, 8.071533203125, 8.63134765625, 9.191162109375, 9.7509765625, 10.310791015625, 10.87060546875, 11.430419921875, 11.990234375, 12.550048828125, 13.10986328125, 13.669677734375, 14.2294921875, 14.789306640625, 15.34912109375, 15.908935546875, 16.46875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 6.0, 11.0, 10.0, 5.0, 7.0, 5.0, 17.0, 18.0, 24.0, 20.0, 15.0, 31.0, 26.0, 34.0, 40.0, 48.0, 31.0, 46.0, 37.0, 37.0, 29.0, 29.0, 40.0, 44.0, 46.0, 46.0, 34.0, 35.0, 43.0, 31.0, 25.0, 16.0, 24.0, 18.0, 16.0, 9.0, 11.0, 5.0, 6.0, 5.0, 2.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.18359375, -6.9678955078125, -6.752197265625, -6.5364990234375, -6.32080078125, -6.1051025390625, -5.889404296875, -5.6737060546875, -5.4580078125, -5.2423095703125, -5.026611328125, -4.8109130859375, -4.59521484375, -4.3795166015625, -4.163818359375, -3.9481201171875, -3.732421875, -3.5167236328125, -3.301025390625, -3.0853271484375, -2.86962890625, -2.6539306640625, -2.438232421875, -2.2225341796875, -2.0068359375, -1.7911376953125, -1.575439453125, -1.3597412109375, -1.14404296875, -0.9283447265625, -0.712646484375, -0.4969482421875, -0.28125, -0.0655517578125, 0.150146484375, 0.3658447265625, 0.58154296875, 0.7972412109375, 1.012939453125, 1.2286376953125, 1.4443359375, 1.6600341796875, 1.875732421875, 2.0914306640625, 2.30712890625, 2.5228271484375, 2.738525390625, 2.9542236328125, 3.169921875, 3.3856201171875, 3.601318359375, 3.8170166015625, 4.03271484375, 4.2484130859375, 4.464111328125, 4.6798095703125, 4.8955078125, 5.1112060546875, 5.326904296875, 5.5426025390625, 5.75830078125, 5.9739990234375, 6.189697265625, 6.4053955078125, 6.62109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 9.0, 14.0, 33.0, 46.0, 71.0, 106.0, 189.0, 265.0, 524.0, 870.0, 1709.0, 3662.0, 8293.0, 21956.0, 68802.0, 222268.0, 398449.0, 216787.0, 67338.0, 21786.0, 8044.0, 3557.0, 1642.0, 842.0, 470.0, 317.0, 156.0, 109.0, 69.0, 54.0, 35.0, 19.0, 22.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.294921875, -11.84765625, -11.400390625, -10.953125, -10.505859375, -10.05859375, -9.611328125, -9.1640625, -8.716796875, -8.26953125, -7.822265625, -7.375, -6.927734375, -6.48046875, -6.033203125, -5.5859375, -5.138671875, -4.69140625, -4.244140625, -3.796875, -3.349609375, -2.90234375, -2.455078125, -2.0078125, -1.560546875, -1.11328125, -0.666015625, -0.21875, 0.228515625, 0.67578125, 1.123046875, 1.5703125, 2.017578125, 2.46484375, 2.912109375, 3.359375, 3.806640625, 4.25390625, 4.701171875, 5.1484375, 5.595703125, 6.04296875, 6.490234375, 6.9375, 7.384765625, 7.83203125, 8.279296875, 8.7265625, 9.173828125, 9.62109375, 10.068359375, 10.515625, 10.962890625, 11.41015625, 11.857421875, 12.3046875, 12.751953125, 13.19921875, 13.646484375, 14.09375, 14.541015625, 14.98828125, 15.435546875, 15.8828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 7.0, 17.0, 21.0, 24.0, 39.0, 50.0, 86.0, 87.0, 122.0, 109.0, 109.0, 104.0, 72.0, 37.0, 38.0, 20.0, 17.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018520355224609375, -0.0017689168453216553, -0.001685798168182373, -0.0016026794910430908, -0.0015195608139038086, -0.0014364421367645264, -0.0013533234596252441, -0.001270204782485962, -0.0011870861053466797, -0.0011039674282073975, -0.0010208487510681152, -0.000937730073928833, -0.0008546113967895508, -0.0007714927196502686, -0.0006883740425109863, -0.0006052553653717041, -0.0005221366882324219, -0.00043901801109313965, -0.0003558993339538574, -0.0002727806568145752, -0.00018966197967529297, -0.00010654330253601074, -2.3424625396728516e-05, 5.969405174255371e-05, 0.00014281272888183594, 0.00022593140602111816, 0.0003090500831604004, 0.0003921687602996826, 0.00047528743743896484, 0.0005584061145782471, 0.0006415247917175293, 0.0007246434688568115, 0.0008077621459960938, 0.000890880823135376, 0.0009739995002746582, 0.0010571181774139404, 0.0011402368545532227, 0.0012233555316925049, 0.0013064742088317871, 0.0013895928859710693, 0.0014727115631103516, 0.0015558302402496338, 0.001638948917388916, 0.0017220675945281982, 0.0018051862716674805, 0.0018883049488067627, 0.001971423625946045, 0.002054542303085327, 0.0021376609802246094, 0.0022207796573638916, 0.002303898334503174, 0.002387017011642456, 0.0024701356887817383, 0.0025532543659210205, 0.0026363730430603027, 0.002719491720199585, 0.002802610397338867, 0.0028857290744781494, 0.0029688477516174316, 0.003051966428756714, 0.003135085105895996, 0.0032182037830352783, 0.0033013224601745605, 0.0033844411373138428, 0.003467559814453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 10.0, 15.0, 18.0, 25.0, 40.0, 53.0, 78.0, 135.0, 182.0, 319.0, 527.0, 963.0, 1964.0, 4159.0, 10503.0, 29785.0, 93503.0, 274610.0, 375550.0, 170946.0, 53797.0, 18185.0, 6919.0, 2909.0, 1414.0, 763.0, 436.0, 241.0, 162.0, 116.0, 67.0, 42.0, 25.0, 21.0, 17.0, 15.0, 8.0, 9.0, 3.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3046875, -11.8841552734375, -11.463623046875, -11.0430908203125, -10.62255859375, -10.2020263671875, -9.781494140625, -9.3609619140625, -8.9404296875, -8.5198974609375, -8.099365234375, -7.6788330078125, -7.25830078125, -6.8377685546875, -6.417236328125, -5.9967041015625, -5.576171875, -5.1556396484375, -4.735107421875, -4.3145751953125, -3.89404296875, -3.4735107421875, -3.052978515625, -2.6324462890625, -2.2119140625, -1.7913818359375, -1.370849609375, -0.9503173828125, -0.52978515625, -0.1092529296875, 0.311279296875, 0.7318115234375, 1.15234375, 1.5728759765625, 1.993408203125, 2.4139404296875, 2.83447265625, 3.2550048828125, 3.675537109375, 4.0960693359375, 4.5166015625, 4.9371337890625, 5.357666015625, 5.7781982421875, 6.19873046875, 6.6192626953125, 7.039794921875, 7.4603271484375, 7.880859375, 8.3013916015625, 8.721923828125, 9.1424560546875, 9.56298828125, 9.9835205078125, 10.404052734375, 10.8245849609375, 11.2451171875, 11.6656494140625, 12.086181640625, 12.5067138671875, 12.92724609375, 13.3477783203125, 13.768310546875, 14.1888427734375, 14.609375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 6.0, 8.0, 12.0, 7.0, 13.0, 12.0, 16.0, 23.0, 19.0, 24.0, 32.0, 42.0, 45.0, 59.0, 51.0, 61.0, 68.0, 47.0, 62.0, 51.0, 55.0, 37.0, 36.0, 31.0, 33.0, 33.0, 22.0, 21.0, 12.0, 14.0, 11.0, 13.0, 7.0, 7.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5546875, -5.38043212890625, -5.2061767578125, -5.03192138671875, -4.857666015625, -4.68341064453125, -4.5091552734375, -4.33489990234375, -4.16064453125, -3.98638916015625, -3.8121337890625, -3.63787841796875, -3.463623046875, -3.28936767578125, -3.1151123046875, -2.94085693359375, -2.7666015625, -2.59234619140625, -2.4180908203125, -2.24383544921875, -2.069580078125, -1.89532470703125, -1.7210693359375, -1.54681396484375, -1.37255859375, -1.19830322265625, -1.0240478515625, -0.84979248046875, -0.675537109375, -0.50128173828125, -0.3270263671875, -0.15277099609375, 0.021484375, 0.19573974609375, 0.3699951171875, 0.54425048828125, 0.718505859375, 0.89276123046875, 1.0670166015625, 1.24127197265625, 1.41552734375, 1.58978271484375, 1.7640380859375, 1.93829345703125, 2.112548828125, 2.28680419921875, 2.4610595703125, 2.63531494140625, 2.8095703125, 2.98382568359375, 3.1580810546875, 3.33233642578125, 3.506591796875, 3.68084716796875, 3.8551025390625, 4.02935791015625, 4.20361328125, 4.37786865234375, 4.5521240234375, 4.72637939453125, 4.900634765625, 5.07489013671875, 5.2491455078125, 5.42340087890625, 5.59765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 15.0, 10.0, 18.0, 31.0, 68.0, 105.0, 175.0, 156.0, 168.0, 102.0, 61.0, 37.0, 15.0, 17.0, 8.0, 3.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.0747833251953, -165.66006469726562, -160.245361328125, -154.8306427001953, -149.41592407226562, -144.001220703125, -138.5865020751953, -133.17178344726562, -127.75707244873047, -122.34236145019531, -116.92764282226562, -111.51293182373047, -106.09822082519531, -100.68350219726562, -95.26879119873047, -89.85408020019531, -84.43936157226562, -79.02465057373047, -73.60993194580078, -68.19522094726562, -62.7805061340332, -57.36579132080078, -51.951080322265625, -46.5363655090332, -41.12165069580078, -35.70693588256836, -30.29222297668457, -24.87751007080078, -19.46279525756836, -14.048080444335938, -8.633369445800781, -3.2186546325683594, 2.196075439453125, 7.6107892990112305, 13.025503158569336, 18.440216064453125, 23.854930877685547, 29.26964569091797, 34.684356689453125, 40.09907150268555, 45.51378631591797, 50.92850112915039, 56.34321594238281, 61.75792694091797, 67.17263793945312, 72.58735656738281, 78.00206756591797, 83.41677856445312, 88.83149719238281, 94.24620819091797, 99.66092681884766, 105.07563781738281, 110.4903564453125, 115.90506744384766, 121.31977844238281, 126.7344970703125, 132.14920043945312, 137.5639190673828, 142.97862243652344, 148.39334106445312, 153.8080596923828, 159.2227783203125, 164.63748168945312, 170.0522003173828, 175.4669189453125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 6.0, 16.0, 11.0, 15.0, 18.0, 33.0, 41.0, 34.0, 43.0, 50.0, 44.0, 58.0, 62.0, 57.0, 53.0, 63.0, 59.0, 46.0, 55.0, 38.0, 35.0, 33.0, 24.0, 20.0, 15.0, 16.0, 8.0, 11.0, 8.0, 5.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.20414733886719, -79.92383575439453, -77.64352416992188, -75.36321258544922, -73.08290100097656, -70.8025894165039, -68.52227783203125, -66.24197387695312, -63.9616584777832, -61.68134689331055, -59.40103530883789, -57.120723724365234, -54.840415954589844, -52.56010437011719, -50.27979278564453, -47.999481201171875, -45.71916961669922, -43.43885803222656, -41.158546447753906, -38.87823486328125, -36.597923278808594, -34.31761169433594, -32.03730392456055, -29.75699234008789, -27.476680755615234, -25.196369171142578, -22.916057586669922, -20.6357479095459, -18.355436325073242, -16.075124740600586, -13.794814109802246, -11.514503479003906, -9.234184265136719, -6.953873157501221, -4.673562049865723, -2.3932509422302246, -0.11293983459472656, 2.1673717498779297, 4.4476823806762695, 6.727993011474609, 9.008304595947266, 11.288616180419922, 13.568926811218262, 15.849237442016602, 18.129549026489258, 20.409860610961914, 22.690170288085938, 24.970481872558594, 27.25079345703125, 29.531105041503906, 31.811416625976562, 34.09172821044922, 36.372039794921875, 38.65235137939453, 40.93265914916992, 43.21297073364258, 45.493282318115234, 47.77359390258789, 50.05390548706055, 52.3342170715332, 54.614524841308594, 56.89483642578125, 59.175148010253906, 61.45545959472656, 63.73577117919922]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 11.0, 12.0, 24.0, 32.0, 53.0, 95.0, 135.0, 249.0, 565.0, 1492.0, 6250.0, 39249.0, 2761268.0, 1340776.0, 36684.0, 5605.0, 1153.0, 314.0, 114.0, 57.0, 37.0, 26.0, 23.0, 15.0, 12.0, 9.0, 3.0, 6.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.875, -90.36328125, -87.8515625, -85.33984375, -82.828125, -80.31640625, -77.8046875, -75.29296875, -72.78125, -70.26953125, -67.7578125, -65.24609375, -62.734375, -60.22265625, -57.7109375, -55.19921875, -52.6875, -50.17578125, -47.6640625, -45.15234375, -42.640625, -40.12890625, -37.6171875, -35.10546875, -32.59375, -30.08203125, -27.5703125, -25.05859375, -22.546875, -20.03515625, -17.5234375, -15.01171875, -12.5, -9.98828125, -7.4765625, -4.96484375, -2.453125, 0.05859375, 2.5703125, 5.08203125, 7.59375, 10.10546875, 12.6171875, 15.12890625, 17.640625, 20.15234375, 22.6640625, 25.17578125, 27.6875, 30.19921875, 32.7109375, 35.22265625, 37.734375, 40.24609375, 42.7578125, 45.26953125, 47.78125, 50.29296875, 52.8046875, 55.31640625, 57.828125, 60.33984375, 62.8515625, 65.36328125, 67.875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 23.0, 25.0, 28.0, 22.0, 50.0, 60.0, 67.0, 83.0, 74.0, 67.0, 74.0, 69.0, 65.0, 46.0, 43.0, 46.0, 27.0, 32.0, 14.0, 19.0, 12.0, 10.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.74609375, -2.6749267578125, -2.603759765625, -2.5325927734375, -2.46142578125, -2.3902587890625, -2.319091796875, -2.2479248046875, -2.1767578125, -2.1055908203125, -2.034423828125, -1.9632568359375, -1.89208984375, -1.8209228515625, -1.749755859375, -1.6785888671875, -1.607421875, -1.5362548828125, -1.465087890625, -1.3939208984375, -1.32275390625, -1.2515869140625, -1.180419921875, -1.1092529296875, -1.0380859375, -0.9669189453125, -0.895751953125, -0.8245849609375, -0.75341796875, -0.6822509765625, -0.611083984375, -0.5399169921875, -0.46875, -0.3975830078125, -0.326416015625, -0.2552490234375, -0.18408203125, -0.1129150390625, -0.041748046875, 0.0294189453125, 0.1005859375, 0.1717529296875, 0.242919921875, 0.3140869140625, 0.38525390625, 0.4564208984375, 0.527587890625, 0.5987548828125, 0.669921875, 0.7410888671875, 0.812255859375, 0.8834228515625, 0.95458984375, 1.0257568359375, 1.096923828125, 1.1680908203125, 1.2392578125, 1.3104248046875, 1.381591796875, 1.4527587890625, 1.52392578125, 1.5950927734375, 1.666259765625, 1.7374267578125, 1.80859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 1.0, 4.0, 4.0, 17.0, 14.0, 12.0, 16.0, 29.0, 25.0, 56.0, 73.0, 162.0, 283.0, 753.0, 2592.0, 10330.0, 62120.0, 965665.0, 3030253.0, 101999.0, 15009.0, 3193.0, 877.0, 327.0, 155.0, 97.0, 58.0, 41.0, 23.0, 21.0, 16.0, 15.0, 10.0, 9.0, 5.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.59375, -42.74462890625, -40.8955078125, -39.04638671875, -37.197265625, -35.34814453125, -33.4990234375, -31.64990234375, -29.80078125, -27.95166015625, -26.1025390625, -24.25341796875, -22.404296875, -20.55517578125, -18.7060546875, -16.85693359375, -15.0078125, -13.15869140625, -11.3095703125, -9.46044921875, -7.611328125, -5.76220703125, -3.9130859375, -2.06396484375, -0.21484375, 1.63427734375, 3.4833984375, 5.33251953125, 7.181640625, 9.03076171875, 10.8798828125, 12.72900390625, 14.578125, 16.42724609375, 18.2763671875, 20.12548828125, 21.974609375, 23.82373046875, 25.6728515625, 27.52197265625, 29.37109375, 31.22021484375, 33.0693359375, 34.91845703125, 36.767578125, 38.61669921875, 40.4658203125, 42.31494140625, 44.1640625, 46.01318359375, 47.8623046875, 49.71142578125, 51.560546875, 53.40966796875, 55.2587890625, 57.10791015625, 58.95703125, 60.80615234375, 62.6552734375, 64.50439453125, 66.353515625, 68.20263671875, 70.0517578125, 71.90087890625, 73.75]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 6.0, 11.0, 14.0, 20.0, 25.0, 21.0, 38.0, 74.0, 96.0, 188.0, 282.0, 622.0, 1408.0, 534.0, 275.0, 146.0, 104.0, 67.0, 44.0, 22.0, 15.0, 14.0, 13.0, 9.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55859375, -6.32781982421875, -6.0970458984375, -5.86627197265625, -5.635498046875, -5.40472412109375, -5.1739501953125, -4.94317626953125, -4.71240234375, -4.48162841796875, -4.2508544921875, -4.02008056640625, -3.789306640625, -3.55853271484375, -3.3277587890625, -3.09698486328125, -2.8662109375, -2.63543701171875, -2.4046630859375, -2.17388916015625, -1.943115234375, -1.71234130859375, -1.4815673828125, -1.25079345703125, -1.02001953125, -0.78924560546875, -0.5584716796875, -0.32769775390625, -0.096923828125, 0.13385009765625, 0.3646240234375, 0.59539794921875, 0.826171875, 1.05694580078125, 1.2877197265625, 1.51849365234375, 1.749267578125, 1.98004150390625, 2.2108154296875, 2.44158935546875, 2.67236328125, 2.90313720703125, 3.1339111328125, 3.36468505859375, 3.595458984375, 3.82623291015625, 4.0570068359375, 4.28778076171875, 4.5185546875, 4.74932861328125, 4.9801025390625, 5.21087646484375, 5.441650390625, 5.67242431640625, 5.9031982421875, 6.13397216796875, 6.36474609375, 6.59552001953125, 6.8262939453125, 7.05706787109375, 7.287841796875, 7.51861572265625, 7.7493896484375, 7.98016357421875, 8.2109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 11.0, 10.0, 10.0, 33.0, 39.0, 72.0, 106.0, 110.0, 148.0, 139.0, 108.0, 84.0, 54.0, 24.0, 20.0, 11.0, 10.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.40202331542969, -75.40481567382812, -73.4076156616211, -71.41040802001953, -69.41320037841797, -67.41600036621094, -65.41879272460938, -63.42158889770508, -61.42438507080078, -59.427181243896484, -57.42997360229492, -55.432769775390625, -53.43556594848633, -51.43836212158203, -49.44115447998047, -47.44395065307617, -45.44674301147461, -43.44953918457031, -41.45233154296875, -39.45512771606445, -37.457923889160156, -35.460716247558594, -33.4635124206543, -31.46630859375, -29.46910285949707, -27.47189712524414, -25.474693298339844, -23.477487564086914, -21.480281829833984, -19.483078002929688, -17.485872268676758, -15.488667488098145, -13.491462707519531, -11.494257926940918, -9.497053146362305, -7.499847412109375, -5.502642631530762, -3.5054378509521484, -1.5082321166992188, 0.48897266387939453, 2.486177444458008, 4.483382225036621, 6.480587482452393, 8.477792739868164, 10.474997520446777, 12.47220230102539, 14.46940803527832, 16.46661376953125, 18.463817596435547, 20.461023330688477, 22.458227157592773, 24.455432891845703, 26.45263671875, 28.44984245300293, 30.44704818725586, 32.444252014160156, 34.44145965576172, 36.438663482666016, 38.43587112426758, 40.433074951171875, 42.43027877807617, 44.42748260498047, 46.42469024658203, 48.42189407348633, 50.419097900390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 7.0, 2.0, 6.0, 7.0, 15.0, 19.0, 14.0, 26.0, 22.0, 38.0, 32.0, 27.0, 23.0, 34.0, 37.0, 33.0, 44.0, 49.0, 49.0, 42.0, 46.0, 49.0, 55.0, 32.0, 39.0, 32.0, 30.0, 32.0, 33.0, 25.0, 22.0, 16.0, 18.0, 10.0, 8.0, 9.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.50879669189453, -22.656274795532227, -21.803754806518555, -20.95123291015625, -20.098712921142578, -19.246191024780273, -18.39366912841797, -17.541149139404297, -16.688629150390625, -15.836108207702637, -14.983587265014648, -14.131065368652344, -13.278545379638672, -12.426023483276367, -11.573502540588379, -10.72098159790039, -9.868459701538086, -9.015938758850098, -8.16341781616211, -7.310896396636963, -6.458375453948975, -5.605854511260986, -4.75333309173584, -3.9008121490478516, -3.0482912063598633, -2.195770263671875, -1.3432490825653076, -0.49072790145874023, 0.36179304122924805, 1.2143139839172363, 2.066835403442383, 2.919356346130371, 3.771879196166992, 4.6244001388549805, 5.476921081542969, 6.329442501068115, 7.1819634437561035, 8.03448486328125, 8.887005805969238, 9.739526748657227, 10.592047691345215, 11.444568634033203, 12.297089576721191, 13.14961051940918, 14.002132415771484, 14.854652404785156, 15.707174301147461, 16.559696197509766, 17.412216186523438, 18.264738082885742, 19.117258071899414, 19.96977996826172, 20.82229995727539, 21.674821853637695, 22.52734375, 23.379863739013672, 24.232383728027344, 25.08490562438965, 25.93742561340332, 26.789947509765625, 27.642467498779297, 28.4949893951416, 29.347511291503906, 30.200031280517578, 31.052553176879883]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 0.0, 5.0, 5.0, 9.0, 8.0, 17.0, 16.0, 27.0, 54.0, 66.0, 95.0, 138.0, 202.0, 249.0, 423.0, 576.0, 958.0, 1786.0, 3721.0, 8773.0, 24107.0, 69050.0, 180749.0, 322013.0, 257312.0, 112466.0, 40408.0, 14004.0, 5420.0, 2476.0, 1264.0, 703.0, 398.0, 285.0, 214.0, 152.0, 91.0, 83.0, 71.0, 40.0, 33.0, 28.0, 14.0, 13.0, 10.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.015625, -18.434814453125, -17.85400390625, -17.273193359375, -16.6923828125, -16.111572265625, -15.53076171875, -14.949951171875, -14.369140625, -13.788330078125, -13.20751953125, -12.626708984375, -12.0458984375, -11.465087890625, -10.88427734375, -10.303466796875, -9.72265625, -9.141845703125, -8.56103515625, -7.980224609375, -7.3994140625, -6.818603515625, -6.23779296875, -5.656982421875, -5.076171875, -4.495361328125, -3.91455078125, -3.333740234375, -2.7529296875, -2.172119140625, -1.59130859375, -1.010498046875, -0.4296875, 0.151123046875, 0.73193359375, 1.312744140625, 1.8935546875, 2.474365234375, 3.05517578125, 3.635986328125, 4.216796875, 4.797607421875, 5.37841796875, 5.959228515625, 6.5400390625, 7.120849609375, 7.70166015625, 8.282470703125, 8.86328125, 9.444091796875, 10.02490234375, 10.605712890625, 11.1865234375, 11.767333984375, 12.34814453125, 12.928955078125, 13.509765625, 14.090576171875, 14.67138671875, 15.252197265625, 15.8330078125, 16.413818359375, 16.99462890625, 17.575439453125, 18.15625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 7.0, 10.0, 17.0, 25.0, 34.0, 36.0, 68.0, 73.0, 83.0, 105.0, 72.0, 89.0, 72.0, 64.0, 68.0, 47.0, 45.0, 30.0, 14.0, 14.0, 6.0, 8.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.505859375, -3.4100341796875, -3.314208984375, -3.2183837890625, -3.12255859375, -3.0267333984375, -2.930908203125, -2.8350830078125, -2.7392578125, -2.6434326171875, -2.547607421875, -2.4517822265625, -2.35595703125, -2.2601318359375, -2.164306640625, -2.0684814453125, -1.97265625, -1.8768310546875, -1.781005859375, -1.6851806640625, -1.58935546875, -1.4935302734375, -1.397705078125, -1.3018798828125, -1.2060546875, -1.1102294921875, -1.014404296875, -0.9185791015625, -0.82275390625, -0.7269287109375, -0.631103515625, -0.5352783203125, -0.439453125, -0.3436279296875, -0.247802734375, -0.1519775390625, -0.05615234375, 0.0396728515625, 0.135498046875, 0.2313232421875, 0.3271484375, 0.4229736328125, 0.518798828125, 0.6146240234375, 0.71044921875, 0.8062744140625, 0.902099609375, 0.9979248046875, 1.09375, 1.1895751953125, 1.285400390625, 1.3812255859375, 1.47705078125, 1.5728759765625, 1.668701171875, 1.7645263671875, 1.8603515625, 1.9561767578125, 2.052001953125, 2.1478271484375, 2.24365234375, 2.3394775390625, 2.435302734375, 2.5311279296875, 2.626953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 6.0, 15.0, 13.0, 23.0, 44.0, 58.0, 90.0, 133.0, 172.0, 248.0, 405.0, 717.0, 1161.0, 2222.0, 4920.0, 13536.0, 45617.0, 165341.0, 403871.0, 285200.0, 85612.0, 24264.0, 7777.0, 3092.0, 1609.0, 859.0, 522.0, 341.0, 213.0, 175.0, 88.0, 48.0, 49.0, 32.0, 20.0, 15.0, 8.0, 15.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.234375, -24.486572265625, -23.73876953125, -22.990966796875, -22.2431640625, -21.495361328125, -20.74755859375, -19.999755859375, -19.251953125, -18.504150390625, -17.75634765625, -17.008544921875, -16.2607421875, -15.512939453125, -14.76513671875, -14.017333984375, -13.26953125, -12.521728515625, -11.77392578125, -11.026123046875, -10.2783203125, -9.530517578125, -8.78271484375, -8.034912109375, -7.287109375, -6.539306640625, -5.79150390625, -5.043701171875, -4.2958984375, -3.548095703125, -2.80029296875, -2.052490234375, -1.3046875, -0.556884765625, 0.19091796875, 0.938720703125, 1.6865234375, 2.434326171875, 3.18212890625, 3.929931640625, 4.677734375, 5.425537109375, 6.17333984375, 6.921142578125, 7.6689453125, 8.416748046875, 9.16455078125, 9.912353515625, 10.66015625, 11.407958984375, 12.15576171875, 12.903564453125, 13.6513671875, 14.399169921875, 15.14697265625, 15.894775390625, 16.642578125, 17.390380859375, 18.13818359375, 18.885986328125, 19.6337890625, 20.381591796875, 21.12939453125, 21.877197265625, 22.625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 10.0, 10.0, 11.0, 18.0, 27.0, 32.0, 26.0, 34.0, 45.0, 38.0, 49.0, 49.0, 37.0, 52.0, 47.0, 50.0, 45.0, 47.0, 60.0, 47.0, 49.0, 44.0, 26.0, 26.0, 26.0, 15.0, 19.0, 12.0, 11.0, 7.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5625, -14.1451416015625, -13.727783203125, -13.3104248046875, -12.89306640625, -12.4757080078125, -12.058349609375, -11.6409912109375, -11.2236328125, -10.8062744140625, -10.388916015625, -9.9715576171875, -9.55419921875, -9.1368408203125, -8.719482421875, -8.3021240234375, -7.884765625, -7.4674072265625, -7.050048828125, -6.6326904296875, -6.21533203125, -5.7979736328125, -5.380615234375, -4.9632568359375, -4.5458984375, -4.1285400390625, -3.711181640625, -3.2938232421875, -2.87646484375, -2.4591064453125, -2.041748046875, -1.6243896484375, -1.20703125, -0.7896728515625, -0.372314453125, 0.0450439453125, 0.46240234375, 0.8797607421875, 1.297119140625, 1.7144775390625, 2.1318359375, 2.5491943359375, 2.966552734375, 3.3839111328125, 3.80126953125, 4.2186279296875, 4.635986328125, 5.0533447265625, 5.470703125, 5.8880615234375, 6.305419921875, 6.7227783203125, 7.14013671875, 7.5574951171875, 7.974853515625, 8.3922119140625, 8.8095703125, 9.2269287109375, 9.644287109375, 10.0616455078125, 10.47900390625, 10.8963623046875, 11.313720703125, 11.7310791015625, 12.1484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 12.0, 14.0, 46.0, 97.0, 212.0, 520.0, 1563.0, 8117.0, 143068.0, 827432.0, 60673.0, 4914.0, 1118.0, 383.0, 183.0, 91.0, 32.0, 24.0, 16.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.8828125, -33.734375, -32.5859375, -31.4375, -30.2890625, -29.140625, -27.9921875, -26.84375, -25.6953125, -24.546875, -23.3984375, -22.25, -21.1015625, -19.953125, -18.8046875, -17.65625, -16.5078125, -15.359375, -14.2109375, -13.0625, -11.9140625, -10.765625, -9.6171875, -8.46875, -7.3203125, -6.171875, -5.0234375, -3.875, -2.7265625, -1.578125, -0.4296875, 0.71875, 1.8671875, 3.015625, 4.1640625, 5.3125, 6.4609375, 7.609375, 8.7578125, 9.90625, 11.0546875, 12.203125, 13.3515625, 14.5, 15.6484375, 16.796875, 17.9453125, 19.09375, 20.2421875, 21.390625, 22.5390625, 23.6875, 24.8359375, 25.984375, 27.1328125, 28.28125, 29.4296875, 30.578125, 31.7265625, 32.875, 34.0234375, 35.171875, 36.3203125, 37.46875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 10.0, 5.0, 12.0, 11.0, 14.0, 27.0, 35.0, 34.0, 61.0, 52.0, 84.0, 79.0, 100.0, 86.0, 71.0, 67.0, 49.0, 41.0, 36.0, 27.0, 15.0, 12.0, 8.0, 10.0, 10.0, 6.0, 7.0, 3.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.002193450927734375, -0.002135351300239563, -0.002077251672744751, -0.002019152045249939, -0.001961052417755127, -0.001902952790260315, -0.001844853162765503, -0.001786753535270691, -0.001728653907775879, -0.001670554280281067, -0.0016124546527862549, -0.0015543550252914429, -0.0014962553977966309, -0.0014381557703018188, -0.0013800561428070068, -0.0013219565153121948, -0.0012638568878173828, -0.0012057572603225708, -0.0011476576328277588, -0.0010895580053329468, -0.0010314583778381348, -0.0009733587503433228, -0.0009152591228485107, -0.0008571594953536987, -0.0007990598678588867, -0.0007409602403640747, -0.0006828606128692627, -0.0006247609853744507, -0.0005666613578796387, -0.0005085617303848267, -0.00045046210289001465, -0.00039236247539520264, -0.0003342628479003906, -0.0002761632204055786, -0.0002180635929107666, -0.0001599639654159546, -0.00010186433792114258, -4.3764710426330566e-05, 1.4334917068481445e-05, 7.243454456329346e-05, 0.00013053417205810547, 0.00018863379955291748, 0.0002467334270477295, 0.0003048330545425415, 0.0003629326820373535, 0.00042103230953216553, 0.00047913193702697754, 0.0005372315645217896, 0.0005953311920166016, 0.0006534308195114136, 0.0007115304470062256, 0.0007696300745010376, 0.0008277297019958496, 0.0008858293294906616, 0.0009439289569854736, 0.0010020285844802856, 0.0010601282119750977, 0.0011182278394699097, 0.0011763274669647217, 0.0012344270944595337, 0.0012925267219543457, 0.0013506263494491577, 0.0014087259769439697, 0.0014668256044387817, 0.0015249252319335938]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 6.0, 4.0, 9.0, 18.0, 19.0, 32.0, 37.0, 91.0, 163.0, 256.0, 518.0, 994.0, 2340.0, 6880.0, 29146.0, 188219.0, 601217.0, 179322.0, 28068.0, 6725.0, 2335.0, 1021.0, 474.0, 238.0, 168.0, 95.0, 64.0, 37.0, 28.0, 9.0, 11.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.8603515625, -18.220703125, -17.5810546875, -16.94140625, -16.3017578125, -15.662109375, -15.0224609375, -14.3828125, -13.7431640625, -13.103515625, -12.4638671875, -11.82421875, -11.1845703125, -10.544921875, -9.9052734375, -9.265625, -8.6259765625, -7.986328125, -7.3466796875, -6.70703125, -6.0673828125, -5.427734375, -4.7880859375, -4.1484375, -3.5087890625, -2.869140625, -2.2294921875, -1.58984375, -0.9501953125, -0.310546875, 0.3291015625, 0.96875, 1.6083984375, 2.248046875, 2.8876953125, 3.52734375, 4.1669921875, 4.806640625, 5.4462890625, 6.0859375, 6.7255859375, 7.365234375, 8.0048828125, 8.64453125, 9.2841796875, 9.923828125, 10.5634765625, 11.203125, 11.8427734375, 12.482421875, 13.1220703125, 13.76171875, 14.4013671875, 15.041015625, 15.6806640625, 16.3203125, 16.9599609375, 17.599609375, 18.2392578125, 18.87890625, 19.5185546875, 20.158203125, 20.7978515625, 21.4375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 9.0, 11.0, 12.0, 22.0, 25.0, 36.0, 36.0, 63.0, 70.0, 93.0, 106.0, 89.0, 78.0, 50.0, 58.0, 52.0, 42.0, 38.0, 30.0, 26.0, 15.0, 8.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.5626220703125, -6.265869140625, -5.9691162109375, -5.67236328125, -5.3756103515625, -5.078857421875, -4.7821044921875, -4.4853515625, -4.1885986328125, -3.891845703125, -3.5950927734375, -3.29833984375, -3.0015869140625, -2.704833984375, -2.4080810546875, -2.111328125, -1.8145751953125, -1.517822265625, -1.2210693359375, -0.92431640625, -0.6275634765625, -0.330810546875, -0.0340576171875, 0.2626953125, 0.5594482421875, 0.856201171875, 1.1529541015625, 1.44970703125, 1.7464599609375, 2.043212890625, 2.3399658203125, 2.63671875, 2.9334716796875, 3.230224609375, 3.5269775390625, 3.82373046875, 4.1204833984375, 4.417236328125, 4.7139892578125, 5.0107421875, 5.3074951171875, 5.604248046875, 5.9010009765625, 6.19775390625, 6.4945068359375, 6.791259765625, 7.0880126953125, 7.384765625, 7.6815185546875, 7.978271484375, 8.2750244140625, 8.57177734375, 8.8685302734375, 9.165283203125, 9.4620361328125, 9.7587890625, 10.0555419921875, 10.352294921875, 10.6490478515625, 10.94580078125, 11.2425537109375, 11.539306640625, 11.8360595703125, 12.1328125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 17.0, 22.0, 53.0, 77.0, 134.0, 172.0, 169.0, 140.0, 89.0, 56.0, 31.0, 10.0, 10.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.27069091796875, -200.38583374023438, -194.5009765625, -188.61611938476562, -182.73126220703125, -176.84640502929688, -170.9615478515625, -165.0767059326172, -159.1918487548828, -153.30699157714844, -147.42213439941406, -141.5372772216797, -135.6524200439453, -129.767578125, -123.8827133178711, -117.99786376953125, -112.11299896240234, -106.22814178466797, -100.3432846069336, -94.45843505859375, -88.57357788085938, -82.688720703125, -76.80386352539062, -70.91900634765625, -65.03414916992188, -59.1492919921875, -53.26443862915039, -47.379581451416016, -41.494728088378906, -35.60987091064453, -29.725013732910156, -23.840160369873047, -17.955307006835938, -12.070451736450195, -6.185595512390137, -0.3007392883300781, 5.584115982055664, 11.468971252441406, 17.35382843017578, 23.23868179321289, 29.123538970947266, 35.00839614868164, 40.89324951171875, 46.778106689453125, 52.6629638671875, 58.54781723022461, 64.43267822265625, 70.3175277709961, 76.20238494873047, 82.08724212646484, 87.97209930419922, 93.85694885253906, 99.74180603027344, 105.62666320800781, 111.51152038574219, 117.39637756347656, 123.28123474121094, 129.1660919189453, 135.0509490966797, 140.93580627441406, 146.82066345214844, 152.70550537109375, 158.59036254882812, 164.4752197265625, 170.36007690429688]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 8.0, 12.0, 10.0, 10.0, 29.0, 30.0, 19.0, 27.0, 28.0, 43.0, 47.0, 38.0, 46.0, 56.0, 51.0, 55.0, 55.0, 60.0, 62.0, 50.0, 40.0, 40.0, 30.0, 36.0, 21.0, 27.0, 21.0, 17.0, 4.0, 7.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-106.69535827636719, -103.6173324584961, -100.53931427001953, -97.46128845214844, -94.38327026367188, -91.30524444580078, -88.22721862792969, -85.14920043945312, -82.07118225097656, -78.99315643310547, -75.9151382446289, -72.83711242675781, -69.75909423828125, -66.68106842041016, -63.60304641723633, -60.5250244140625, -57.446998596191406, -54.36897659301758, -51.29095458984375, -48.212928771972656, -45.134910583496094, -42.056884765625, -38.97886276245117, -35.900840759277344, -32.822818756103516, -29.744796752929688, -26.66677474975586, -23.5887508392334, -20.51072883605957, -17.432706832885742, -14.354682922363281, -11.276660919189453, -8.198646545410156, -5.12062406539917, -2.0426015853881836, 1.035421371459961, 4.113443374633789, 7.191465377807617, 10.269489288330078, 13.347511291503906, 16.425533294677734, 19.503555297851562, 22.58157730102539, 25.65960121154785, 28.73762321472168, 31.815645217895508, 34.89366912841797, 37.9716911315918, 41.049713134765625, 44.12773513793945, 47.20575714111328, 50.283782958984375, 53.36180114746094, 56.43982696533203, 59.51784896850586, 62.59587097167969, 65.67388916015625, 68.75191497802734, 71.8299331665039, 74.907958984375, 77.98597717285156, 81.06400299072266, 84.14202880859375, 87.22004699707031, 90.2980728149414]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 8.0, 9.0, 11.0, 10.0, 12.0, 23.0, 32.0, 50.0, 62.0, 130.0, 194.0, 472.0, 1226.0, 3736.0, 14035.0, 83615.0, 3769360.0, 284324.0, 27181.0, 6395.0, 2040.0, 703.0, 295.0, 149.0, 71.0, 42.0, 27.0, 23.0, 15.0, 12.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-68.0625, -66.4306640625, -64.798828125, -63.1669921875, -61.53515625, -59.9033203125, -58.271484375, -56.6396484375, -55.0078125, -53.3759765625, -51.744140625, -50.1123046875, -48.48046875, -46.8486328125, -45.216796875, -43.5849609375, -41.953125, -40.3212890625, -38.689453125, -37.0576171875, -35.42578125, -33.7939453125, -32.162109375, -30.5302734375, -28.8984375, -27.2666015625, -25.634765625, -24.0029296875, -22.37109375, -20.7392578125, -19.107421875, -17.4755859375, -15.84375, -14.2119140625, -12.580078125, -10.9482421875, -9.31640625, -7.6845703125, -6.052734375, -4.4208984375, -2.7890625, -1.1572265625, 0.474609375, 2.1064453125, 3.73828125, 5.3701171875, 7.001953125, 8.6337890625, 10.265625, 11.8974609375, 13.529296875, 15.1611328125, 16.79296875, 18.4248046875, 20.056640625, 21.6884765625, 23.3203125, 24.9521484375, 26.583984375, 28.2158203125, 29.84765625, 31.4794921875, 33.111328125, 34.7431640625, 36.375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 6.0, 11.0, 9.0, 8.0, 15.0, 10.0, 20.0, 30.0, 26.0, 31.0, 31.0, 46.0, 40.0, 61.0, 53.0, 46.0, 60.0, 51.0, 57.0, 40.0, 55.0, 35.0, 39.0, 39.0, 39.0, 30.0, 24.0, 24.0, 12.0, 15.0, 6.0, 14.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.9453125, -2.8698883056640625, -2.794464111328125, -2.7190399169921875, -2.64361572265625, -2.5681915283203125, -2.492767333984375, -2.4173431396484375, -2.3419189453125, -2.2664947509765625, -2.191070556640625, -2.1156463623046875, -2.04022216796875, -1.9647979736328125, -1.889373779296875, -1.8139495849609375, -1.738525390625, -1.6631011962890625, -1.587677001953125, -1.5122528076171875, -1.43682861328125, -1.3614044189453125, -1.285980224609375, -1.2105560302734375, -1.1351318359375, -1.0597076416015625, -0.984283447265625, -0.9088592529296875, -0.83343505859375, -0.7580108642578125, -0.682586669921875, -0.6071624755859375, -0.53173828125, -0.4563140869140625, -0.380889892578125, -0.3054656982421875, -0.23004150390625, -0.1546173095703125, -0.079193115234375, -0.0037689208984375, 0.0716552734375, 0.1470794677734375, 0.222503662109375, 0.2979278564453125, 0.37335205078125, 0.4487762451171875, 0.524200439453125, 0.5996246337890625, 0.675048828125, 0.7504730224609375, 0.825897216796875, 0.9013214111328125, 0.97674560546875, 1.0521697998046875, 1.127593994140625, 1.2030181884765625, 1.2784423828125, 1.3538665771484375, 1.429290771484375, 1.5047149658203125, 1.58013916015625, 1.6555633544921875, 1.730987548828125, 1.8064117431640625, 1.8818359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 12.0, 15.0, 29.0, 39.0, 58.0, 97.0, 138.0, 293.0, 508.0, 913.0, 1727.0, 3637.0, 8416.0, 23120.0, 82072.0, 527860.0, 3187616.0, 270410.0, 55532.0, 17730.0, 6959.0, 3220.0, 1599.0, 876.0, 552.0, 281.0, 208.0, 124.0, 54.0, 56.0, 37.0, 23.0, 16.0, 9.0, 9.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-29.6875, -28.8232421875, -27.958984375, -27.0947265625, -26.23046875, -25.3662109375, -24.501953125, -23.6376953125, -22.7734375, -21.9091796875, -21.044921875, -20.1806640625, -19.31640625, -18.4521484375, -17.587890625, -16.7236328125, -15.859375, -14.9951171875, -14.130859375, -13.2666015625, -12.40234375, -11.5380859375, -10.673828125, -9.8095703125, -8.9453125, -8.0810546875, -7.216796875, -6.3525390625, -5.48828125, -4.6240234375, -3.759765625, -2.8955078125, -2.03125, -1.1669921875, -0.302734375, 0.5615234375, 1.42578125, 2.2900390625, 3.154296875, 4.0185546875, 4.8828125, 5.7470703125, 6.611328125, 7.4755859375, 8.33984375, 9.2041015625, 10.068359375, 10.9326171875, 11.796875, 12.6611328125, 13.525390625, 14.3896484375, 15.25390625, 16.1181640625, 16.982421875, 17.8466796875, 18.7109375, 19.5751953125, 20.439453125, 21.3037109375, 22.16796875, 23.0322265625, 23.896484375, 24.7607421875, 25.625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 8.0, 16.0, 18.0, 24.0, 34.0, 42.0, 81.0, 112.0, 186.0, 333.0, 819.0, 1229.0, 444.0, 237.0, 139.0, 95.0, 58.0, 36.0, 42.0, 20.0, 22.0, 14.0, 6.0, 10.0, 5.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.3087158203125, -5.113525390625, -4.9183349609375, -4.72314453125, -4.5279541015625, -4.332763671875, -4.1375732421875, -3.9423828125, -3.7471923828125, -3.552001953125, -3.3568115234375, -3.16162109375, -2.9664306640625, -2.771240234375, -2.5760498046875, -2.380859375, -2.1856689453125, -1.990478515625, -1.7952880859375, -1.60009765625, -1.4049072265625, -1.209716796875, -1.0145263671875, -0.8193359375, -0.6241455078125, -0.428955078125, -0.2337646484375, -0.03857421875, 0.1566162109375, 0.351806640625, 0.5469970703125, 0.7421875, 0.9373779296875, 1.132568359375, 1.3277587890625, 1.52294921875, 1.7181396484375, 1.913330078125, 2.1085205078125, 2.3037109375, 2.4989013671875, 2.694091796875, 2.8892822265625, 3.08447265625, 3.2796630859375, 3.474853515625, 3.6700439453125, 3.865234375, 4.0604248046875, 4.255615234375, 4.4508056640625, 4.64599609375, 4.8411865234375, 5.036376953125, 5.2315673828125, 5.4267578125, 5.6219482421875, 5.817138671875, 6.0123291015625, 6.20751953125, 6.4027099609375, 6.597900390625, 6.7930908203125, 6.98828125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 6.0, 11.0, 21.0, 36.0, 81.0, 119.0, 172.0, 195.0, 148.0, 85.0, 59.0, 23.0, 19.0, 7.0, 10.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.731101989746094, -35.66511535644531, -33.59912872314453, -31.533143997192383, -29.4671573638916, -27.40117073059082, -25.335186004638672, -23.26919937133789, -21.20321273803711, -19.137226104736328, -17.071239471435547, -15.005254745483398, -12.939268112182617, -10.873281478881836, -8.807295799255371, -6.741310119628906, -4.675323486328125, -2.609337329864502, -0.5433511734008789, 1.5226349830627441, 3.588621139526367, 5.654607772827148, 7.720593452453613, 9.786579132080078, 11.85256576538086, 13.91855239868164, 15.984538078308105, 18.05052375793457, 20.11651039123535, 22.182497024536133, 24.24848175048828, 26.314468383789062, 28.380447387695312, 30.446434020996094, 32.512420654296875, 34.578407287597656, 36.64439392089844, 38.71038055419922, 40.776363372802734, 42.842350006103516, 44.9083366394043, 46.97432327270508, 49.04030990600586, 51.10629653930664, 53.172279357910156, 55.23826599121094, 57.30425262451172, 59.3702392578125, 61.43622589111328, 63.50221252441406, 65.56819915771484, 67.63418579101562, 69.7001724243164, 71.76615905761719, 73.83214569091797, 75.89813232421875, 77.964111328125, 80.03009796142578, 82.09608459472656, 84.16207122802734, 86.22805786132812, 88.2940444946289, 90.36003112792969, 92.42601013183594, 94.49200439453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 9.0, 14.0, 19.0, 23.0, 33.0, 29.0, 41.0, 48.0, 57.0, 60.0, 64.0, 81.0, 66.0, 63.0, 51.0, 51.0, 55.0, 45.0, 46.0, 41.0, 28.0, 23.0, 16.0, 11.0, 12.0, 10.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.18926239013672, -40.104164123535156, -39.01906204223633, -37.933963775634766, -36.84886169433594, -35.763763427734375, -34.67866134643555, -33.593563079833984, -32.508460998535156, -31.42336082458496, -30.338260650634766, -29.25316047668457, -28.168060302734375, -27.082962036132812, -25.997861862182617, -24.912761688232422, -23.82766342163086, -22.742563247680664, -21.65746307373047, -20.572362899780273, -19.487262725830078, -18.402164459228516, -17.31706428527832, -16.231964111328125, -15.14686393737793, -14.061763763427734, -12.976663589477539, -11.89156436920166, -10.806464195251465, -9.72136402130127, -8.63626480102539, -7.551164627075195, -6.466068267822266, -5.38096809387207, -4.295868396759033, -3.210768461227417, -2.125668525695801, -1.0405683517456055, 0.04453134536743164, 1.1296310424804688, 2.214731216430664, 3.2998311519622803, 4.3849310874938965, 5.470030784606934, 6.555130958557129, 7.640231132507324, 8.725330352783203, 9.810430526733398, 10.895530700683594, 11.980630874633789, 13.065731048583984, 14.150830268859863, 15.235930442810059, 16.321029663085938, 17.406129837036133, 18.491230010986328, 19.576330184936523, 20.66143035888672, 21.746530532836914, 22.83163070678711, 23.916728973388672, 25.0018310546875, 26.086929321289062, 27.172029495239258, 28.257129669189453]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 9.0, 9.0, 10.0, 14.0, 19.0, 29.0, 33.0, 43.0, 75.0, 108.0, 157.0, 233.0, 364.0, 616.0, 1026.0, 1845.0, 3269.0, 6709.0, 14389.0, 31663.0, 70512.0, 146909.0, 255062.0, 248845.0, 140850.0, 67712.0, 30357.0, 13731.0, 6346.0, 3225.0, 1695.0, 992.0, 578.0, 366.0, 244.0, 154.0, 105.0, 78.0, 52.0, 36.0, 20.0, 19.0, 15.0, 8.0, 7.0, 5.0, 2.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.734375, -12.3360595703125, -11.937744140625, -11.5394287109375, -11.14111328125, -10.7427978515625, -10.344482421875, -9.9461669921875, -9.5478515625, -9.1495361328125, -8.751220703125, -8.3529052734375, -7.95458984375, -7.5562744140625, -7.157958984375, -6.7596435546875, -6.361328125, -5.9630126953125, -5.564697265625, -5.1663818359375, -4.76806640625, -4.3697509765625, -3.971435546875, -3.5731201171875, -3.1748046875, -2.7764892578125, -2.378173828125, -1.9798583984375, -1.58154296875, -1.1832275390625, -0.784912109375, -0.3865966796875, 0.01171875, 0.4100341796875, 0.808349609375, 1.2066650390625, 1.60498046875, 2.0032958984375, 2.401611328125, 2.7999267578125, 3.1982421875, 3.5965576171875, 3.994873046875, 4.3931884765625, 4.79150390625, 5.1898193359375, 5.588134765625, 5.9864501953125, 6.384765625, 6.7830810546875, 7.181396484375, 7.5797119140625, 7.97802734375, 8.3763427734375, 8.774658203125, 9.1729736328125, 9.5712890625, 9.9696044921875, 10.367919921875, 10.7662353515625, 11.16455078125, 11.5628662109375, 11.961181640625, 12.3594970703125, 12.7578125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 6.0, 10.0, 15.0, 14.0, 23.0, 23.0, 35.0, 40.0, 44.0, 54.0, 61.0, 59.0, 52.0, 78.0, 63.0, 50.0, 63.0, 44.0, 50.0, 47.0, 32.0, 30.0, 23.0, 20.0, 15.0, 17.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.051513671875, -2.96630859375, -2.881103515625, -2.7958984375, -2.710693359375, -2.62548828125, -2.540283203125, -2.455078125, -2.369873046875, -2.28466796875, -2.199462890625, -2.1142578125, -2.029052734375, -1.94384765625, -1.858642578125, -1.7734375, -1.688232421875, -1.60302734375, -1.517822265625, -1.4326171875, -1.347412109375, -1.26220703125, -1.177001953125, -1.091796875, -1.006591796875, -0.92138671875, -0.836181640625, -0.7509765625, -0.665771484375, -0.58056640625, -0.495361328125, -0.41015625, -0.324951171875, -0.23974609375, -0.154541015625, -0.0693359375, 0.015869140625, 0.10107421875, 0.186279296875, 0.271484375, 0.356689453125, 0.44189453125, 0.527099609375, 0.6123046875, 0.697509765625, 0.78271484375, 0.867919921875, 0.953125, 1.038330078125, 1.12353515625, 1.208740234375, 1.2939453125, 1.379150390625, 1.46435546875, 1.549560546875, 1.634765625, 1.719970703125, 1.80517578125, 1.890380859375, 1.9755859375, 2.060791015625, 2.14599609375, 2.231201171875, 2.31640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 18.0, 19.0, 42.0, 34.0, 56.0, 80.0, 91.0, 139.0, 171.0, 262.0, 338.0, 545.0, 816.0, 1415.0, 2554.0, 5199.0, 11915.0, 29149.0, 73051.0, 173344.0, 307364.0, 245502.0, 114596.0, 46579.0, 18538.0, 8037.0, 3572.0, 1863.0, 1043.0, 666.0, 434.0, 271.0, 227.0, 143.0, 133.0, 79.0, 65.0, 39.0, 34.0, 28.0, 18.0, 18.0, 11.0, 10.0, 11.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0], "bins": [-13.921875, -13.5093994140625, -13.096923828125, -12.6844482421875, -12.27197265625, -11.8594970703125, -11.447021484375, -11.0345458984375, -10.6220703125, -10.2095947265625, -9.797119140625, -9.3846435546875, -8.97216796875, -8.5596923828125, -8.147216796875, -7.7347412109375, -7.322265625, -6.9097900390625, -6.497314453125, -6.0848388671875, -5.67236328125, -5.2598876953125, -4.847412109375, -4.4349365234375, -4.0224609375, -3.6099853515625, -3.197509765625, -2.7850341796875, -2.37255859375, -1.9600830078125, -1.547607421875, -1.1351318359375, -0.72265625, -0.3101806640625, 0.102294921875, 0.5147705078125, 0.92724609375, 1.3397216796875, 1.752197265625, 2.1646728515625, 2.5771484375, 2.9896240234375, 3.402099609375, 3.8145751953125, 4.22705078125, 4.6395263671875, 5.052001953125, 5.4644775390625, 5.876953125, 6.2894287109375, 6.701904296875, 7.1143798828125, 7.52685546875, 7.9393310546875, 8.351806640625, 8.7642822265625, 9.1767578125, 9.5892333984375, 10.001708984375, 10.4141845703125, 10.82666015625, 11.2391357421875, 11.651611328125, 12.0640869140625, 12.4765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 11.0, 8.0, 6.0, 8.0, 14.0, 13.0, 24.0, 17.0, 19.0, 31.0, 22.0, 23.0, 28.0, 33.0, 42.0, 35.0, 39.0, 35.0, 32.0, 48.0, 35.0, 41.0, 27.0, 50.0, 43.0, 40.0, 40.0, 41.0, 23.0, 34.0, 23.0, 18.0, 14.0, 17.0, 15.0, 10.0, 7.0, 3.0, 2.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.8260498046875, -8.519287109375, -8.2125244140625, -7.90576171875, -7.5989990234375, -7.292236328125, -6.9854736328125, -6.6787109375, -6.3719482421875, -6.065185546875, -5.7584228515625, -5.45166015625, -5.1448974609375, -4.838134765625, -4.5313720703125, -4.224609375, -3.9178466796875, -3.611083984375, -3.3043212890625, -2.99755859375, -2.6907958984375, -2.384033203125, -2.0772705078125, -1.7705078125, -1.4637451171875, -1.156982421875, -0.8502197265625, -0.54345703125, -0.2366943359375, 0.070068359375, 0.3768310546875, 0.68359375, 0.9903564453125, 1.297119140625, 1.6038818359375, 1.91064453125, 2.2174072265625, 2.524169921875, 2.8309326171875, 3.1376953125, 3.4444580078125, 3.751220703125, 4.0579833984375, 4.36474609375, 4.6715087890625, 4.978271484375, 5.2850341796875, 5.591796875, 5.8985595703125, 6.205322265625, 6.5120849609375, 6.81884765625, 7.1256103515625, 7.432373046875, 7.7391357421875, 8.0458984375, 8.3526611328125, 8.659423828125, 8.9661865234375, 9.27294921875, 9.5797119140625, 9.886474609375, 10.1932373046875, 10.5]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 10.0, 5.0, 9.0, 8.0, 20.0, 22.0, 29.0, 46.0, 56.0, 82.0, 127.0, 218.0, 369.0, 738.0, 1640.0, 4698.0, 16792.0, 84487.0, 449611.0, 397034.0, 70501.0, 14664.0, 4172.0, 1614.0, 655.0, 332.0, 211.0, 133.0, 81.0, 53.0, 41.0, 25.0, 23.0, 13.0, 13.0, 6.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.59375, -12.2333984375, -11.873046875, -11.5126953125, -11.15234375, -10.7919921875, -10.431640625, -10.0712890625, -9.7109375, -9.3505859375, -8.990234375, -8.6298828125, -8.26953125, -7.9091796875, -7.548828125, -7.1884765625, -6.828125, -6.4677734375, -6.107421875, -5.7470703125, -5.38671875, -5.0263671875, -4.666015625, -4.3056640625, -3.9453125, -3.5849609375, -3.224609375, -2.8642578125, -2.50390625, -2.1435546875, -1.783203125, -1.4228515625, -1.0625, -0.7021484375, -0.341796875, 0.0185546875, 0.37890625, 0.7392578125, 1.099609375, 1.4599609375, 1.8203125, 2.1806640625, 2.541015625, 2.9013671875, 3.26171875, 3.6220703125, 3.982421875, 4.3427734375, 4.703125, 5.0634765625, 5.423828125, 5.7841796875, 6.14453125, 6.5048828125, 6.865234375, 7.2255859375, 7.5859375, 7.9462890625, 8.306640625, 8.6669921875, 9.02734375, 9.3876953125, 9.748046875, 10.1083984375, 10.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 9.0, 11.0, 12.0, 17.0, 18.0, 38.0, 39.0, 46.0, 60.0, 67.0, 91.0, 90.0, 110.0, 75.0, 58.0, 63.0, 40.0, 33.0, 26.0, 21.0, 17.0, 14.0, 8.0, 6.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012025833129882812, -0.0011607706546783447, -0.0011189579963684082, -0.0010771453380584717, -0.0010353326797485352, -0.0009935200214385986, -0.0009517073631286621, -0.0009098947048187256, -0.0008680820465087891, -0.0008262693881988525, -0.000784456729888916, -0.0007426440715789795, -0.000700831413269043, -0.0006590187549591064, -0.0006172060966491699, -0.0005753934383392334, -0.0005335807800292969, -0.0004917681217193604, -0.00044995546340942383, -0.0004081428050994873, -0.0003663301467895508, -0.00032451748847961426, -0.00028270483016967773, -0.0002408921718597412, -0.0001990795135498047, -0.00015726685523986816, -0.00011545419692993164, -7.364153861999512e-05, -3.1828880310058594e-05, 9.98377799987793e-06, 5.179643630981445e-05, 9.360909461975098e-05, 0.0001354217529296875, 0.00017723441123962402, 0.00021904706954956055, 0.00026085972785949707, 0.0003026723861694336, 0.0003444850444793701, 0.00038629770278930664, 0.00042811036109924316, 0.0004699230194091797, 0.0005117356777191162, 0.0005535483360290527, 0.0005953609943389893, 0.0006371736526489258, 0.0006789863109588623, 0.0007207989692687988, 0.0007626116275787354, 0.0008044242858886719, 0.0008462369441986084, 0.0008880496025085449, 0.0009298622608184814, 0.000971674919128418, 0.0010134875774383545, 0.001055300235748291, 0.0010971128940582275, 0.001138925552368164, 0.0011807382106781006, 0.0012225508689880371, 0.0012643635272979736, 0.0013061761856079102, 0.0013479888439178467, 0.0013898015022277832, 0.0014316141605377197, 0.0014734268188476562]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 3.0, 4.0, 6.0, 8.0, 17.0, 16.0, 23.0, 36.0, 48.0, 75.0, 123.0, 165.0, 320.0, 589.0, 1089.0, 2268.0, 5623.0, 16530.0, 61690.0, 279208.0, 482501.0, 146995.0, 33672.0, 10128.0, 3749.0, 1669.0, 837.0, 449.0, 247.0, 153.0, 97.0, 57.0, 55.0, 34.0, 23.0, 16.0, 8.0, 6.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.0723876953125, -9.769775390625, -9.4671630859375, -9.16455078125, -8.8619384765625, -8.559326171875, -8.2567138671875, -7.9541015625, -7.6514892578125, -7.348876953125, -7.0462646484375, -6.74365234375, -6.4410400390625, -6.138427734375, -5.8358154296875, -5.533203125, -5.2305908203125, -4.927978515625, -4.6253662109375, -4.32275390625, -4.0201416015625, -3.717529296875, -3.4149169921875, -3.1123046875, -2.8096923828125, -2.507080078125, -2.2044677734375, -1.90185546875, -1.5992431640625, -1.296630859375, -0.9940185546875, -0.69140625, -0.3887939453125, -0.086181640625, 0.2164306640625, 0.51904296875, 0.8216552734375, 1.124267578125, 1.4268798828125, 1.7294921875, 2.0321044921875, 2.334716796875, 2.6373291015625, 2.93994140625, 3.2425537109375, 3.545166015625, 3.8477783203125, 4.150390625, 4.4530029296875, 4.755615234375, 5.0582275390625, 5.36083984375, 5.6634521484375, 5.966064453125, 6.2686767578125, 6.5712890625, 6.8739013671875, 7.176513671875, 7.4791259765625, 7.78173828125, 8.0843505859375, 8.386962890625, 8.6895751953125, 8.9921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 5.0, 8.0, 7.0, 5.0, 11.0, 15.0, 22.0, 16.0, 26.0, 39.0, 38.0, 48.0, 73.0, 63.0, 63.0, 64.0, 62.0, 60.0, 78.0, 50.0, 50.0, 40.0, 32.0, 20.0, 18.0, 16.0, 14.0, 10.0, 10.0, 7.0, 9.0, 6.0, 6.0, 0.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7890625, -4.63421630859375, -4.4793701171875, -4.32452392578125, -4.169677734375, -4.01483154296875, -3.8599853515625, -3.70513916015625, -3.55029296875, -3.39544677734375, -3.2406005859375, -3.08575439453125, -2.930908203125, -2.77606201171875, -2.6212158203125, -2.46636962890625, -2.3115234375, -2.15667724609375, -2.0018310546875, -1.84698486328125, -1.692138671875, -1.53729248046875, -1.3824462890625, -1.22760009765625, -1.07275390625, -0.91790771484375, -0.7630615234375, -0.60821533203125, -0.453369140625, -0.29852294921875, -0.1436767578125, 0.01116943359375, 0.166015625, 0.32086181640625, 0.4757080078125, 0.63055419921875, 0.785400390625, 0.94024658203125, 1.0950927734375, 1.24993896484375, 1.40478515625, 1.55963134765625, 1.7144775390625, 1.86932373046875, 2.024169921875, 2.17901611328125, 2.3338623046875, 2.48870849609375, 2.6435546875, 2.79840087890625, 2.9532470703125, 3.10809326171875, 3.262939453125, 3.41778564453125, 3.5726318359375, 3.72747802734375, 3.88232421875, 4.03717041015625, 4.1920166015625, 4.34686279296875, 4.501708984375, 4.65655517578125, 4.8114013671875, 4.96624755859375, 5.12109375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 5.0, 9.0, 25.0, 32.0, 45.0, 67.0, 81.0, 112.0, 145.0, 114.0, 92.0, 97.0, 47.0, 44.0, 26.0, 23.0, 14.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.5039291381836, -123.97856903076172, -120.45320129394531, -116.92784118652344, -113.40248107910156, -109.87712097167969, -106.35176086425781, -102.8263931274414, -99.30103302001953, -95.77567291259766, -92.25030517578125, -88.72494506835938, -85.1995849609375, -81.67422485351562, -78.14886474609375, -74.62349700927734, -71.09813690185547, -67.5727767944336, -64.04740905761719, -60.52204895019531, -56.99668884277344, -53.47132873535156, -49.94596481323242, -46.42060089111328, -42.895240783691406, -39.36988067626953, -35.84451675415039, -32.31915283203125, -28.793792724609375, -25.268430709838867, -21.74306869506836, -18.21770668029785, -14.692344665527344, -11.166982650756836, -7.641620635986328, -4.11625862121582, -0.5908966064453125, 2.9344654083251953, 6.459827423095703, 9.985189437866211, 13.510551452636719, 17.035913467407227, 20.561275482177734, 24.086637496948242, 27.61199951171875, 31.137361526489258, 34.662723541259766, 38.188087463378906, 41.71344757080078, 45.238807678222656, 48.7641716003418, 52.28953552246094, 55.81489562988281, 59.34025573730469, 62.86561965942383, 66.39098358154297, 69.91634368896484, 73.44170379638672, 76.96707153320312, 80.492431640625, 84.01779174804688, 87.54315185546875, 91.06851196289062, 94.59387969970703, 98.1192398071289]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 7.0, 5.0, 5.0, 8.0, 15.0, 9.0, 14.0, 20.0, 19.0, 14.0, 32.0, 26.0, 39.0, 40.0, 36.0, 47.0, 50.0, 46.0, 44.0, 37.0, 51.0, 49.0, 45.0, 41.0, 40.0, 38.0, 37.0, 24.0, 30.0, 26.0, 16.0, 8.0, 13.0, 9.0, 12.0, 5.0, 8.0, 6.0, 7.0, 3.0, 1.0, 3.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-74.10862731933594, -72.0201187133789, -69.93160247802734, -67.84309387207031, -65.75458526611328, -63.666072845458984, -61.57756042480469, -59.489051818847656, -57.40053939819336, -55.31202697753906, -53.22351837158203, -51.135005950927734, -49.04649353027344, -46.957984924316406, -44.86947250366211, -42.78096008300781, -40.69245147705078, -38.603939056396484, -36.51543045043945, -34.426918029785156, -32.338409423828125, -30.249897003173828, -28.16138458251953, -26.072874069213867, -23.984363555908203, -21.89585304260254, -19.807342529296875, -17.718830108642578, -15.630319595336914, -13.54180908203125, -11.45329761505127, -9.364786148071289, -7.276271820068359, -5.187760829925537, -3.099249839782715, -1.0107388496398926, 1.0777721405029297, 3.1662826538085938, 5.254794120788574, 7.343305587768555, 9.431816101074219, 11.520326614379883, 13.608838081359863, 15.697349548339844, 17.785860061645508, 19.874370574951172, 21.96288299560547, 24.051393508911133, 26.139904022216797, 28.22841453552246, 30.316925048828125, 32.40543746948242, 34.49394989013672, 36.58245849609375, 38.67097091674805, 40.759483337402344, 42.847991943359375, 44.93650436401367, 47.0250129699707, 49.113525390625, 51.20203399658203, 53.29054641723633, 55.379058837890625, 57.467567443847656, 59.55607986450195]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 12.0, 14.0, 15.0, 24.0, 29.0, 61.0, 94.0, 137.0, 192.0, 353.0, 721.0, 1340.0, 2843.0, 6856.0, 19921.0, 81763.0, 2975604.0, 1009488.0, 65868.0, 17144.0, 6195.0, 2655.0, 1310.0, 727.0, 364.0, 210.0, 121.0, 66.0, 53.0, 32.0, 19.0, 12.0, 12.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.24951171875, -17.5458984375, -16.84228515625, -16.138671875, -15.43505859375, -14.7314453125, -14.02783203125, -13.32421875, -12.62060546875, -11.9169921875, -11.21337890625, -10.509765625, -9.80615234375, -9.1025390625, -8.39892578125, -7.6953125, -6.99169921875, -6.2880859375, -5.58447265625, -4.880859375, -4.17724609375, -3.4736328125, -2.77001953125, -2.06640625, -1.36279296875, -0.6591796875, 0.04443359375, 0.748046875, 1.45166015625, 2.1552734375, 2.85888671875, 3.5625, 4.26611328125, 4.9697265625, 5.67333984375, 6.376953125, 7.08056640625, 7.7841796875, 8.48779296875, 9.19140625, 9.89501953125, 10.5986328125, 11.30224609375, 12.005859375, 12.70947265625, 13.4130859375, 14.11669921875, 14.8203125, 15.52392578125, 16.2275390625, 16.93115234375, 17.634765625, 18.33837890625, 19.0419921875, 19.74560546875, 20.44921875, 21.15283203125, 21.8564453125, 22.56005859375, 23.263671875, 23.96728515625, 24.6708984375, 25.37451171875, 26.078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 8.0, 15.0, 14.0, 17.0, 27.0, 36.0, 32.0, 38.0, 35.0, 44.0, 50.0, 58.0, 52.0, 49.0, 57.0, 48.0, 52.0, 40.0, 47.0, 33.0, 33.0, 36.0, 22.0, 22.0, 32.0, 20.0, 11.0, 9.0, 18.0, 7.0, 9.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.3984375, -2.326812744140625, -2.25518798828125, -2.183563232421875, -2.1119384765625, -2.040313720703125, -1.96868896484375, -1.897064208984375, -1.825439453125, -1.753814697265625, -1.68218994140625, -1.610565185546875, -1.5389404296875, -1.467315673828125, -1.39569091796875, -1.324066162109375, -1.25244140625, -1.180816650390625, -1.10919189453125, -1.037567138671875, -0.9659423828125, -0.894317626953125, -0.82269287109375, -0.751068115234375, -0.679443359375, -0.607818603515625, -0.53619384765625, -0.464569091796875, -0.3929443359375, -0.321319580078125, -0.24969482421875, -0.178070068359375, -0.1064453125, -0.034820556640625, 0.03680419921875, 0.108428955078125, 0.1800537109375, 0.251678466796875, 0.32330322265625, 0.394927978515625, 0.466552734375, 0.538177490234375, 0.60980224609375, 0.681427001953125, 0.7530517578125, 0.824676513671875, 0.89630126953125, 0.967926025390625, 1.03955078125, 1.111175537109375, 1.18280029296875, 1.254425048828125, 1.3260498046875, 1.397674560546875, 1.46929931640625, 1.540924072265625, 1.612548828125, 1.684173583984375, 1.75579833984375, 1.827423095703125, 1.8990478515625, 1.970672607421875, 2.04229736328125, 2.113922119140625, 2.185546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 13.0, 18.0, 35.0, 45.0, 77.0, 124.0, 211.0, 307.0, 532.0, 920.0, 1913.0, 4306.0, 10687.0, 31239.0, 122346.0, 1564899.0, 2272359.0, 131818.0, 32805.0, 11078.0, 4298.0, 1905.0, 937.0, 524.0, 330.0, 168.0, 119.0, 83.0, 45.0, 36.0, 28.0, 13.0, 12.0, 10.0, 7.0, 8.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.171875, -17.586181640625, -17.00048828125, -16.414794921875, -15.8291015625, -15.243408203125, -14.65771484375, -14.072021484375, -13.486328125, -12.900634765625, -12.31494140625, -11.729248046875, -11.1435546875, -10.557861328125, -9.97216796875, -9.386474609375, -8.80078125, -8.215087890625, -7.62939453125, -7.043701171875, -6.4580078125, -5.872314453125, -5.28662109375, -4.700927734375, -4.115234375, -3.529541015625, -2.94384765625, -2.358154296875, -1.7724609375, -1.186767578125, -0.60107421875, -0.015380859375, 0.5703125, 1.156005859375, 1.74169921875, 2.327392578125, 2.9130859375, 3.498779296875, 4.08447265625, 4.670166015625, 5.255859375, 5.841552734375, 6.42724609375, 7.012939453125, 7.5986328125, 8.184326171875, 8.77001953125, 9.355712890625, 9.94140625, 10.527099609375, 11.11279296875, 11.698486328125, 12.2841796875, 12.869873046875, 13.45556640625, 14.041259765625, 14.626953125, 15.212646484375, 15.79833984375, 16.384033203125, 16.9697265625, 17.555419921875, 18.14111328125, 18.726806640625, 19.3125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 10.0, 9.0, 15.0, 22.0, 36.0, 50.0, 81.0, 126.0, 194.0, 465.0, 1559.0, 783.0, 292.0, 135.0, 100.0, 52.0, 37.0, 26.0, 23.0, 11.0, 9.0, 7.0, 7.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8671875, -4.691650390625, -4.51611328125, -4.340576171875, -4.1650390625, -3.989501953125, -3.81396484375, -3.638427734375, -3.462890625, -3.287353515625, -3.11181640625, -2.936279296875, -2.7607421875, -2.585205078125, -2.40966796875, -2.234130859375, -2.05859375, -1.883056640625, -1.70751953125, -1.531982421875, -1.3564453125, -1.180908203125, -1.00537109375, -0.829833984375, -0.654296875, -0.478759765625, -0.30322265625, -0.127685546875, 0.0478515625, 0.223388671875, 0.39892578125, 0.574462890625, 0.75, 0.925537109375, 1.10107421875, 1.276611328125, 1.4521484375, 1.627685546875, 1.80322265625, 1.978759765625, 2.154296875, 2.329833984375, 2.50537109375, 2.680908203125, 2.8564453125, 3.031982421875, 3.20751953125, 3.383056640625, 3.55859375, 3.734130859375, 3.90966796875, 4.085205078125, 4.2607421875, 4.436279296875, 4.61181640625, 4.787353515625, 4.962890625, 5.138427734375, 5.31396484375, 5.489501953125, 5.6650390625, 5.840576171875, 6.01611328125, 6.191650390625, 6.3671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 12.0, 11.0, 21.0, 26.0, 39.0, 70.0, 99.0, 133.0, 145.0, 127.0, 102.0, 70.0, 57.0, 36.0, 21.0, 11.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.837711334228516, -42.76536178588867, -41.69300842285156, -40.62065887451172, -39.548309326171875, -38.47595977783203, -37.40360641479492, -36.33125686645508, -35.25890350341797, -34.186553955078125, -33.114200592041016, -32.04185104370117, -30.969501495361328, -29.89715003967285, -28.824798583984375, -27.75244903564453, -26.680099487304688, -25.60774803161621, -24.535398483276367, -23.46304702758789, -22.390697479248047, -21.31834602355957, -20.245994567871094, -19.17364501953125, -18.101293563842773, -17.028942108154297, -15.956592559814453, -14.884241104125977, -13.811890602111816, -12.739540100097656, -11.66718864440918, -10.59483814239502, -9.522483825683594, -8.450133323669434, -7.377782344818115, -6.305431365966797, -5.233080863952637, -4.160730361938477, -3.088379383087158, -2.01602840423584, -0.9436779022216797, 0.12867283821105957, 1.2010235786437988, 2.273374319076538, 3.3457250595092773, 4.4180755615234375, 5.490426540374756, 6.562777519226074, 7.635128021240234, 8.707478523254395, 9.779829025268555, 10.852180480957031, 11.924530982971191, 12.996881484985352, 14.069232940673828, 15.141583442687988, 16.21393394470215, 17.286285400390625, 18.35863494873047, 19.430986404418945, 20.503337860107422, 21.575687408447266, 22.648038864135742, 23.72039031982422, 24.792739868164062]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 15.0, 9.0, 12.0, 14.0, 16.0, 27.0, 28.0, 33.0, 48.0, 46.0, 47.0, 58.0, 45.0, 28.0, 51.0, 61.0, 72.0, 48.0, 49.0, 49.0, 45.0, 32.0, 36.0, 27.0, 17.0, 18.0, 16.0, 12.0, 11.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.641159057617188, -19.009654998779297, -18.378150939941406, -17.74664878845215, -17.115144729614258, -16.483640670776367, -15.852137565612793, -15.220634460449219, -14.589130401611328, -13.957626342773438, -13.326123237609863, -12.694620132446289, -12.063116073608398, -11.431612014770508, -10.800108909606934, -10.16860580444336, -9.537101745605469, -8.905597686767578, -8.274094581604004, -7.6425909996032715, -7.011087417602539, -6.379583835601807, -5.748080253601074, -5.116576671600342, -4.485073089599609, -3.853569507598877, -3.2220659255981445, -2.590562343597412, -1.9590587615966797, -1.3275551795959473, -0.6960515975952148, -0.06454801559448242, 0.5669536590576172, 1.1984572410583496, 1.829960823059082, 2.4614644050598145, 3.092967987060547, 3.7244715690612793, 4.355975151062012, 4.987478733062744, 5.618982315063477, 6.250485897064209, 6.881989479064941, 7.513493061065674, 8.144996643066406, 8.776500701904297, 9.408003807067871, 10.039506912231445, 10.671010971069336, 11.302515029907227, 11.9340181350708, 12.565521240234375, 13.197025299072266, 13.828529357910156, 14.46003246307373, 15.091535568237305, 15.723039627075195, 16.354543685913086, 16.986045837402344, 17.617549896240234, 18.249053955078125, 18.880558013916016, 19.512062072753906, 20.143564224243164, 20.775068283081055]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 12.0, 12.0, 17.0, 18.0, 27.0, 41.0, 91.0, 112.0, 176.0, 270.0, 454.0, 796.0, 1475.0, 2824.0, 6439.0, 16585.0, 46385.0, 128303.0, 299141.0, 317150.0, 143912.0, 51859.0, 18350.0, 7260.0, 3153.0, 1549.0, 885.0, 468.0, 252.0, 165.0, 100.0, 61.0, 50.0, 38.0, 29.0, 18.0, 19.0, 9.0, 9.0, 8.0, 11.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-17.015625, -16.543701171875, -16.07177734375, -15.599853515625, -15.1279296875, -14.656005859375, -14.18408203125, -13.712158203125, -13.240234375, -12.768310546875, -12.29638671875, -11.824462890625, -11.3525390625, -10.880615234375, -10.40869140625, -9.936767578125, -9.46484375, -8.992919921875, -8.52099609375, -8.049072265625, -7.5771484375, -7.105224609375, -6.63330078125, -6.161376953125, -5.689453125, -5.217529296875, -4.74560546875, -4.273681640625, -3.8017578125, -3.329833984375, -2.85791015625, -2.385986328125, -1.9140625, -1.442138671875, -0.97021484375, -0.498291015625, -0.0263671875, 0.445556640625, 0.91748046875, 1.389404296875, 1.861328125, 2.333251953125, 2.80517578125, 3.277099609375, 3.7490234375, 4.220947265625, 4.69287109375, 5.164794921875, 5.63671875, 6.108642578125, 6.58056640625, 7.052490234375, 7.5244140625, 7.996337890625, 8.46826171875, 8.940185546875, 9.412109375, 9.884033203125, 10.35595703125, 10.827880859375, 11.2998046875, 11.771728515625, 12.24365234375, 12.715576171875, 13.1875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 6.0, 7.0, 11.0, 13.0, 13.0, 22.0, 36.0, 34.0, 42.0, 46.0, 38.0, 50.0, 48.0, 55.0, 47.0, 58.0, 55.0, 51.0, 45.0, 46.0, 37.0, 33.0, 23.0, 29.0, 24.0, 29.0, 15.0, 19.0, 12.0, 8.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.48046875, -2.4106597900390625, -2.340850830078125, -2.2710418701171875, -2.20123291015625, -2.1314239501953125, -2.061614990234375, -1.9918060302734375, -1.9219970703125, -1.8521881103515625, -1.782379150390625, -1.7125701904296875, -1.64276123046875, -1.5729522705078125, -1.503143310546875, -1.4333343505859375, -1.363525390625, -1.2937164306640625, -1.223907470703125, -1.1540985107421875, -1.08428955078125, -1.0144805908203125, -0.944671630859375, -0.8748626708984375, -0.8050537109375, -0.7352447509765625, -0.665435791015625, -0.5956268310546875, -0.52581787109375, -0.4560089111328125, -0.386199951171875, -0.3163909912109375, -0.24658203125, -0.1767730712890625, -0.106964111328125, -0.0371551513671875, 0.03265380859375, 0.1024627685546875, 0.172271728515625, 0.2420806884765625, 0.3118896484375, 0.3816986083984375, 0.451507568359375, 0.5213165283203125, 0.59112548828125, 0.6609344482421875, 0.730743408203125, 0.8005523681640625, 0.870361328125, 0.9401702880859375, 1.009979248046875, 1.0797882080078125, 1.14959716796875, 1.2194061279296875, 1.289215087890625, 1.3590240478515625, 1.4288330078125, 1.4986419677734375, 1.568450927734375, 1.6382598876953125, 1.70806884765625, 1.7778778076171875, 1.847686767578125, 1.9174957275390625, 1.9873046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 15.0, 15.0, 21.0, 22.0, 32.0, 49.0, 71.0, 126.0, 144.0, 239.0, 338.0, 518.0, 822.0, 1351.0, 2664.0, 6030.0, 15432.0, 44825.0, 133364.0, 313828.0, 317931.0, 136342.0, 46132.0, 15692.0, 6061.0, 2650.0, 1367.0, 815.0, 487.0, 361.0, 248.0, 148.0, 119.0, 92.0, 54.0, 44.0, 35.0, 20.0, 18.0, 7.0, 9.0, 10.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.2401123046875, -10.823974609375, -10.4078369140625, -9.99169921875, -9.5755615234375, -9.159423828125, -8.7432861328125, -8.3271484375, -7.9110107421875, -7.494873046875, -7.0787353515625, -6.66259765625, -6.2464599609375, -5.830322265625, -5.4141845703125, -4.998046875, -4.5819091796875, -4.165771484375, -3.7496337890625, -3.33349609375, -2.9173583984375, -2.501220703125, -2.0850830078125, -1.6689453125, -1.2528076171875, -0.836669921875, -0.4205322265625, -0.00439453125, 0.4117431640625, 0.827880859375, 1.2440185546875, 1.66015625, 2.0762939453125, 2.492431640625, 2.9085693359375, 3.32470703125, 3.7408447265625, 4.156982421875, 4.5731201171875, 4.9892578125, 5.4053955078125, 5.821533203125, 6.2376708984375, 6.65380859375, 7.0699462890625, 7.486083984375, 7.9022216796875, 8.318359375, 8.7344970703125, 9.150634765625, 9.5667724609375, 9.98291015625, 10.3990478515625, 10.815185546875, 11.2313232421875, 11.6474609375, 12.0635986328125, 12.479736328125, 12.8958740234375, 13.31201171875, 13.7281494140625, 14.144287109375, 14.5604248046875, 14.9765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 6.0, 1.0, 9.0, 9.0, 8.0, 7.0, 15.0, 10.0, 11.0, 30.0, 11.0, 32.0, 26.0, 32.0, 35.0, 43.0, 43.0, 33.0, 33.0, 49.0, 45.0, 46.0, 49.0, 52.0, 45.0, 42.0, 36.0, 24.0, 30.0, 20.0, 35.0, 32.0, 21.0, 22.0, 9.0, 12.0, 5.0, 8.0, 13.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8828125, -8.5869140625, -8.291015625, -7.9951171875, -7.69921875, -7.4033203125, -7.107421875, -6.8115234375, -6.515625, -6.2197265625, -5.923828125, -5.6279296875, -5.33203125, -5.0361328125, -4.740234375, -4.4443359375, -4.1484375, -3.8525390625, -3.556640625, -3.2607421875, -2.96484375, -2.6689453125, -2.373046875, -2.0771484375, -1.78125, -1.4853515625, -1.189453125, -0.8935546875, -0.59765625, -0.3017578125, -0.005859375, 0.2900390625, 0.5859375, 0.8818359375, 1.177734375, 1.4736328125, 1.76953125, 2.0654296875, 2.361328125, 2.6572265625, 2.953125, 3.2490234375, 3.544921875, 3.8408203125, 4.13671875, 4.4326171875, 4.728515625, 5.0244140625, 5.3203125, 5.6162109375, 5.912109375, 6.2080078125, 6.50390625, 6.7998046875, 7.095703125, 7.3916015625, 7.6875, 7.9833984375, 8.279296875, 8.5751953125, 8.87109375, 9.1669921875, 9.462890625, 9.7587890625, 10.0546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 10.0, 6.0, 9.0, 15.0, 15.0, 29.0, 45.0, 76.0, 141.0, 249.0, 565.0, 1604.0, 5643.0, 50968.0, 845903.0, 130874.0, 8835.0, 2111.0, 734.0, 322.0, 162.0, 73.0, 46.0, 38.0, 18.0, 18.0, 9.0, 5.0, 6.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-23.90625, -23.27099609375, -22.6357421875, -22.00048828125, -21.365234375, -20.72998046875, -20.0947265625, -19.45947265625, -18.82421875, -18.18896484375, -17.5537109375, -16.91845703125, -16.283203125, -15.64794921875, -15.0126953125, -14.37744140625, -13.7421875, -13.10693359375, -12.4716796875, -11.83642578125, -11.201171875, -10.56591796875, -9.9306640625, -9.29541015625, -8.66015625, -8.02490234375, -7.3896484375, -6.75439453125, -6.119140625, -5.48388671875, -4.8486328125, -4.21337890625, -3.578125, -2.94287109375, -2.3076171875, -1.67236328125, -1.037109375, -0.40185546875, 0.2333984375, 0.86865234375, 1.50390625, 2.13916015625, 2.7744140625, 3.40966796875, 4.044921875, 4.68017578125, 5.3154296875, 5.95068359375, 6.5859375, 7.22119140625, 7.8564453125, 8.49169921875, 9.126953125, 9.76220703125, 10.3974609375, 11.03271484375, 11.66796875, 12.30322265625, 12.9384765625, 13.57373046875, 14.208984375, 14.84423828125, 15.4794921875, 16.11474609375, 16.75]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 3.0, 12.0, 7.0, 14.0, 11.0, 24.0, 27.0, 35.0, 46.0, 65.0, 79.0, 102.0, 103.0, 95.0, 91.0, 53.0, 37.0, 38.0, 31.0, 23.0, 26.0, 11.0, 7.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013828277587890625, -0.001345023512840271, -0.0013072192668914795, -0.001269415020942688, -0.0012316107749938965, -0.001193806529045105, -0.0011560022830963135, -0.001118198037147522, -0.0010803937911987305, -0.001042589545249939, -0.0010047852993011475, -0.000966981053352356, -0.0009291768074035645, -0.000891372561454773, -0.0008535683155059814, -0.0008157640695571899, -0.0007779598236083984, -0.0007401555776596069, -0.0007023513317108154, -0.0006645470857620239, -0.0006267428398132324, -0.0005889385938644409, -0.0005511343479156494, -0.0005133301019668579, -0.0004755258560180664, -0.0004377216100692749, -0.0003999173641204834, -0.0003621131181716919, -0.0003243088722229004, -0.0002865046262741089, -0.0002487003803253174, -0.00021089613437652588, -0.00017309188842773438, -0.00013528764247894287, -9.748339653015137e-05, -5.967915058135986e-05, -2.187490463256836e-05, 1.5929341316223145e-05, 5.373358726501465e-05, 9.153783321380615e-05, 0.00012934207916259766, 0.00016714632511138916, 0.00020495057106018066, 0.00024275481700897217, 0.00028055906295776367, 0.0003183633089065552, 0.0003561675548553467, 0.0003939718008041382, 0.0004317760467529297, 0.0004695802927017212, 0.0005073845386505127, 0.0005451887845993042, 0.0005829930305480957, 0.0006207972764968872, 0.0006586015224456787, 0.0006964057683944702, 0.0007342100143432617, 0.0007720142602920532, 0.0008098185062408447, 0.0008476227521896362, 0.0008854269981384277, 0.0009232312440872192, 0.0009610354900360107, 0.0009988397359848022, 0.0010366439819335938]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 5.0, 2.0, 10.0, 14.0, 21.0, 23.0, 33.0, 51.0, 108.0, 167.0, 292.0, 717.0, 1912.0, 6492.0, 58248.0, 931631.0, 40134.0, 5591.0, 1798.0, 650.0, 276.0, 157.0, 73.0, 61.0, 26.0, 23.0, 19.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.875, -21.97607421875, -21.0771484375, -20.17822265625, -19.279296875, -18.38037109375, -17.4814453125, -16.58251953125, -15.68359375, -14.78466796875, -13.8857421875, -12.98681640625, -12.087890625, -11.18896484375, -10.2900390625, -9.39111328125, -8.4921875, -7.59326171875, -6.6943359375, -5.79541015625, -4.896484375, -3.99755859375, -3.0986328125, -2.19970703125, -1.30078125, -0.40185546875, 0.4970703125, 1.39599609375, 2.294921875, 3.19384765625, 4.0927734375, 4.99169921875, 5.890625, 6.78955078125, 7.6884765625, 8.58740234375, 9.486328125, 10.38525390625, 11.2841796875, 12.18310546875, 13.08203125, 13.98095703125, 14.8798828125, 15.77880859375, 16.677734375, 17.57666015625, 18.4755859375, 19.37451171875, 20.2734375, 21.17236328125, 22.0712890625, 22.97021484375, 23.869140625, 24.76806640625, 25.6669921875, 26.56591796875, 27.46484375, 28.36376953125, 29.2626953125, 30.16162109375, 31.060546875, 31.95947265625, 32.8583984375, 33.75732421875, 34.65625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 2.0, 2.0, 6.0, 7.0, 15.0, 25.0, 68.0, 159.0, 282.0, 241.0, 95.0, 46.0, 20.0, 8.0, 4.0, 7.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.5291748046875, -10.972412109375, -10.4156494140625, -9.85888671875, -9.3021240234375, -8.745361328125, -8.1885986328125, -7.6318359375, -7.0750732421875, -6.518310546875, -5.9615478515625, -5.40478515625, -4.8480224609375, -4.291259765625, -3.7344970703125, -3.177734375, -2.6209716796875, -2.064208984375, -1.5074462890625, -0.95068359375, -0.3939208984375, 0.162841796875, 0.7196044921875, 1.2763671875, 1.8331298828125, 2.389892578125, 2.9466552734375, 3.50341796875, 4.0601806640625, 4.616943359375, 5.1737060546875, 5.73046875, 6.2872314453125, 6.843994140625, 7.4007568359375, 7.95751953125, 8.5142822265625, 9.071044921875, 9.6278076171875, 10.1845703125, 10.7413330078125, 11.298095703125, 11.8548583984375, 12.41162109375, 12.9683837890625, 13.525146484375, 14.0819091796875, 14.638671875, 15.1954345703125, 15.752197265625, 16.3089599609375, 16.86572265625, 17.4224853515625, 17.979248046875, 18.5360107421875, 19.0927734375, 19.6495361328125, 20.206298828125, 20.7630615234375, 21.31982421875, 21.8765869140625, 22.433349609375, 22.9901123046875, 23.546875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 12.0, 10.0, 27.0, 64.0, 106.0, 207.0, 225.0, 163.0, 107.0, 43.0, 19.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-129.01022338867188, -123.25325775146484, -117.49628448486328, -111.73931884765625, -105.98235321044922, -100.22538757324219, -94.46841430664062, -88.7114486694336, -82.95448303222656, -77.19751739501953, -71.44054412841797, -65.68357849121094, -59.926612854003906, -54.16964340209961, -48.41267395019531, -42.65570831298828, -36.89873504638672, -31.141767501831055, -25.38479995727539, -19.627830505371094, -13.87086296081543, -8.113895416259766, -2.3569259643554688, 3.4000396728515625, 9.15700912475586, 14.913976669311523, 20.670944213867188, 26.427913665771484, 32.18488311767578, 37.94184875488281, 43.69881820678711, 49.45578384399414, 55.21275329589844, 60.969722747802734, 66.72669219970703, 72.48365783691406, 78.2406234741211, 83.99758911132812, 89.75456237792969, 95.51152801513672, 101.26849365234375, 107.02545928955078, 112.78243255615234, 118.53939819335938, 124.2963638305664, 130.05332946777344, 135.810302734375, 141.5672607421875, 147.32424926757812, 153.0812225341797, 158.8381805419922, 164.59515380859375, 170.3521270751953, 176.1090850830078, 181.86605834960938, 187.62301635742188, 193.37998962402344, 199.136962890625, 204.8939208984375, 210.65089416503906, 216.40786743164062, 222.16482543945312, 227.9217987060547, 233.67877197265625, 239.43572998046875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 5.0, 3.0, 1.0, 6.0, 8.0, 10.0, 13.0, 13.0, 21.0, 16.0, 21.0, 29.0, 34.0, 31.0, 32.0, 55.0, 58.0, 51.0, 62.0, 72.0, 57.0, 48.0, 53.0, 47.0, 44.0, 28.0, 39.0, 20.0, 29.0, 27.0, 23.0, 12.0, 11.0, 7.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-75.6527099609375, -73.4660873413086, -71.27947235107422, -69.09284973144531, -66.90623474121094, -64.71961212158203, -62.53299331665039, -60.34637451171875, -58.15975570678711, -55.97313690185547, -53.78651809692383, -51.59989929199219, -49.41327667236328, -47.226661682128906, -45.0400390625, -42.85342025756836, -40.66680145263672, -38.48018264770508, -36.29356384277344, -34.1069450378418, -31.920324325561523, -29.733705520629883, -27.54708480834961, -25.36046600341797, -23.173847198486328, -20.987228393554688, -18.800609588623047, -16.613988876342773, -14.427370071411133, -12.240751266479492, -10.054131507873535, -7.867511749267578, -5.680885314941406, -3.4942660331726074, -1.3076467514038086, 0.8789725303649902, 3.065591812133789, 5.25221061706543, 7.438830375671387, 9.625450134277344, 11.812068939208984, 13.998687744140625, 16.185306549072266, 18.37192726135254, 20.55854606628418, 22.74516487121582, 24.931785583496094, 27.118404388427734, 29.305023193359375, 31.491641998291016, 33.678260803222656, 35.8648796081543, 38.05149841308594, 40.238121032714844, 42.424739837646484, 44.611358642578125, 46.797977447509766, 48.984596252441406, 51.17121505737305, 53.35783386230469, 55.544456481933594, 57.73107147216797, 59.917694091796875, 62.104312896728516, 64.29093170166016]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 6.0, 2.0, 3.0, 8.0, 6.0, 16.0, 13.0, 23.0, 25.0, 34.0, 36.0, 64.0, 69.0, 96.0, 123.0, 162.0, 254.0, 380.0, 599.0, 945.0, 1548.0, 2520.0, 4681.0, 9193.0, 19874.0, 50802.0, 174799.0, 2464975.0, 1238593.0, 143552.0, 44114.0, 17748.0, 8300.0, 4327.0, 2385.0, 1351.0, 850.0, 570.0, 376.0, 265.0, 163.0, 132.0, 83.0, 51.0, 38.0, 28.0, 23.0, 19.0, 22.0, 13.0, 10.0, 2.0, 5.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.6796875, -13.2374267578125, -12.795166015625, -12.3529052734375, -11.91064453125, -11.4683837890625, -11.026123046875, -10.5838623046875, -10.1416015625, -9.6993408203125, -9.257080078125, -8.8148193359375, -8.37255859375, -7.9302978515625, -7.488037109375, -7.0457763671875, -6.603515625, -6.1612548828125, -5.718994140625, -5.2767333984375, -4.83447265625, -4.3922119140625, -3.949951171875, -3.5076904296875, -3.0654296875, -2.6231689453125, -2.180908203125, -1.7386474609375, -1.29638671875, -0.8541259765625, -0.411865234375, 0.0303955078125, 0.47265625, 0.9149169921875, 1.357177734375, 1.7994384765625, 2.24169921875, 2.6839599609375, 3.126220703125, 3.5684814453125, 4.0107421875, 4.4530029296875, 4.895263671875, 5.3375244140625, 5.77978515625, 6.2220458984375, 6.664306640625, 7.1065673828125, 7.548828125, 7.9910888671875, 8.433349609375, 8.8756103515625, 9.31787109375, 9.7601318359375, 10.202392578125, 10.6446533203125, 11.0869140625, 11.5291748046875, 11.971435546875, 12.4136962890625, 12.85595703125, 13.2982177734375, 13.740478515625, 14.1827392578125, 14.625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 9.0, 12.0, 14.0, 17.0, 24.0, 27.0, 23.0, 43.0, 48.0, 45.0, 57.0, 45.0, 54.0, 54.0, 68.0, 51.0, 48.0, 56.0, 46.0, 33.0, 34.0, 30.0, 24.0, 31.0, 16.0, 17.0, 14.0, 20.0, 11.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.267578125, -2.193145751953125, -2.11871337890625, -2.044281005859375, -1.9698486328125, -1.895416259765625, -1.82098388671875, -1.746551513671875, -1.672119140625, -1.597686767578125, -1.52325439453125, -1.448822021484375, -1.3743896484375, -1.299957275390625, -1.22552490234375, -1.151092529296875, -1.07666015625, -1.002227783203125, -0.92779541015625, -0.853363037109375, -0.7789306640625, -0.704498291015625, -0.63006591796875, -0.555633544921875, -0.481201171875, -0.406768798828125, -0.33233642578125, -0.257904052734375, -0.1834716796875, -0.109039306640625, -0.03460693359375, 0.039825439453125, 0.1142578125, 0.188690185546875, 0.26312255859375, 0.337554931640625, 0.4119873046875, 0.486419677734375, 0.56085205078125, 0.635284423828125, 0.709716796875, 0.784149169921875, 0.85858154296875, 0.933013916015625, 1.0074462890625, 1.081878662109375, 1.15631103515625, 1.230743408203125, 1.30517578125, 1.379608154296875, 1.45404052734375, 1.528472900390625, 1.6029052734375, 1.677337646484375, 1.75177001953125, 1.826202392578125, 1.900634765625, 1.975067138671875, 2.04949951171875, 2.123931884765625, 2.1983642578125, 2.272796630859375, 2.34722900390625, 2.421661376953125, 2.49609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 9.0, 11.0, 17.0, 19.0, 35.0, 59.0, 105.0, 179.0, 312.0, 483.0, 889.0, 1681.0, 3446.0, 9158.0, 38310.0, 402666.0, 3509349.0, 189940.0, 25025.0, 6821.0, 2722.0, 1371.0, 688.0, 395.0, 241.0, 130.0, 58.0, 54.0, 29.0, 23.0, 17.0, 10.0, 6.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.125, -21.316650390625, -20.50830078125, -19.699951171875, -18.8916015625, -18.083251953125, -17.27490234375, -16.466552734375, -15.658203125, -14.849853515625, -14.04150390625, -13.233154296875, -12.4248046875, -11.616455078125, -10.80810546875, -9.999755859375, -9.19140625, -8.383056640625, -7.57470703125, -6.766357421875, -5.9580078125, -5.149658203125, -4.34130859375, -3.532958984375, -2.724609375, -1.916259765625, -1.10791015625, -0.299560546875, 0.5087890625, 1.317138671875, 2.12548828125, 2.933837890625, 3.7421875, 4.550537109375, 5.35888671875, 6.167236328125, 6.9755859375, 7.783935546875, 8.59228515625, 9.400634765625, 10.208984375, 11.017333984375, 11.82568359375, 12.634033203125, 13.4423828125, 14.250732421875, 15.05908203125, 15.867431640625, 16.67578125, 17.484130859375, 18.29248046875, 19.100830078125, 19.9091796875, 20.717529296875, 21.52587890625, 22.334228515625, 23.142578125, 23.950927734375, 24.75927734375, 25.567626953125, 26.3759765625, 27.184326171875, 27.99267578125, 28.801025390625, 29.609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 3.0, 6.0, 13.0, 17.0, 26.0, 39.0, 96.0, 138.0, 253.0, 602.0, 1461.0, 727.0, 296.0, 168.0, 85.0, 46.0, 27.0, 18.0, 13.0, 11.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0859375, -9.81036376953125, -9.5347900390625, -9.25921630859375, -8.983642578125, -8.70806884765625, -8.4324951171875, -8.15692138671875, -7.88134765625, -7.60577392578125, -7.3302001953125, -7.05462646484375, -6.779052734375, -6.50347900390625, -6.2279052734375, -5.95233154296875, -5.6767578125, -5.40118408203125, -5.1256103515625, -4.85003662109375, -4.574462890625, -4.29888916015625, -4.0233154296875, -3.74774169921875, -3.47216796875, -3.19659423828125, -2.9210205078125, -2.64544677734375, -2.369873046875, -2.09429931640625, -1.8187255859375, -1.54315185546875, -1.267578125, -0.99200439453125, -0.7164306640625, -0.44085693359375, -0.165283203125, 0.11029052734375, 0.3858642578125, 0.66143798828125, 0.93701171875, 1.21258544921875, 1.4881591796875, 1.76373291015625, 2.039306640625, 2.31488037109375, 2.5904541015625, 2.86602783203125, 3.1416015625, 3.41717529296875, 3.6927490234375, 3.96832275390625, 4.243896484375, 4.51947021484375, 4.7950439453125, 5.07061767578125, 5.34619140625, 5.62176513671875, 5.8973388671875, 6.17291259765625, 6.448486328125, 6.72406005859375, 6.9996337890625, 7.27520751953125, 7.55078125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 12.0, 6.0, 15.0, 25.0, 43.0, 56.0, 91.0, 103.0, 126.0, 113.0, 111.0, 91.0, 61.0, 45.0, 37.0, 21.0, 9.0, 14.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.82662582397461, -45.31364440917969, -43.8006591796875, -42.28767776489258, -40.774696350097656, -39.26171112060547, -37.74872970581055, -36.235748291015625, -34.72276306152344, -33.209781646728516, -31.696796417236328, -30.183815002441406, -28.67083168029785, -27.157848358154297, -25.644866943359375, -24.13188362121582, -22.618900299072266, -21.10591697692871, -19.592933654785156, -18.079952239990234, -16.56696891784668, -15.053985595703125, -13.541003227233887, -12.028020858764648, -10.515037536621094, -9.002054214477539, -7.489071846008301, -5.976089000701904, -4.463106155395508, -2.9501233100891113, -1.4371404647827148, 0.07584190368652344, 1.5888252258300781, 3.1018080711364746, 4.614790916442871, 6.127773761749268, 7.640756607055664, 9.153739929199219, 10.666722297668457, 12.179704666137695, 13.69268798828125, 15.205671310424805, 16.71865463256836, 18.23163604736328, 19.744619369506836, 21.25760269165039, 22.770584106445312, 24.283567428588867, 25.796550750732422, 27.309534072875977, 28.82251739501953, 30.335498809814453, 31.848482131958008, 33.36146545410156, 34.874446868896484, 36.387428283691406, 37.900413513183594, 39.413394927978516, 40.9263801574707, 42.439361572265625, 43.95234680175781, 45.465328216552734, 46.978309631347656, 48.491294860839844, 50.004276275634766]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 11.0, 12.0, 14.0, 24.0, 23.0, 30.0, 42.0, 40.0, 50.0, 61.0, 77.0, 65.0, 74.0, 75.0, 64.0, 64.0, 59.0, 47.0, 44.0, 36.0, 34.0, 20.0, 13.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-46.41676330566406, -45.2458381652832, -44.07490921020508, -42.90398406982422, -41.733055114746094, -40.562129974365234, -39.391204833984375, -38.22027587890625, -37.04935073852539, -35.87842559814453, -34.707496643066406, -33.53657150268555, -32.36564254760742, -31.194717407226562, -30.02379035949707, -28.852863311767578, -27.681936264038086, -26.511009216308594, -25.3400821685791, -24.16915512084961, -22.99822998046875, -21.827302932739258, -20.656375885009766, -19.485450744628906, -18.31452178955078, -17.14359474182129, -15.972668647766113, -14.801741600036621, -13.630815505981445, -12.459888458251953, -11.288961410522461, -10.118035316467285, -8.94710922241211, -7.776182651519775, -6.605256080627441, -5.434329032897949, -4.263402462005615, -3.0924758911132812, -1.921548843383789, -0.7506227493286133, 0.4203042984008789, 1.5912309885025024, 2.762157678604126, 3.933084487915039, 5.104011058807373, 6.274937629699707, 7.445864677429199, 8.616790771484375, 9.787717819213867, 10.95864486694336, 12.129570960998535, 13.300498008728027, 14.471424102783203, 15.642351150512695, 16.813278198242188, 17.984203338623047, 19.155132293701172, 20.326059341430664, 21.496986389160156, 22.667911529541016, 23.838838577270508, 25.009765625, 26.180692672729492, 27.351619720458984, 28.522544860839844]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 4.0, 13.0, 19.0, 21.0, 39.0, 55.0, 105.0, 185.0, 309.0, 570.0, 1132.0, 2835.0, 10280.0, 56091.0, 346075.0, 514976.0, 93185.0, 15775.0, 3951.0, 1370.0, 705.0, 339.0, 211.0, 130.0, 67.0, 49.0, 21.0, 17.0, 13.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53125, -28.6123046875, -27.693359375, -26.7744140625, -25.85546875, -24.9365234375, -24.017578125, -23.0986328125, -22.1796875, -21.2607421875, -20.341796875, -19.4228515625, -18.50390625, -17.5849609375, -16.666015625, -15.7470703125, -14.828125, -13.9091796875, -12.990234375, -12.0712890625, -11.15234375, -10.2333984375, -9.314453125, -8.3955078125, -7.4765625, -6.5576171875, -5.638671875, -4.7197265625, -3.80078125, -2.8818359375, -1.962890625, -1.0439453125, -0.125, 0.7939453125, 1.712890625, 2.6318359375, 3.55078125, 4.4697265625, 5.388671875, 6.3076171875, 7.2265625, 8.1455078125, 9.064453125, 9.9833984375, 10.90234375, 11.8212890625, 12.740234375, 13.6591796875, 14.578125, 15.4970703125, 16.416015625, 17.3349609375, 18.25390625, 19.1728515625, 20.091796875, 21.0107421875, 21.9296875, 22.8486328125, 23.767578125, 24.6865234375, 25.60546875, 26.5244140625, 27.443359375, 28.3623046875, 29.28125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 20.0, 18.0, 31.0, 47.0, 58.0, 68.0, 74.0, 57.0, 79.0, 83.0, 72.0, 63.0, 60.0, 50.0, 42.0, 46.0, 33.0, 25.0, 13.0, 14.0, 9.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-4.1875, -4.083953857421875, -3.98040771484375, -3.876861572265625, -3.7733154296875, -3.669769287109375, -3.56622314453125, -3.462677001953125, -3.359130859375, -3.255584716796875, -3.15203857421875, -3.048492431640625, -2.9449462890625, -2.841400146484375, -2.73785400390625, -2.634307861328125, -2.53076171875, -2.427215576171875, -2.32366943359375, -2.220123291015625, -2.1165771484375, -2.013031005859375, -1.90948486328125, -1.805938720703125, -1.702392578125, -1.598846435546875, -1.49530029296875, -1.391754150390625, -1.2882080078125, -1.184661865234375, -1.08111572265625, -0.977569580078125, -0.8740234375, -0.770477294921875, -0.66693115234375, -0.563385009765625, -0.4598388671875, -0.356292724609375, -0.25274658203125, -0.149200439453125, -0.045654296875, 0.057891845703125, 0.16143798828125, 0.264984130859375, 0.3685302734375, 0.472076416015625, 0.57562255859375, 0.679168701171875, 0.78271484375, 0.886260986328125, 0.98980712890625, 1.093353271484375, 1.1968994140625, 1.300445556640625, 1.40399169921875, 1.507537841796875, 1.611083984375, 1.714630126953125, 1.81817626953125, 1.921722412109375, 2.0252685546875, 2.128814697265625, 2.23236083984375, 2.335906982421875, 2.439453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 10.0, 13.0, 22.0, 23.0, 48.0, 61.0, 103.0, 176.0, 261.0, 379.0, 572.0, 951.0, 1858.0, 3812.0, 9061.0, 23771.0, 62824.0, 158437.0, 336690.0, 266393.0, 110795.0, 43055.0, 16291.0, 6466.0, 2885.0, 1433.0, 769.0, 542.0, 269.0, 197.0, 123.0, 83.0, 65.0, 41.0, 24.0, 22.0, 11.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3359375, -9.9891357421875, -9.642333984375, -9.2955322265625, -8.94873046875, -8.6019287109375, -8.255126953125, -7.9083251953125, -7.5615234375, -7.2147216796875, -6.867919921875, -6.5211181640625, -6.17431640625, -5.8275146484375, -5.480712890625, -5.1339111328125, -4.787109375, -4.4403076171875, -4.093505859375, -3.7467041015625, -3.39990234375, -3.0531005859375, -2.706298828125, -2.3594970703125, -2.0126953125, -1.6658935546875, -1.319091796875, -0.9722900390625, -0.62548828125, -0.2786865234375, 0.068115234375, 0.4149169921875, 0.76171875, 1.1085205078125, 1.455322265625, 1.8021240234375, 2.14892578125, 2.4957275390625, 2.842529296875, 3.1893310546875, 3.5361328125, 3.8829345703125, 4.229736328125, 4.5765380859375, 4.92333984375, 5.2701416015625, 5.616943359375, 5.9637451171875, 6.310546875, 6.6573486328125, 7.004150390625, 7.3509521484375, 7.69775390625, 8.0445556640625, 8.391357421875, 8.7381591796875, 9.0849609375, 9.4317626953125, 9.778564453125, 10.1253662109375, 10.47216796875, 10.8189697265625, 11.165771484375, 11.5125732421875, 11.859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 7.0, 7.0, 9.0, 13.0, 16.0, 19.0, 19.0, 27.0, 27.0, 36.0, 31.0, 35.0, 54.0, 42.0, 43.0, 41.0, 31.0, 43.0, 54.0, 52.0, 40.0, 57.0, 45.0, 37.0, 24.0, 22.0, 31.0, 30.0, 21.0, 15.0, 10.0, 7.0, 8.0, 10.0, 10.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.9368896484375, -9.655029296875, -9.3731689453125, -9.09130859375, -8.8094482421875, -8.527587890625, -8.2457275390625, -7.9638671875, -7.6820068359375, -7.400146484375, -7.1182861328125, -6.83642578125, -6.5545654296875, -6.272705078125, -5.9908447265625, -5.708984375, -5.4271240234375, -5.145263671875, -4.8634033203125, -4.58154296875, -4.2996826171875, -4.017822265625, -3.7359619140625, -3.4541015625, -3.1722412109375, -2.890380859375, -2.6085205078125, -2.32666015625, -2.0447998046875, -1.762939453125, -1.4810791015625, -1.19921875, -0.9173583984375, -0.635498046875, -0.3536376953125, -0.07177734375, 0.2100830078125, 0.491943359375, 0.7738037109375, 1.0556640625, 1.3375244140625, 1.619384765625, 1.9012451171875, 2.18310546875, 2.4649658203125, 2.746826171875, 3.0286865234375, 3.310546875, 3.5924072265625, 3.874267578125, 4.1561279296875, 4.43798828125, 4.7198486328125, 5.001708984375, 5.2835693359375, 5.5654296875, 5.8472900390625, 6.129150390625, 6.4110107421875, 6.69287109375, 6.9747314453125, 7.256591796875, 7.5384521484375, 7.8203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 4.0, 4.0, 6.0, 12.0, 13.0, 19.0, 21.0, 33.0, 48.0, 77.0, 117.0, 176.0, 338.0, 598.0, 1081.0, 2142.0, 4616.0, 11911.0, 37946.0, 159020.0, 460728.0, 273803.0, 65277.0, 18114.0, 6507.0, 2757.0, 1373.0, 701.0, 403.0, 223.0, 154.0, 97.0, 56.0, 52.0, 29.0, 26.0, 17.0, 12.0, 8.0, 13.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.1484375, -7.9066162109375, -7.664794921875, -7.4229736328125, -7.18115234375, -6.9393310546875, -6.697509765625, -6.4556884765625, -6.2138671875, -5.9720458984375, -5.730224609375, -5.4884033203125, -5.24658203125, -5.0047607421875, -4.762939453125, -4.5211181640625, -4.279296875, -4.0374755859375, -3.795654296875, -3.5538330078125, -3.31201171875, -3.0701904296875, -2.828369140625, -2.5865478515625, -2.3447265625, -2.1029052734375, -1.861083984375, -1.6192626953125, -1.37744140625, -1.1356201171875, -0.893798828125, -0.6519775390625, -0.41015625, -0.1683349609375, 0.073486328125, 0.3153076171875, 0.55712890625, 0.7989501953125, 1.040771484375, 1.2825927734375, 1.5244140625, 1.7662353515625, 2.008056640625, 2.2498779296875, 2.49169921875, 2.7335205078125, 2.975341796875, 3.2171630859375, 3.458984375, 3.7008056640625, 3.942626953125, 4.1844482421875, 4.42626953125, 4.6680908203125, 4.909912109375, 5.1517333984375, 5.3935546875, 5.6353759765625, 5.877197265625, 6.1190185546875, 6.36083984375, 6.6026611328125, 6.844482421875, 7.0863037109375, 7.328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 1.0, 6.0, 12.0, 10.0, 12.0, 7.0, 15.0, 21.0, 24.0, 34.0, 41.0, 55.0, 76.0, 87.0, 106.0, 107.0, 77.0, 54.0, 56.0, 45.0, 20.0, 26.0, 15.0, 21.0, 9.0, 9.0, 14.0, 10.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0009660720825195312, -0.0009374544024467468, -0.0009088367223739624, -0.000880219042301178, -0.0008516013622283936, -0.0008229836821556091, -0.0007943660020828247, -0.0007657483220100403, -0.0007371306419372559, -0.0007085129618644714, -0.000679895281791687, -0.0006512776017189026, -0.0006226599216461182, -0.0005940422415733337, -0.0005654245615005493, -0.0005368068814277649, -0.0005081892013549805, -0.00047957152128219604, -0.0004509538412094116, -0.0004223361611366272, -0.0003937184810638428, -0.00036510080099105835, -0.0003364831209182739, -0.0003078654408454895, -0.0002792477607727051, -0.00025063008069992065, -0.00022201240062713623, -0.0001933947205543518, -0.00016477704048156738, -0.00013615936040878296, -0.00010754168033599854, -7.892400026321411e-05, -5.030632019042969e-05, -2.1688640117645264e-05, 6.92903995513916e-06, 3.5546720027923584e-05, 6.416440010070801e-05, 9.278208017349243e-05, 0.00012139976024627686, 0.00015001744031906128, 0.0001786351203918457, 0.00020725280046463013, 0.00023587048053741455, 0.000264488160610199, 0.0002931058406829834, 0.0003217235207557678, 0.00035034120082855225, 0.00037895888090133667, 0.0004075765609741211, 0.0004361942410469055, 0.00046481192111968994, 0.0004934296011924744, 0.0005220472812652588, 0.0005506649613380432, 0.0005792826414108276, 0.0006079003214836121, 0.0006365180015563965, 0.0006651356816291809, 0.0006937533617019653, 0.0007223710417747498, 0.0007509887218475342, 0.0007796064019203186, 0.000808224081993103, 0.0008368417620658875, 0.0008654594421386719]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 7.0, 11.0, 10.0, 15.0, 28.0, 39.0, 43.0, 80.0, 130.0, 227.0, 457.0, 814.0, 1694.0, 4008.0, 12047.0, 53305.0, 359675.0, 505001.0, 84697.0, 16630.0, 5285.0, 2179.0, 974.0, 524.0, 255.0, 138.0, 76.0, 63.0, 49.0, 33.0, 23.0, 18.0, 4.0, 9.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.6328125, -11.310791015625, -10.98876953125, -10.666748046875, -10.3447265625, -10.022705078125, -9.70068359375, -9.378662109375, -9.056640625, -8.734619140625, -8.41259765625, -8.090576171875, -7.7685546875, -7.446533203125, -7.12451171875, -6.802490234375, -6.48046875, -6.158447265625, -5.83642578125, -5.514404296875, -5.1923828125, -4.870361328125, -4.54833984375, -4.226318359375, -3.904296875, -3.582275390625, -3.26025390625, -2.938232421875, -2.6162109375, -2.294189453125, -1.97216796875, -1.650146484375, -1.328125, -1.006103515625, -0.68408203125, -0.362060546875, -0.0400390625, 0.281982421875, 0.60400390625, 0.926025390625, 1.248046875, 1.570068359375, 1.89208984375, 2.214111328125, 2.5361328125, 2.858154296875, 3.18017578125, 3.502197265625, 3.82421875, 4.146240234375, 4.46826171875, 4.790283203125, 5.1123046875, 5.434326171875, 5.75634765625, 6.078369140625, 6.400390625, 6.722412109375, 7.04443359375, 7.366455078125, 7.6884765625, 8.010498046875, 8.33251953125, 8.654541015625, 8.9765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 7.0, 8.0, 10.0, 18.0, 30.0, 56.0, 94.0, 130.0, 142.0, 129.0, 128.0, 81.0, 62.0, 41.0, 27.0, 11.0, 5.0, 5.0, 1.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.28125, -10.999755859375, -10.71826171875, -10.436767578125, -10.1552734375, -9.873779296875, -9.59228515625, -9.310791015625, -9.029296875, -8.747802734375, -8.46630859375, -8.184814453125, -7.9033203125, -7.621826171875, -7.34033203125, -7.058837890625, -6.77734375, -6.495849609375, -6.21435546875, -5.932861328125, -5.6513671875, -5.369873046875, -5.08837890625, -4.806884765625, -4.525390625, -4.243896484375, -3.96240234375, -3.680908203125, -3.3994140625, -3.117919921875, -2.83642578125, -2.554931640625, -2.2734375, -1.991943359375, -1.71044921875, -1.428955078125, -1.1474609375, -0.865966796875, -0.58447265625, -0.302978515625, -0.021484375, 0.260009765625, 0.54150390625, 0.822998046875, 1.1044921875, 1.385986328125, 1.66748046875, 1.948974609375, 2.23046875, 2.511962890625, 2.79345703125, 3.074951171875, 3.3564453125, 3.637939453125, 3.91943359375, 4.200927734375, 4.482421875, 4.763916015625, 5.04541015625, 5.326904296875, 5.6083984375, 5.889892578125, 6.17138671875, 6.452880859375, 6.734375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 1.0, 3.0, 10.0, 20.0, 26.0, 39.0, 61.0, 78.0, 102.0, 144.0, 123.0, 110.0, 101.0, 67.0, 35.0, 29.0, 18.0, 11.0, 10.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.7868881225586, -77.857421875, -74.9279556274414, -71.99848175048828, -69.06901550292969, -66.1395492553711, -63.2100830078125, -60.28061294555664, -57.35114288330078, -54.42167663574219, -51.49220657348633, -48.562740325927734, -45.633270263671875, -42.70380401611328, -39.77433776855469, -36.84486770629883, -33.915401458740234, -30.985933303833008, -28.05646514892578, -25.126998901367188, -22.197528839111328, -19.268062591552734, -16.338594436645508, -13.409126281738281, -10.479658126831055, -7.550189971923828, -4.62072229385376, -1.6912546157836914, 1.2382135391235352, 4.167681694030762, 7.097148895263672, 10.026617050170898, 12.956085205078125, 15.885553359985352, 18.815021514892578, 21.744487762451172, 24.67395782470703, 27.603424072265625, 30.53289222717285, 33.46236038208008, 36.39183044433594, 39.32129669189453, 42.25076675415039, 45.180233001708984, 48.109703063964844, 51.03916931152344, 53.96863555908203, 56.89810562133789, 59.827571868896484, 62.75703811645508, 65.68650817871094, 68.61597442626953, 71.54544067382812, 74.47491455078125, 77.40438079833984, 80.33384704589844, 83.26331329345703, 86.19277954101562, 89.12224578857422, 92.05171966552734, 94.98118591308594, 97.91065216064453, 100.84011840820312, 103.76959228515625, 106.69905853271484]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 9.0, 14.0, 12.0, 21.0, 19.0, 37.0, 39.0, 23.0, 32.0, 51.0, 48.0, 35.0, 51.0, 46.0, 45.0, 70.0, 56.0, 48.0, 45.0, 25.0, 36.0, 31.0, 35.0, 28.0, 23.0, 13.0, 23.0, 8.0, 11.0, 13.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-62.6007080078125, -60.938514709472656, -59.27631759643555, -57.61412048339844, -55.951927185058594, -54.28973388671875, -52.62753677368164, -50.96533966064453, -49.30314636230469, -47.640953063964844, -45.978755950927734, -44.316558837890625, -42.65436553955078, -40.99217224121094, -39.32997512817383, -37.66777801513672, -36.005584716796875, -34.34339141845703, -32.68119430541992, -31.018999099731445, -29.35680389404297, -27.694608688354492, -26.032413482666016, -24.37021827697754, -22.708023071289062, -21.045827865600586, -19.38363265991211, -17.721437454223633, -16.059242248535156, -14.39704704284668, -12.734851837158203, -11.072656631469727, -9.41046142578125, -7.748266220092773, -6.086071014404297, -4.42387580871582, -2.7616806030273438, -1.0994853973388672, 0.5627098083496094, 2.224905014038086, 3.8871002197265625, 5.549295425415039, 7.211490631103516, 8.873685836791992, 10.535881042480469, 12.198076248168945, 13.860271453857422, 15.522466659545898, 17.184661865234375, 18.84685707092285, 20.509052276611328, 22.171247482299805, 23.83344268798828, 25.495637893676758, 27.157833099365234, 28.82002830505371, 30.482223510742188, 32.14441680908203, 33.80661392211914, 35.46881103515625, 37.131004333496094, 38.79319763183594, 40.45539474487305, 42.117591857910156, 43.77978515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 9.0, 4.0, 11.0, 5.0, 12.0, 26.0, 11.0, 27.0, 52.0, 67.0, 81.0, 133.0, 194.0, 315.0, 563.0, 1144.0, 2426.0, 6155.0, 21184.0, 142978.0, 3818468.0, 166207.0, 22676.0, 6497.0, 2519.0, 1120.0, 561.0, 311.0, 145.0, 135.0, 68.0, 47.0, 36.0, 13.0, 11.0, 16.0, 14.0, 11.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.9375, -23.1533203125, -22.369140625, -21.5849609375, -20.80078125, -20.0166015625, -19.232421875, -18.4482421875, -17.6640625, -16.8798828125, -16.095703125, -15.3115234375, -14.52734375, -13.7431640625, -12.958984375, -12.1748046875, -11.390625, -10.6064453125, -9.822265625, -9.0380859375, -8.25390625, -7.4697265625, -6.685546875, -5.9013671875, -5.1171875, -4.3330078125, -3.548828125, -2.7646484375, -1.98046875, -1.1962890625, -0.412109375, 0.3720703125, 1.15625, 1.9404296875, 2.724609375, 3.5087890625, 4.29296875, 5.0771484375, 5.861328125, 6.6455078125, 7.4296875, 8.2138671875, 8.998046875, 9.7822265625, 10.56640625, 11.3505859375, 12.134765625, 12.9189453125, 13.703125, 14.4873046875, 15.271484375, 16.0556640625, 16.83984375, 17.6240234375, 18.408203125, 19.1923828125, 19.9765625, 20.7607421875, 21.544921875, 22.3291015625, 23.11328125, 23.8974609375, 24.681640625, 25.4658203125, 26.25]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 13.0, 14.0, 9.0, 25.0, 30.0, 59.0, 62.0, 72.0, 78.0, 70.0, 84.0, 85.0, 75.0, 73.0, 49.0, 49.0, 40.0, 36.0, 18.0, 19.0, 14.0, 8.0, 6.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.1563720703125, -4.043212890625, -3.9300537109375, -3.81689453125, -3.7037353515625, -3.590576171875, -3.4774169921875, -3.3642578125, -3.2510986328125, -3.137939453125, -3.0247802734375, -2.91162109375, -2.7984619140625, -2.685302734375, -2.5721435546875, -2.458984375, -2.3458251953125, -2.232666015625, -2.1195068359375, -2.00634765625, -1.8931884765625, -1.780029296875, -1.6668701171875, -1.5537109375, -1.4405517578125, -1.327392578125, -1.2142333984375, -1.10107421875, -0.9879150390625, -0.874755859375, -0.7615966796875, -0.6484375, -0.5352783203125, -0.422119140625, -0.3089599609375, -0.19580078125, -0.0826416015625, 0.030517578125, 0.1436767578125, 0.2568359375, 0.3699951171875, 0.483154296875, 0.5963134765625, 0.70947265625, 0.8226318359375, 0.935791015625, 1.0489501953125, 1.162109375, 1.2752685546875, 1.388427734375, 1.5015869140625, 1.61474609375, 1.7279052734375, 1.841064453125, 1.9542236328125, 2.0673828125, 2.1805419921875, 2.293701171875, 2.4068603515625, 2.52001953125, 2.6331787109375, 2.746337890625, 2.8594970703125, 2.97265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 6.0, 9.0, 15.0, 16.0, 20.0, 23.0, 28.0, 26.0, 45.0, 56.0, 86.0, 157.0, 388.0, 1004.0, 3430.0, 14201.0, 98551.0, 3437615.0, 586633.0, 40405.0, 7800.0, 2104.0, 788.0, 381.0, 159.0, 112.0, 53.0, 44.0, 29.0, 22.0, 15.0, 8.0, 10.0, 8.0, 9.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.660888671875, -23.93115234375, -23.201416015625, -22.4716796875, -21.741943359375, -21.01220703125, -20.282470703125, -19.552734375, -18.822998046875, -18.09326171875, -17.363525390625, -16.6337890625, -15.904052734375, -15.17431640625, -14.444580078125, -13.71484375, -12.985107421875, -12.25537109375, -11.525634765625, -10.7958984375, -10.066162109375, -9.33642578125, -8.606689453125, -7.876953125, -7.147216796875, -6.41748046875, -5.687744140625, -4.9580078125, -4.228271484375, -3.49853515625, -2.768798828125, -2.0390625, -1.309326171875, -0.57958984375, 0.150146484375, 0.8798828125, 1.609619140625, 2.33935546875, 3.069091796875, 3.798828125, 4.528564453125, 5.25830078125, 5.988037109375, 6.7177734375, 7.447509765625, 8.17724609375, 8.906982421875, 9.63671875, 10.366455078125, 11.09619140625, 11.825927734375, 12.5556640625, 13.285400390625, 14.01513671875, 14.744873046875, 15.474609375, 16.204345703125, 16.93408203125, 17.663818359375, 18.3935546875, 19.123291015625, 19.85302734375, 20.582763671875, 21.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 13.0, 29.0, 47.0, 82.0, 179.0, 587.0, 2112.0, 642.0, 207.0, 78.0, 45.0, 16.0, 13.0, 11.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.90625, -12.60986328125, -12.3134765625, -12.01708984375, -11.720703125, -11.42431640625, -11.1279296875, -10.83154296875, -10.53515625, -10.23876953125, -9.9423828125, -9.64599609375, -9.349609375, -9.05322265625, -8.7568359375, -8.46044921875, -8.1640625, -7.86767578125, -7.5712890625, -7.27490234375, -6.978515625, -6.68212890625, -6.3857421875, -6.08935546875, -5.79296875, -5.49658203125, -5.2001953125, -4.90380859375, -4.607421875, -4.31103515625, -4.0146484375, -3.71826171875, -3.421875, -3.12548828125, -2.8291015625, -2.53271484375, -2.236328125, -1.93994140625, -1.6435546875, -1.34716796875, -1.05078125, -0.75439453125, -0.4580078125, -0.16162109375, 0.134765625, 0.43115234375, 0.7275390625, 1.02392578125, 1.3203125, 1.61669921875, 1.9130859375, 2.20947265625, 2.505859375, 2.80224609375, 3.0986328125, 3.39501953125, 3.69140625, 3.98779296875, 4.2841796875, 4.58056640625, 4.876953125, 5.17333984375, 5.4697265625, 5.76611328125, 6.0625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 15.0, 12.0, 20.0, 54.0, 85.0, 125.0, 134.0, 149.0, 144.0, 93.0, 79.0, 30.0, 26.0, 17.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.16429138183594, -47.81736755371094, -46.47044372558594, -45.12351989746094, -43.77659606933594, -42.42967224121094, -41.08274841308594, -39.73582458496094, -38.38890075683594, -37.04197692871094, -35.69505310058594, -34.34812927246094, -33.00120544433594, -31.654281616210938, -30.307357788085938, -28.960433959960938, -27.613508224487305, -26.266584396362305, -24.919660568237305, -23.572736740112305, -22.225812911987305, -20.878889083862305, -19.531963348388672, -18.185039520263672, -16.838115692138672, -15.491191864013672, -14.144268035888672, -12.797344207763672, -11.450420379638672, -10.103496551513672, -8.756571769714355, -7.4096479415893555, -6.062725067138672, -4.715801239013672, -3.3688771724700928, -2.0219531059265137, -0.6750292778015137, 0.6718945503234863, 2.0188188552856445, 3.3657426834106445, 4.7126665115356445, 6.0595903396606445, 7.4065141677856445, 8.753438949584961, 10.100362777709961, 11.447286605834961, 12.794210433959961, 14.141134262084961, 15.488058090209961, 16.83498191833496, 18.18190574645996, 19.52882957458496, 20.87575340270996, 22.22267723083496, 23.569602966308594, 24.916526794433594, 26.263450622558594, 27.610374450683594, 28.957298278808594, 30.304222106933594, 31.651145935058594, 32.998069763183594, 34.344993591308594, 35.691917419433594, 37.038841247558594]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 12.0, 16.0, 18.0, 26.0, 29.0, 45.0, 37.0, 45.0, 43.0, 53.0, 60.0, 64.0, 68.0, 54.0, 63.0, 56.0, 49.0, 27.0, 46.0, 43.0, 29.0, 25.0, 19.0, 18.0, 8.0, 6.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.060779571533203, -17.35297203063965, -16.645164489746094, -15.937358856201172, -15.229551315307617, -14.521743774414062, -13.813937187194824, -13.106130599975586, -12.398323059082031, -11.690515518188477, -10.982708930969238, -10.27490234375, -9.567094802856445, -8.85928726196289, -8.151480674743652, -7.443673610687256, -6.735866546630859, -6.028059482574463, -5.320252418518066, -4.61244535446167, -3.9046382904052734, -3.196831226348877, -2.4890241622924805, -1.781217098236084, -1.0734100341796875, -0.365602970123291, 0.34220409393310547, 1.050011157989502, 1.7578182220458984, 2.465625286102295, 3.1734323501586914, 3.881239414215088, 4.589046478271484, 5.296853542327881, 6.004660606384277, 6.712467670440674, 7.42027473449707, 8.128082275390625, 8.835888862609863, 9.543695449829102, 10.251502990722656, 10.959310531616211, 11.66711711883545, 12.374923706054688, 13.082731246948242, 13.790538787841797, 14.498345375061035, 15.206151962280273, 15.913959503173828, 16.621767044067383, 17.329574584960938, 18.03738021850586, 18.745187759399414, 19.45299530029297, 20.16080093383789, 20.868608474731445, 21.576416015625, 22.284223556518555, 22.99203109741211, 23.69983673095703, 24.407644271850586, 25.11545181274414, 25.823257446289062, 26.531064987182617, 27.238872528076172]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 2.0, 13.0, 14.0, 17.0, 25.0, 37.0, 52.0, 89.0, 129.0, 252.0, 460.0, 919.0, 1963.0, 5473.0, 20059.0, 104402.0, 507515.0, 329703.0, 58200.0, 12350.0, 3778.0, 1434.0, 690.0, 381.0, 210.0, 146.0, 86.0, 46.0, 33.0, 13.0, 19.0, 8.0, 12.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.875, -25.97412109375, -25.0732421875, -24.17236328125, -23.271484375, -22.37060546875, -21.4697265625, -20.56884765625, -19.66796875, -18.76708984375, -17.8662109375, -16.96533203125, -16.064453125, -15.16357421875, -14.2626953125, -13.36181640625, -12.4609375, -11.56005859375, -10.6591796875, -9.75830078125, -8.857421875, -7.95654296875, -7.0556640625, -6.15478515625, -5.25390625, -4.35302734375, -3.4521484375, -2.55126953125, -1.650390625, -0.74951171875, 0.1513671875, 1.05224609375, 1.953125, 2.85400390625, 3.7548828125, 4.65576171875, 5.556640625, 6.45751953125, 7.3583984375, 8.25927734375, 9.16015625, 10.06103515625, 10.9619140625, 11.86279296875, 12.763671875, 13.66455078125, 14.5654296875, 15.46630859375, 16.3671875, 17.26806640625, 18.1689453125, 19.06982421875, 19.970703125, 20.87158203125, 21.7724609375, 22.67333984375, 23.57421875, 24.47509765625, 25.3759765625, 26.27685546875, 27.177734375, 28.07861328125, 28.9794921875, 29.88037109375, 30.78125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 7.0, 21.0, 16.0, 35.0, 44.0, 49.0, 57.0, 78.0, 69.0, 81.0, 75.0, 77.0, 70.0, 58.0, 48.0, 50.0, 42.0, 36.0, 24.0, 13.0, 16.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.056610107421875, -3.94525146484375, -3.833892822265625, -3.7225341796875, -3.611175537109375, -3.49981689453125, -3.388458251953125, -3.277099609375, -3.165740966796875, -3.05438232421875, -2.943023681640625, -2.8316650390625, -2.720306396484375, -2.60894775390625, -2.497589111328125, -2.38623046875, -2.274871826171875, -2.16351318359375, -2.052154541015625, -1.9407958984375, -1.829437255859375, -1.71807861328125, -1.606719970703125, -1.495361328125, -1.384002685546875, -1.27264404296875, -1.161285400390625, -1.0499267578125, -0.938568115234375, -0.82720947265625, -0.715850830078125, -0.6044921875, -0.493133544921875, -0.38177490234375, -0.270416259765625, -0.1590576171875, -0.047698974609375, 0.06365966796875, 0.175018310546875, 0.286376953125, 0.397735595703125, 0.50909423828125, 0.620452880859375, 0.7318115234375, 0.843170166015625, 0.95452880859375, 1.065887451171875, 1.17724609375, 1.288604736328125, 1.39996337890625, 1.511322021484375, 1.6226806640625, 1.734039306640625, 1.84539794921875, 1.956756591796875, 2.068115234375, 2.179473876953125, 2.29083251953125, 2.402191162109375, 2.5135498046875, 2.624908447265625, 2.73626708984375, 2.847625732421875, 2.958984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 14.0, 20.0, 15.0, 51.0, 65.0, 75.0, 128.0, 190.0, 344.0, 522.0, 963.0, 2188.0, 6292.0, 25450.0, 120642.0, 464069.0, 330088.0, 73438.0, 15902.0, 4409.0, 1681.0, 785.0, 458.0, 237.0, 173.0, 123.0, 70.0, 45.0, 37.0, 17.0, 13.0, 18.0, 9.0, 4.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.546875, -18.98583984375, -18.4248046875, -17.86376953125, -17.302734375, -16.74169921875, -16.1806640625, -15.61962890625, -15.05859375, -14.49755859375, -13.9365234375, -13.37548828125, -12.814453125, -12.25341796875, -11.6923828125, -11.13134765625, -10.5703125, -10.00927734375, -9.4482421875, -8.88720703125, -8.326171875, -7.76513671875, -7.2041015625, -6.64306640625, -6.08203125, -5.52099609375, -4.9599609375, -4.39892578125, -3.837890625, -3.27685546875, -2.7158203125, -2.15478515625, -1.59375, -1.03271484375, -0.4716796875, 0.08935546875, 0.650390625, 1.21142578125, 1.7724609375, 2.33349609375, 2.89453125, 3.45556640625, 4.0166015625, 4.57763671875, 5.138671875, 5.69970703125, 6.2607421875, 6.82177734375, 7.3828125, 7.94384765625, 8.5048828125, 9.06591796875, 9.626953125, 10.18798828125, 10.7490234375, 11.31005859375, 11.87109375, 12.43212890625, 12.9931640625, 13.55419921875, 14.115234375, 14.67626953125, 15.2373046875, 15.79833984375, 16.359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 9.0, 2.0, 4.0, 5.0, 10.0, 11.0, 21.0, 15.0, 27.0, 25.0, 30.0, 40.0, 41.0, 31.0, 31.0, 43.0, 31.0, 56.0, 37.0, 45.0, 35.0, 41.0, 39.0, 50.0, 45.0, 30.0, 36.0, 39.0, 17.0, 24.0, 27.0, 22.0, 9.0, 18.0, 9.0, 9.0, 7.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.4140625, -9.14239501953125, -8.8707275390625, -8.59906005859375, -8.327392578125, -8.05572509765625, -7.7840576171875, -7.51239013671875, -7.24072265625, -6.96905517578125, -6.6973876953125, -6.42572021484375, -6.154052734375, -5.88238525390625, -5.6107177734375, -5.33905029296875, -5.0673828125, -4.79571533203125, -4.5240478515625, -4.25238037109375, -3.980712890625, -3.70904541015625, -3.4373779296875, -3.16571044921875, -2.89404296875, -2.62237548828125, -2.3507080078125, -2.07904052734375, -1.807373046875, -1.53570556640625, -1.2640380859375, -0.99237060546875, -0.720703125, -0.44903564453125, -0.1773681640625, 0.09429931640625, 0.365966796875, 0.63763427734375, 0.9093017578125, 1.18096923828125, 1.45263671875, 1.72430419921875, 1.9959716796875, 2.26763916015625, 2.539306640625, 2.81097412109375, 3.0826416015625, 3.35430908203125, 3.6259765625, 3.89764404296875, 4.1693115234375, 4.44097900390625, 4.712646484375, 4.98431396484375, 5.2559814453125, 5.52764892578125, 5.79931640625, 6.07098388671875, 6.3426513671875, 6.61431884765625, 6.885986328125, 7.15765380859375, 7.4293212890625, 7.70098876953125, 7.97265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 8.0, 5.0, 4.0, 11.0, 24.0, 27.0, 41.0, 81.0, 98.0, 164.0, 296.0, 471.0, 845.0, 1619.0, 3532.0, 10066.0, 38545.0, 224298.0, 589595.0, 138786.0, 26312.0, 7592.0, 2906.0, 1427.0, 731.0, 408.0, 248.0, 147.0, 90.0, 59.0, 41.0, 22.0, 16.0, 13.0, 9.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-11.6953125, -11.373779296875, -11.05224609375, -10.730712890625, -10.4091796875, -10.087646484375, -9.76611328125, -9.444580078125, -9.123046875, -8.801513671875, -8.47998046875, -8.158447265625, -7.8369140625, -7.515380859375, -7.19384765625, -6.872314453125, -6.55078125, -6.229248046875, -5.90771484375, -5.586181640625, -5.2646484375, -4.943115234375, -4.62158203125, -4.300048828125, -3.978515625, -3.656982421875, -3.33544921875, -3.013916015625, -2.6923828125, -2.370849609375, -2.04931640625, -1.727783203125, -1.40625, -1.084716796875, -0.76318359375, -0.441650390625, -0.1201171875, 0.201416015625, 0.52294921875, 0.844482421875, 1.166015625, 1.487548828125, 1.80908203125, 2.130615234375, 2.4521484375, 2.773681640625, 3.09521484375, 3.416748046875, 3.73828125, 4.059814453125, 4.38134765625, 4.702880859375, 5.0244140625, 5.345947265625, 5.66748046875, 5.989013671875, 6.310546875, 6.632080078125, 6.95361328125, 7.275146484375, 7.5966796875, 7.918212890625, 8.23974609375, 8.561279296875, 8.8828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 6.0, 7.0, 20.0, 21.0, 33.0, 43.0, 64.0, 60.0, 93.0, 127.0, 142.0, 117.0, 70.0, 62.0, 35.0, 19.0, 28.0, 13.0, 10.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001220703125, -0.0011721402406692505, -0.001123577356338501, -0.0010750144720077515, -0.001026451587677002, -0.0009778887033462524, -0.0009293258190155029, -0.0008807629346847534, -0.0008322000503540039, -0.0007836371660232544, -0.0007350742816925049, -0.0006865113973617554, -0.0006379485130310059, -0.0005893856287002563, -0.0005408227443695068, -0.0004922598600387573, -0.0004436969757080078, -0.0003951340913772583, -0.0003465712070465088, -0.0002980083227157593, -0.00024944543838500977, -0.00020088255405426025, -0.00015231966972351074, -0.00010375678539276123, -5.519390106201172e-05, -6.631016731262207e-06, 4.1931867599487305e-05, 9.049475193023682e-05, 0.00013905763626098633, 0.00018762052059173584, 0.00023618340492248535, 0.00028474628925323486, 0.0003333091735839844, 0.0003818720579147339, 0.0004304349422454834, 0.0004789978265762329, 0.0005275607109069824, 0.0005761235952377319, 0.0006246864795684814, 0.000673249363899231, 0.0007218122482299805, 0.00077037513256073, 0.0008189380168914795, 0.000867500901222229, 0.0009160637855529785, 0.000964626669883728, 0.0010131895542144775, 0.001061752438545227, 0.0011103153228759766, 0.001158878207206726, 0.0012074410915374756, 0.001256003975868225, 0.0013045668601989746, 0.0013531297445297241, 0.0014016926288604736, 0.0014502555131912231, 0.0014988183975219727, 0.0015473812818527222, 0.0015959441661834717, 0.0016445070505142212, 0.0016930699348449707, 0.0017416328191757202, 0.0017901957035064697, 0.0018387585878372192, 0.0018873214721679688]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 6.0, 3.0, 11.0, 13.0, 14.0, 22.0, 45.0, 86.0, 160.0, 288.0, 511.0, 1076.0, 3058.0, 12962.0, 133436.0, 794380.0, 87717.0, 10112.0, 2634.0, 949.0, 503.0, 250.0, 117.0, 75.0, 35.0, 31.0, 14.0, 12.0, 7.0, 3.0, 7.0, 4.0, 7.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.25, -17.73486328125, -17.2197265625, -16.70458984375, -16.189453125, -15.67431640625, -15.1591796875, -14.64404296875, -14.12890625, -13.61376953125, -13.0986328125, -12.58349609375, -12.068359375, -11.55322265625, -11.0380859375, -10.52294921875, -10.0078125, -9.49267578125, -8.9775390625, -8.46240234375, -7.947265625, -7.43212890625, -6.9169921875, -6.40185546875, -5.88671875, -5.37158203125, -4.8564453125, -4.34130859375, -3.826171875, -3.31103515625, -2.7958984375, -2.28076171875, -1.765625, -1.25048828125, -0.7353515625, -0.22021484375, 0.294921875, 0.81005859375, 1.3251953125, 1.84033203125, 2.35546875, 2.87060546875, 3.3857421875, 3.90087890625, 4.416015625, 4.93115234375, 5.4462890625, 5.96142578125, 6.4765625, 6.99169921875, 7.5068359375, 8.02197265625, 8.537109375, 9.05224609375, 9.5673828125, 10.08251953125, 10.59765625, 11.11279296875, 11.6279296875, 12.14306640625, 12.658203125, 13.17333984375, 13.6884765625, 14.20361328125, 14.71875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 13.0, 8.0, 19.0, 35.0, 52.0, 117.0, 140.0, 167.0, 154.0, 98.0, 61.0, 48.0, 22.0, 22.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.1953125, -11.8780517578125, -11.560791015625, -11.2435302734375, -10.92626953125, -10.6090087890625, -10.291748046875, -9.9744873046875, -9.6572265625, -9.3399658203125, -9.022705078125, -8.7054443359375, -8.38818359375, -8.0709228515625, -7.753662109375, -7.4364013671875, -7.119140625, -6.8018798828125, -6.484619140625, -6.1673583984375, -5.85009765625, -5.5328369140625, -5.215576171875, -4.8983154296875, -4.5810546875, -4.2637939453125, -3.946533203125, -3.6292724609375, -3.31201171875, -2.9947509765625, -2.677490234375, -2.3602294921875, -2.04296875, -1.7257080078125, -1.408447265625, -1.0911865234375, -0.77392578125, -0.4566650390625, -0.139404296875, 0.1778564453125, 0.4951171875, 0.8123779296875, 1.129638671875, 1.4468994140625, 1.76416015625, 2.0814208984375, 2.398681640625, 2.7159423828125, 3.033203125, 3.3504638671875, 3.667724609375, 3.9849853515625, 4.30224609375, 4.6195068359375, 4.936767578125, 5.2540283203125, 5.5712890625, 5.8885498046875, 6.205810546875, 6.5230712890625, 6.84033203125, 7.1575927734375, 7.474853515625, 7.7921142578125, 8.109375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 13.0, 23.0, 22.0, 64.0, 88.0, 115.0, 125.0, 169.0, 141.0, 86.0, 71.0, 37.0, 20.0, 11.0, 9.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.7540283203125, -65.89045715332031, -62.026885986328125, -58.16331100463867, -54.299739837646484, -50.4361686706543, -46.572593688964844, -42.709022521972656, -38.84545135498047, -34.98188018798828, -31.11830711364746, -27.25473403930664, -23.391162872314453, -19.527591705322266, -15.664018630981445, -11.800445556640625, -7.9368743896484375, -4.073302268981934, -0.2097301483154297, 3.653841972351074, 7.517414093017578, 11.380985260009766, 15.244558334350586, 19.108131408691406, 22.971702575683594, 26.83527374267578, 30.6988468170166, 34.56241989135742, 38.42599105834961, 42.2895622253418, 46.15313720703125, 50.01670837402344, 53.880279541015625, 57.74385070800781, 61.607421875, 65.47099304199219, 69.33456420898438, 73.19813537597656, 77.06171417236328, 80.92528533935547, 84.78885650634766, 88.65242767333984, 92.51599884033203, 96.37957000732422, 100.24314880371094, 104.10671997070312, 107.97029113769531, 111.8338623046875, 115.69743347167969, 119.56100463867188, 123.42457580566406, 127.28814697265625, 131.15171813964844, 135.01528930664062, 138.8788604736328, 142.742431640625, 146.60601806640625, 150.46958923339844, 154.33316040039062, 158.1967315673828, 162.060302734375, 165.9238739013672, 169.78744506835938, 173.65103149414062, 177.51458740234375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 11.0, 14.0, 15.0, 14.0, 12.0, 11.0, 15.0, 26.0, 22.0, 28.0, 34.0, 28.0, 33.0, 47.0, 51.0, 37.0, 49.0, 49.0, 42.0, 38.0, 47.0, 51.0, 43.0, 35.0, 42.0, 38.0, 29.0, 25.0, 28.0, 18.0, 15.0, 12.0, 8.0, 7.0, 8.0, 7.0, 2.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.45842742919922, -43.83392333984375, -42.20941925048828, -40.58491134643555, -38.96040725708008, -37.33590316772461, -35.71139907836914, -34.086891174316406, -32.46238708496094, -30.83788299560547, -29.213376998901367, -27.5888729095459, -25.964366912841797, -24.339862823486328, -22.71535873413086, -21.090852737426758, -19.46634864807129, -17.84184455871582, -16.21733856201172, -14.59283447265625, -12.968328475952148, -11.34382438659668, -9.719319343566895, -8.09481430053711, -6.470309257507324, -4.845804214477539, -3.221299409866333, -1.596794605255127, 0.027710437774658203, 1.6522150039672852, 3.2767200469970703, 4.9012250900268555, 6.525730133056641, 8.150235176086426, 9.774740219116211, 11.39924430847168, 13.023750305175781, 14.64825439453125, 16.27275848388672, 17.89726448059082, 19.521770477294922, 21.14627456665039, 22.770780563354492, 24.39528465270996, 26.019790649414062, 27.64429473876953, 29.268798828125, 30.8933048248291, 32.51780700683594, 34.142311096191406, 35.766815185546875, 37.39132308959961, 39.01582717895508, 40.64033126831055, 42.264835357666016, 43.88934326171875, 45.51384735107422, 47.13835144042969, 48.762855529785156, 50.38736343383789, 52.01186752319336, 53.63637161254883, 55.2608757019043, 56.88538360595703, 58.5098876953125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 8.0, 10.0, 9.0, 20.0, 24.0, 33.0, 44.0, 62.0, 115.0, 141.0, 235.0, 374.0, 685.0, 1445.0, 3420.0, 11170.0, 52950.0, 1643128.0, 2406025.0, 56311.0, 11596.0, 3595.0, 1346.0, 694.0, 332.0, 190.0, 112.0, 61.0, 57.0, 26.0, 21.0, 13.0, 8.0, 9.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.640625, -25.722412109375, -24.80419921875, -23.885986328125, -22.9677734375, -22.049560546875, -21.13134765625, -20.213134765625, -19.294921875, -18.376708984375, -17.45849609375, -16.540283203125, -15.6220703125, -14.703857421875, -13.78564453125, -12.867431640625, -11.94921875, -11.031005859375, -10.11279296875, -9.194580078125, -8.2763671875, -7.358154296875, -6.43994140625, -5.521728515625, -4.603515625, -3.685302734375, -2.76708984375, -1.848876953125, -0.9306640625, -0.012451171875, 0.90576171875, 1.823974609375, 2.7421875, 3.660400390625, 4.57861328125, 5.496826171875, 6.4150390625, 7.333251953125, 8.25146484375, 9.169677734375, 10.087890625, 11.006103515625, 11.92431640625, 12.842529296875, 13.7607421875, 14.678955078125, 15.59716796875, 16.515380859375, 17.43359375, 18.351806640625, 19.27001953125, 20.188232421875, 21.1064453125, 22.024658203125, 22.94287109375, 23.861083984375, 24.779296875, 25.697509765625, 26.61572265625, 27.533935546875, 28.4521484375, 29.370361328125, 30.28857421875, 31.206787109375, 32.125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 9.0, 19.0, 17.0, 18.0, 43.0, 47.0, 58.0, 47.0, 83.0, 84.0, 73.0, 88.0, 72.0, 65.0, 63.0, 43.0, 44.0, 38.0, 19.0, 16.0, 18.0, 10.0, 6.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.092681884765625, -3.97833251953125, -3.863983154296875, -3.7496337890625, -3.635284423828125, -3.52093505859375, -3.406585693359375, -3.292236328125, -3.177886962890625, -3.06353759765625, -2.949188232421875, -2.8348388671875, -2.720489501953125, -2.60614013671875, -2.491790771484375, -2.37744140625, -2.263092041015625, -2.14874267578125, -2.034393310546875, -1.9200439453125, -1.805694580078125, -1.69134521484375, -1.576995849609375, -1.462646484375, -1.348297119140625, -1.23394775390625, -1.119598388671875, -1.0052490234375, -0.890899658203125, -0.77655029296875, -0.662200927734375, -0.5478515625, -0.433502197265625, -0.31915283203125, -0.204803466796875, -0.0904541015625, 0.023895263671875, 0.13824462890625, 0.252593994140625, 0.366943359375, 0.481292724609375, 0.59564208984375, 0.709991455078125, 0.8243408203125, 0.938690185546875, 1.05303955078125, 1.167388916015625, 1.28173828125, 1.396087646484375, 1.51043701171875, 1.624786376953125, 1.7391357421875, 1.853485107421875, 1.96783447265625, 2.082183837890625, 2.196533203125, 2.310882568359375, 2.42523193359375, 2.539581298828125, 2.6539306640625, 2.768280029296875, 2.88262939453125, 2.996978759765625, 3.111328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 14.0, 6.0, 11.0, 18.0, 31.0, 41.0, 48.0, 77.0, 98.0, 138.0, 258.0, 448.0, 892.0, 2093.0, 5456.0, 18866.0, 95647.0, 1811424.0, 2126760.0, 101907.0, 20079.0, 5783.0, 2063.0, 911.0, 447.0, 243.0, 157.0, 106.0, 73.0, 52.0, 23.0, 20.0, 16.0, 16.0, 11.0, 11.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.890625, -18.281494140625, -17.67236328125, -17.063232421875, -16.4541015625, -15.844970703125, -15.23583984375, -14.626708984375, -14.017578125, -13.408447265625, -12.79931640625, -12.190185546875, -11.5810546875, -10.971923828125, -10.36279296875, -9.753662109375, -9.14453125, -8.535400390625, -7.92626953125, -7.317138671875, -6.7080078125, -6.098876953125, -5.48974609375, -4.880615234375, -4.271484375, -3.662353515625, -3.05322265625, -2.444091796875, -1.8349609375, -1.225830078125, -0.61669921875, -0.007568359375, 0.6015625, 1.210693359375, 1.81982421875, 2.428955078125, 3.0380859375, 3.647216796875, 4.25634765625, 4.865478515625, 5.474609375, 6.083740234375, 6.69287109375, 7.302001953125, 7.9111328125, 8.520263671875, 9.12939453125, 9.738525390625, 10.34765625, 10.956787109375, 11.56591796875, 12.175048828125, 12.7841796875, 13.393310546875, 14.00244140625, 14.611572265625, 15.220703125, 15.829833984375, 16.43896484375, 17.048095703125, 17.6572265625, 18.266357421875, 18.87548828125, 19.484619140625, 20.09375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 5.0, 12.0, 20.0, 35.0, 46.0, 74.0, 129.0, 232.0, 627.0, 1503.0, 710.0, 265.0, 138.0, 87.0, 55.0, 42.0, 30.0, 19.0, 8.0, 8.0, 7.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-11.234375, -10.9876708984375, -10.740966796875, -10.4942626953125, -10.24755859375, -10.0008544921875, -9.754150390625, -9.5074462890625, -9.2607421875, -9.0140380859375, -8.767333984375, -8.5206298828125, -8.27392578125, -8.0272216796875, -7.780517578125, -7.5338134765625, -7.287109375, -7.0404052734375, -6.793701171875, -6.5469970703125, -6.30029296875, -6.0535888671875, -5.806884765625, -5.5601806640625, -5.3134765625, -5.0667724609375, -4.820068359375, -4.5733642578125, -4.32666015625, -4.0799560546875, -3.833251953125, -3.5865478515625, -3.33984375, -3.0931396484375, -2.846435546875, -2.5997314453125, -2.35302734375, -2.1063232421875, -1.859619140625, -1.6129150390625, -1.3662109375, -1.1195068359375, -0.872802734375, -0.6260986328125, -0.37939453125, -0.1326904296875, 0.114013671875, 0.3607177734375, 0.607421875, 0.8541259765625, 1.100830078125, 1.3475341796875, 1.59423828125, 1.8409423828125, 2.087646484375, 2.3343505859375, 2.5810546875, 2.8277587890625, 3.074462890625, 3.3211669921875, 3.56787109375, 3.8145751953125, 4.061279296875, 4.3079833984375, 4.5546875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 13.0, 16.0, 33.0, 73.0, 112.0, 137.0, 155.0, 136.0, 136.0, 81.0, 43.0, 35.0, 14.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.05807495117188, -66.18486785888672, -64.31166076660156, -62.43845748901367, -60.565250396728516, -58.692047119140625, -56.81884002685547, -54.94563293457031, -53.072425842285156, -51.19921875, -49.32601547241211, -47.45280838012695, -45.5796012878418, -43.706398010253906, -41.83319091796875, -39.959983825683594, -38.0867805480957, -36.21357345581055, -34.340370178222656, -32.4671630859375, -30.593955993652344, -28.72075080871582, -26.847545623779297, -24.97433853149414, -23.101133346557617, -21.227928161621094, -19.354721069335938, -17.481515884399414, -15.608309745788574, -13.735103607177734, -11.861898422241211, -9.988692283630371, -8.115486145019531, -6.242280006408691, -4.36907434463501, -2.495868682861328, -0.6226625442504883, 1.2505435943603516, 3.123748779296875, 4.996954917907715, 6.870161056518555, 8.743367195129395, 10.616573333740234, 12.489778518676758, 14.362984657287598, 16.236190795898438, 18.10939598083496, 19.982601165771484, 21.85580825805664, 23.729013442993164, 25.60222053527832, 27.475425720214844, 29.3486328125, 31.221837997436523, 33.09504318237305, 34.9682502746582, 36.841453552246094, 38.71466064453125, 40.58786392211914, 42.4610710144043, 44.33427810668945, 46.207481384277344, 48.0806884765625, 49.953895568847656, 51.82710266113281]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 5.0, 14.0, 15.0, 14.0, 18.0, 14.0, 11.0, 19.0, 24.0, 37.0, 31.0, 30.0, 38.0, 35.0, 40.0, 46.0, 42.0, 50.0, 39.0, 44.0, 45.0, 50.0, 37.0, 29.0, 42.0, 22.0, 29.0, 26.0, 26.0, 19.0, 25.0, 13.0, 17.0, 11.0, 10.0, 3.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-22.42424774169922, -21.78011703491211, -21.135986328125, -20.49185562133789, -19.84772491455078, -19.203596115112305, -18.559465408325195, -17.915334701538086, -17.271203994750977, -16.627073287963867, -15.982942581176758, -15.338812828063965, -14.694682121276855, -14.050551414489746, -13.406421661376953, -12.762290954589844, -12.118160247802734, -11.474029541015625, -10.829898834228516, -10.185769081115723, -9.541638374328613, -8.897507667541504, -8.253377914428711, -7.609247207641602, -6.965116500854492, -6.320985794067383, -5.676855564117432, -5.0327253341674805, -4.388594627380371, -3.744464159011841, -3.1003336906433105, -2.4562034606933594, -1.81207275390625, -1.1679422855377197, -0.5238118171691895, 0.12031865119934082, 0.7644491195678711, 1.4085795879364014, 2.0527100563049316, 2.696840286254883, 3.340970993041992, 3.9851014614105225, 4.629231929779053, 5.273362159729004, 5.917492866516113, 6.561623573303223, 7.205753803253174, 7.849884033203125, 8.494014739990234, 9.138145446777344, 9.782276153564453, 10.426405906677246, 11.070536613464355, 11.714667320251465, 12.358797073364258, 13.002927780151367, 13.647058486938477, 14.291189193725586, 14.935319900512695, 15.579449653625488, 16.22357940673828, 16.86771011352539, 17.5118408203125, 18.15597152709961, 18.80010223388672]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 5.0, 8.0, 8.0, 16.0, 13.0, 21.0, 25.0, 43.0, 52.0, 87.0, 118.0, 200.0, 327.0, 481.0, 981.0, 2025.0, 5024.0, 14078.0, 49829.0, 241917.0, 581678.0, 109386.0, 27177.0, 8550.0, 3156.0, 1420.0, 739.0, 432.0, 244.0, 164.0, 105.0, 69.0, 49.0, 26.0, 32.0, 16.0, 14.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.40625, -21.666015625, -20.92578125, -20.185546875, -19.4453125, -18.705078125, -17.96484375, -17.224609375, -16.484375, -15.744140625, -15.00390625, -14.263671875, -13.5234375, -12.783203125, -12.04296875, -11.302734375, -10.5625, -9.822265625, -9.08203125, -8.341796875, -7.6015625, -6.861328125, -6.12109375, -5.380859375, -4.640625, -3.900390625, -3.16015625, -2.419921875, -1.6796875, -0.939453125, -0.19921875, 0.541015625, 1.28125, 2.021484375, 2.76171875, 3.501953125, 4.2421875, 4.982421875, 5.72265625, 6.462890625, 7.203125, 7.943359375, 8.68359375, 9.423828125, 10.1640625, 10.904296875, 11.64453125, 12.384765625, 13.125, 13.865234375, 14.60546875, 15.345703125, 16.0859375, 16.826171875, 17.56640625, 18.306640625, 19.046875, 19.787109375, 20.52734375, 21.267578125, 22.0078125, 22.748046875, 23.48828125, 24.228515625, 24.96875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 12.0, 16.0, 17.0, 16.0, 33.0, 48.0, 50.0, 50.0, 79.0, 66.0, 90.0, 74.0, 83.0, 75.0, 68.0, 43.0, 40.0, 38.0, 32.0, 11.0, 17.0, 16.0, 5.0, 2.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.946807861328125, -3.83111572265625, -3.715423583984375, -3.5997314453125, -3.484039306640625, -3.36834716796875, -3.252655029296875, -3.136962890625, -3.021270751953125, -2.90557861328125, -2.789886474609375, -2.6741943359375, -2.558502197265625, -2.44281005859375, -2.327117919921875, -2.21142578125, -2.095733642578125, -1.98004150390625, -1.864349365234375, -1.7486572265625, -1.632965087890625, -1.51727294921875, -1.401580810546875, -1.285888671875, -1.170196533203125, -1.05450439453125, -0.938812255859375, -0.8231201171875, -0.707427978515625, -0.59173583984375, -0.476043701171875, -0.3603515625, -0.244659423828125, -0.12896728515625, -0.013275146484375, 0.1024169921875, 0.218109130859375, 0.33380126953125, 0.449493408203125, 0.565185546875, 0.680877685546875, 0.79656982421875, 0.912261962890625, 1.0279541015625, 1.143646240234375, 1.25933837890625, 1.375030517578125, 1.49072265625, 1.606414794921875, 1.72210693359375, 1.837799072265625, 1.9534912109375, 2.069183349609375, 2.18487548828125, 2.300567626953125, 2.416259765625, 2.531951904296875, 2.64764404296875, 2.763336181640625, 2.8790283203125, 2.994720458984375, 3.11041259765625, 3.226104736328125, 3.341796875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 13.0, 16.0, 22.0, 22.0, 45.0, 64.0, 80.0, 142.0, 167.0, 261.0, 434.0, 729.0, 1389.0, 3326.0, 9969.0, 36520.0, 166304.0, 615558.0, 161228.0, 35705.0, 9996.0, 3293.0, 1368.0, 700.0, 389.0, 228.0, 159.0, 101.0, 71.0, 71.0, 49.0, 36.0, 21.0, 18.0, 13.0, 4.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.609375, -21.00048828125, -20.3916015625, -19.78271484375, -19.173828125, -18.56494140625, -17.9560546875, -17.34716796875, -16.73828125, -16.12939453125, -15.5205078125, -14.91162109375, -14.302734375, -13.69384765625, -13.0849609375, -12.47607421875, -11.8671875, -11.25830078125, -10.6494140625, -10.04052734375, -9.431640625, -8.82275390625, -8.2138671875, -7.60498046875, -6.99609375, -6.38720703125, -5.7783203125, -5.16943359375, -4.560546875, -3.95166015625, -3.3427734375, -2.73388671875, -2.125, -1.51611328125, -0.9072265625, -0.29833984375, 0.310546875, 0.91943359375, 1.5283203125, 2.13720703125, 2.74609375, 3.35498046875, 3.9638671875, 4.57275390625, 5.181640625, 5.79052734375, 6.3994140625, 7.00830078125, 7.6171875, 8.22607421875, 8.8349609375, 9.44384765625, 10.052734375, 10.66162109375, 11.2705078125, 11.87939453125, 12.48828125, 13.09716796875, 13.7060546875, 14.31494140625, 14.923828125, 15.53271484375, 16.1416015625, 16.75048828125, 17.359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 6.0, 5.0, 11.0, 8.0, 8.0, 11.0, 18.0, 20.0, 18.0, 23.0, 27.0, 30.0, 23.0, 32.0, 39.0, 26.0, 46.0, 36.0, 48.0, 43.0, 40.0, 42.0, 42.0, 39.0, 43.0, 47.0, 32.0, 27.0, 29.0, 27.0, 28.0, 13.0, 26.0, 10.0, 20.0, 8.0, 8.0, 16.0, 3.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.6097412109375, -8.313232421875, -8.0167236328125, -7.72021484375, -7.4237060546875, -7.127197265625, -6.8306884765625, -6.5341796875, -6.2376708984375, -5.941162109375, -5.6446533203125, -5.34814453125, -5.0516357421875, -4.755126953125, -4.4586181640625, -4.162109375, -3.8656005859375, -3.569091796875, -3.2725830078125, -2.97607421875, -2.6795654296875, -2.383056640625, -2.0865478515625, -1.7900390625, -1.4935302734375, -1.197021484375, -0.9005126953125, -0.60400390625, -0.3074951171875, -0.010986328125, 0.2855224609375, 0.58203125, 0.8785400390625, 1.175048828125, 1.4715576171875, 1.76806640625, 2.0645751953125, 2.361083984375, 2.6575927734375, 2.9541015625, 3.2506103515625, 3.547119140625, 3.8436279296875, 4.14013671875, 4.4366455078125, 4.733154296875, 5.0296630859375, 5.326171875, 5.6226806640625, 5.919189453125, 6.2156982421875, 6.51220703125, 6.8087158203125, 7.105224609375, 7.4017333984375, 7.6982421875, 7.9947509765625, 8.291259765625, 8.5877685546875, 8.88427734375, 9.1807861328125, 9.477294921875, 9.7738037109375, 10.0703125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 5.0, 7.0, 5.0, 10.0, 13.0, 14.0, 18.0, 34.0, 36.0, 58.0, 116.0, 238.0, 628.0, 2188.0, 16276.0, 843572.0, 176421.0, 6802.0, 1268.0, 409.0, 169.0, 92.0, 52.0, 29.0, 23.0, 20.0, 11.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.296875, -27.407470703125, -26.51806640625, -25.628662109375, -24.7392578125, -23.849853515625, -22.96044921875, -22.071044921875, -21.181640625, -20.292236328125, -19.40283203125, -18.513427734375, -17.6240234375, -16.734619140625, -15.84521484375, -14.955810546875, -14.06640625, -13.177001953125, -12.28759765625, -11.398193359375, -10.5087890625, -9.619384765625, -8.72998046875, -7.840576171875, -6.951171875, -6.061767578125, -5.17236328125, -4.282958984375, -3.3935546875, -2.504150390625, -1.61474609375, -0.725341796875, 0.1640625, 1.053466796875, 1.94287109375, 2.832275390625, 3.7216796875, 4.611083984375, 5.50048828125, 6.389892578125, 7.279296875, 8.168701171875, 9.05810546875, 9.947509765625, 10.8369140625, 11.726318359375, 12.61572265625, 13.505126953125, 14.39453125, 15.283935546875, 16.17333984375, 17.062744140625, 17.9521484375, 18.841552734375, 19.73095703125, 20.620361328125, 21.509765625, 22.399169921875, 23.28857421875, 24.177978515625, 25.0673828125, 25.956787109375, 26.84619140625, 27.735595703125, 28.625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 10.0, 13.0, 14.0, 22.0, 17.0, 33.0, 52.0, 103.0, 155.0, 198.0, 132.0, 62.0, 43.0, 29.0, 18.0, 19.0, 17.0, 9.0, 10.0, 9.0, 4.0, 6.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011167526245117188, -0.0010707974433898926, -0.0010248422622680664, -0.0009788870811462402, -0.0009329319000244141, -0.0008869767189025879, -0.0008410215377807617, -0.0007950663566589355, -0.0007491111755371094, -0.0007031559944152832, -0.000657200813293457, -0.0006112456321716309, -0.0005652904510498047, -0.0005193352699279785, -0.00047338008880615234, -0.00042742490768432617, -0.0003814697265625, -0.00033551454544067383, -0.00028955936431884766, -0.00024360418319702148, -0.0001976490020751953, -0.00015169382095336914, -0.00010573863983154297, -5.97834587097168e-05, -1.3828277587890625e-05, 3.212690353393555e-05, 7.808208465576172e-05, 0.0001240372657775879, 0.00016999244689941406, 0.00021594762802124023, 0.0002619028091430664, 0.0003078579902648926, 0.00035381317138671875, 0.0003997683525085449, 0.0004457235336303711, 0.0004916787147521973, 0.0005376338958740234, 0.0005835890769958496, 0.0006295442581176758, 0.000675499439239502, 0.0007214546203613281, 0.0007674098014831543, 0.0008133649826049805, 0.0008593201637268066, 0.0009052753448486328, 0.000951230525970459, 0.0009971857070922852, 0.0010431408882141113, 0.0010890960693359375, 0.0011350512504577637, 0.0011810064315795898, 0.001226961612701416, 0.0012729167938232422, 0.0013188719749450684, 0.0013648271560668945, 0.0014107823371887207, 0.0014567375183105469, 0.001502692699432373, 0.0015486478805541992, 0.0015946030616760254, 0.0016405582427978516, 0.0016865134239196777, 0.001732468605041504, 0.00177842378616333, 0.0018243789672851562]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 2.0, 4.0, 6.0, 13.0, 11.0, 21.0, 24.0, 57.0, 123.0, 209.0, 474.0, 1263.0, 4917.0, 90316.0, 938915.0, 8955.0, 1974.0, 659.0, 300.0, 135.0, 73.0, 28.0, 29.0, 10.0, 12.0, 4.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.50146484375, -36.9716796875, -35.44189453125, -33.912109375, -32.38232421875, -30.8525390625, -29.32275390625, -27.79296875, -26.26318359375, -24.7333984375, -23.20361328125, -21.673828125, -20.14404296875, -18.6142578125, -17.08447265625, -15.5546875, -14.02490234375, -12.4951171875, -10.96533203125, -9.435546875, -7.90576171875, -6.3759765625, -4.84619140625, -3.31640625, -1.78662109375, -0.2568359375, 1.27294921875, 2.802734375, 4.33251953125, 5.8623046875, 7.39208984375, 8.921875, 10.45166015625, 11.9814453125, 13.51123046875, 15.041015625, 16.57080078125, 18.1005859375, 19.63037109375, 21.16015625, 22.68994140625, 24.2197265625, 25.74951171875, 27.279296875, 28.80908203125, 30.3388671875, 31.86865234375, 33.3984375, 34.92822265625, 36.4580078125, 37.98779296875, 39.517578125, 41.04736328125, 42.5771484375, 44.10693359375, 45.63671875, 47.16650390625, 48.6962890625, 50.22607421875, 51.755859375, 53.28564453125, 54.8154296875, 56.34521484375, 57.875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 13.0, 29.0, 63.0, 358.0, 369.0, 78.0, 30.0, 12.0, 13.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.640625, -23.819091796875, -22.99755859375, -22.176025390625, -21.3544921875, -20.532958984375, -19.71142578125, -18.889892578125, -18.068359375, -17.246826171875, -16.42529296875, -15.603759765625, -14.7822265625, -13.960693359375, -13.13916015625, -12.317626953125, -11.49609375, -10.674560546875, -9.85302734375, -9.031494140625, -8.2099609375, -7.388427734375, -6.56689453125, -5.745361328125, -4.923828125, -4.102294921875, -3.28076171875, -2.459228515625, -1.6376953125, -0.816162109375, 0.00537109375, 0.826904296875, 1.6484375, 2.469970703125, 3.29150390625, 4.113037109375, 4.9345703125, 5.756103515625, 6.57763671875, 7.399169921875, 8.220703125, 9.042236328125, 9.86376953125, 10.685302734375, 11.5068359375, 12.328369140625, 13.14990234375, 13.971435546875, 14.79296875, 15.614501953125, 16.43603515625, 17.257568359375, 18.0791015625, 18.900634765625, 19.72216796875, 20.543701171875, 21.365234375, 22.186767578125, 23.00830078125, 23.829833984375, 24.6513671875, 25.472900390625, 26.29443359375, 27.115966796875, 27.9375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 49.0, 276.0, 489.0, 153.0, 25.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-273.4330139160156, -259.2737731933594, -245.11451721191406, -230.95526123046875, -216.7960205078125, -202.63677978515625, -188.47752380371094, -174.31826782226562, -160.15902709960938, -145.99978637695312, -131.8405303955078, -117.68128204345703, -103.52203369140625, -89.36278533935547, -75.20353698730469, -61.044288635253906, -46.885040283203125, -32.725791931152344, -18.566543579101562, -4.407295227050781, 9.751953125, 23.91120147705078, 38.07044982910156, 52.229698181152344, 66.38894653320312, 80.5481948852539, 94.70744323730469, 108.86669158935547, 123.02593994140625, 137.1851806640625, 151.3444366455078, 165.50369262695312, 179.6629638671875, 193.82220458984375, 207.98146057128906, 222.14071655273438, 236.29995727539062, 250.45919799804688, 264.61846923828125, 278.7777099609375, 292.93695068359375, 307.09619140625, 321.25543212890625, 335.4147033691406, 349.5739440917969, 363.7331848144531, 377.8924560546875, 392.05169677734375, 406.2109375, 420.37017822265625, 434.5294189453125, 448.6886901855469, 462.8479309082031, 477.0071716308594, 491.16644287109375, 505.32568359375, 519.4849243164062, 533.6441650390625, 547.8034057617188, 561.962646484375, 576.1219482421875, 590.2811889648438, 604.4404296875, 618.5996704101562, 632.7589111328125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 11.0, 9.0, 2.0, 8.0, 20.0, 33.0, 44.0, 29.0, 43.0, 64.0, 83.0, 65.0, 71.0, 58.0, 57.0, 68.0, 65.0, 50.0, 44.0, 41.0, 36.0, 32.0, 25.0, 15.0, 3.0, 11.0, 6.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0], "bins": [-119.6133804321289, -116.91424560546875, -114.2151107788086, -111.51597595214844, -108.81684112548828, -106.11770629882812, -103.41856384277344, -100.71943664550781, -98.02029418945312, -95.32115936279297, -92.62202453613281, -89.92288970947266, -87.2237548828125, -84.52462005615234, -81.82548522949219, -79.1263427734375, -76.42721557617188, -73.72808074951172, -71.02894592285156, -68.3298110961914, -65.63067626953125, -62.931541442871094, -60.23240280151367, -57.533267974853516, -54.83413314819336, -52.1349983215332, -49.43586349487305, -46.736724853515625, -44.03759002685547, -41.33845520019531, -38.639320373535156, -35.940185546875, -33.24104690551758, -30.541912078857422, -27.842777252197266, -25.143640518188477, -22.44450569152832, -19.745370864868164, -17.046234130859375, -14.347099304199219, -11.647964477539062, -8.948829650878906, -6.249693870544434, -3.550558090209961, -0.8514232635498047, 1.8477115631103516, 4.546848297119141, 7.245983123779297, 9.945117950439453, 12.64425277709961, 15.343388557434082, 18.042524337768555, 20.74165916442871, 23.440793991088867, 26.139930725097656, 28.839065551757812, 31.53820037841797, 34.237335205078125, 36.93647003173828, 39.63560485839844, 42.334739685058594, 45.03387451171875, 47.73301315307617, 50.43214797973633, 53.131282806396484]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 3.0, 10.0, 10.0, 14.0, 20.0, 17.0, 27.0, 37.0, 45.0, 58.0, 81.0, 101.0, 136.0, 160.0, 215.0, 346.0, 629.0, 1107.0, 2470.0, 5424.0, 14726.0, 55974.0, 689430.0, 3299828.0, 89832.0, 20557.0, 6955.0, 2929.0, 1331.0, 703.0, 397.0, 208.0, 145.0, 116.0, 81.0, 29.0, 34.0, 23.0, 18.0, 13.0, 11.0, 10.0, 4.0, 7.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.859375, -24.034423828125, -23.20947265625, -22.384521484375, -21.5595703125, -20.734619140625, -19.90966796875, -19.084716796875, -18.259765625, -17.434814453125, -16.60986328125, -15.784912109375, -14.9599609375, -14.135009765625, -13.31005859375, -12.485107421875, -11.66015625, -10.835205078125, -10.01025390625, -9.185302734375, -8.3603515625, -7.535400390625, -6.71044921875, -5.885498046875, -5.060546875, -4.235595703125, -3.41064453125, -2.585693359375, -1.7607421875, -0.935791015625, -0.11083984375, 0.714111328125, 1.5390625, 2.364013671875, 3.18896484375, 4.013916015625, 4.8388671875, 5.663818359375, 6.48876953125, 7.313720703125, 8.138671875, 8.963623046875, 9.78857421875, 10.613525390625, 11.4384765625, 12.263427734375, 13.08837890625, 13.913330078125, 14.73828125, 15.563232421875, 16.38818359375, 17.213134765625, 18.0380859375, 18.863037109375, 19.68798828125, 20.512939453125, 21.337890625, 22.162841796875, 22.98779296875, 23.812744140625, 24.6376953125, 25.462646484375, 26.28759765625, 27.112548828125, 27.9375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 10.0, 9.0, 14.0, 15.0, 31.0, 37.0, 40.0, 51.0, 69.0, 70.0, 72.0, 72.0, 81.0, 78.0, 62.0, 51.0, 49.0, 45.0, 34.0, 31.0, 22.0, 16.0, 15.0, 7.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.13671875, -4.01837158203125, -3.9000244140625, -3.78167724609375, -3.663330078125, -3.54498291015625, -3.4266357421875, -3.30828857421875, -3.18994140625, -3.07159423828125, -2.9532470703125, -2.83489990234375, -2.716552734375, -2.59820556640625, -2.4798583984375, -2.36151123046875, -2.2431640625, -2.12481689453125, -2.0064697265625, -1.88812255859375, -1.769775390625, -1.65142822265625, -1.5330810546875, -1.41473388671875, -1.29638671875, -1.17803955078125, -1.0596923828125, -0.94134521484375, -0.822998046875, -0.70465087890625, -0.5863037109375, -0.46795654296875, -0.349609375, -0.23126220703125, -0.1129150390625, 0.00543212890625, 0.123779296875, 0.24212646484375, 0.3604736328125, 0.47882080078125, 0.59716796875, 0.71551513671875, 0.8338623046875, 0.95220947265625, 1.070556640625, 1.18890380859375, 1.3072509765625, 1.42559814453125, 1.5439453125, 1.66229248046875, 1.7806396484375, 1.89898681640625, 2.017333984375, 2.13568115234375, 2.2540283203125, 2.37237548828125, 2.49072265625, 2.60906982421875, 2.7274169921875, 2.84576416015625, 2.964111328125, 3.08245849609375, 3.2008056640625, 3.31915283203125, 3.4375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 11.0, 17.0, 21.0, 32.0, 61.0, 67.0, 118.0, 177.0, 295.0, 514.0, 944.0, 1947.0, 4085.0, 9961.0, 27616.0, 114249.0, 2078846.0, 1799501.0, 110955.0, 27242.0, 9783.0, 3883.0, 1821.0, 861.0, 505.0, 266.0, 165.0, 113.0, 75.0, 41.0, 34.0, 27.0, 12.0, 11.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.2725830078125, -15.763916015625, -15.2552490234375, -14.74658203125, -14.2379150390625, -13.729248046875, -13.2205810546875, -12.7119140625, -12.2032470703125, -11.694580078125, -11.1859130859375, -10.67724609375, -10.1685791015625, -9.659912109375, -9.1512451171875, -8.642578125, -8.1339111328125, -7.625244140625, -7.1165771484375, -6.60791015625, -6.0992431640625, -5.590576171875, -5.0819091796875, -4.5732421875, -4.0645751953125, -3.555908203125, -3.0472412109375, -2.53857421875, -2.0299072265625, -1.521240234375, -1.0125732421875, -0.50390625, 0.0047607421875, 0.513427734375, 1.0220947265625, 1.53076171875, 2.0394287109375, 2.548095703125, 3.0567626953125, 3.5654296875, 4.0740966796875, 4.582763671875, 5.0914306640625, 5.60009765625, 6.1087646484375, 6.617431640625, 7.1260986328125, 7.634765625, 8.1434326171875, 8.652099609375, 9.1607666015625, 9.66943359375, 10.1781005859375, 10.686767578125, 11.1954345703125, 11.7041015625, 12.2127685546875, 12.721435546875, 13.2301025390625, 13.73876953125, 14.2474365234375, 14.756103515625, 15.2647705078125, 15.7734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 4.0, 3.0, 8.0, 5.0, 12.0, 13.0, 21.0, 29.0, 56.0, 90.0, 197.0, 452.0, 1456.0, 994.0, 348.0, 144.0, 89.0, 50.0, 32.0, 23.0, 17.0, 9.0, 3.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.3817138671875, -7.150146484375, -6.9185791015625, -6.68701171875, -6.4554443359375, -6.223876953125, -5.9923095703125, -5.7607421875, -5.5291748046875, -5.297607421875, -5.0660400390625, -4.83447265625, -4.6029052734375, -4.371337890625, -4.1397705078125, -3.908203125, -3.6766357421875, -3.445068359375, -3.2135009765625, -2.98193359375, -2.7503662109375, -2.518798828125, -2.2872314453125, -2.0556640625, -1.8240966796875, -1.592529296875, -1.3609619140625, -1.12939453125, -0.8978271484375, -0.666259765625, -0.4346923828125, -0.203125, 0.0284423828125, 0.260009765625, 0.4915771484375, 0.72314453125, 0.9547119140625, 1.186279296875, 1.4178466796875, 1.6494140625, 1.8809814453125, 2.112548828125, 2.3441162109375, 2.57568359375, 2.8072509765625, 3.038818359375, 3.2703857421875, 3.501953125, 3.7335205078125, 3.965087890625, 4.1966552734375, 4.42822265625, 4.6597900390625, 4.891357421875, 5.1229248046875, 5.3544921875, 5.5860595703125, 5.817626953125, 6.0491943359375, 6.28076171875, 6.5123291015625, 6.743896484375, 6.9754638671875, 7.20703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 17.0, 18.0, 25.0, 46.0, 88.0, 127.0, 127.0, 157.0, 133.0, 90.0, 69.0, 41.0, 24.0, 13.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.59861373901367, -57.10755920410156, -55.61650466918945, -54.125450134277344, -52.6343994140625, -51.14334487915039, -49.65229034423828, -48.16123580932617, -46.67018127441406, -45.17912673950195, -43.688072204589844, -42.197017669677734, -40.705963134765625, -39.21491241455078, -37.72385787963867, -36.23280334472656, -34.74174880981445, -33.250694274902344, -31.759639739990234, -30.268587112426758, -28.77753257751465, -27.28647804260254, -25.795425415039062, -24.304370880126953, -22.813316345214844, -21.322261810302734, -19.831207275390625, -18.34015464782715, -16.84910011291504, -15.35804557800293, -13.866991996765137, -12.375938415527344, -10.884883880615234, -9.393829345703125, -7.902775764465332, -6.411721706390381, -4.92066764831543, -3.4296135902404785, -1.9385595321655273, -0.4475059509277344, 1.043548583984375, 2.534602642059326, 4.025656700134277, 5.5167107582092285, 7.00776481628418, 8.498819351196289, 9.989872932434082, 11.480926513671875, 12.971981048583984, 14.463035583496094, 15.954089164733887, 17.44514274597168, 18.93619728088379, 20.4272518157959, 21.918304443359375, 23.409358978271484, 24.900413513183594, 26.391468048095703, 27.882522583007812, 29.37357521057129, 30.8646297454834, 32.355682373046875, 33.846736907958984, 35.337791442871094, 36.8288459777832]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 7.0, 10.0, 9.0, 12.0, 17.0, 21.0, 28.0, 52.0, 46.0, 43.0, 59.0, 62.0, 60.0, 81.0, 75.0, 82.0, 70.0, 48.0, 47.0, 46.0, 31.0, 23.0, 20.0, 18.0, 12.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.358570098876953, -30.502370834350586, -29.646169662475586, -28.78997039794922, -27.93376922607422, -27.07756996154785, -26.221370697021484, -25.365169525146484, -24.508968353271484, -23.652769088745117, -22.796567916870117, -21.94036865234375, -21.08416748046875, -20.227968215942383, -19.371768951416016, -18.515567779541016, -17.65936851501465, -16.80316925048828, -15.946968078613281, -15.090768814086914, -14.234567642211914, -13.378368377685547, -12.522168159484863, -11.66596794128418, -10.809767723083496, -9.953567504882812, -9.097367286682129, -8.241167068481445, -7.38496732711792, -6.528767108917236, -5.672567367553711, -4.816367149353027, -3.960165023803711, -3.1039648056030273, -2.247764825820923, -1.3915648460388184, -0.5353646278381348, 0.32083559036254883, 1.1770353317260742, 2.033235549926758, 2.8894357681274414, 3.745635986328125, 4.601836204528809, 5.458035945892334, 6.314236164093018, 7.170436382293701, 8.026636123657227, 8.88283634185791, 9.739036560058594, 10.595236778259277, 11.451436996459961, 12.307636260986328, 13.163837432861328, 14.020036697387695, 14.876236915588379, 15.732437133789062, 16.588638305664062, 17.44483757019043, 18.30103874206543, 19.157238006591797, 20.013439178466797, 20.869638442993164, 21.72583770751953, 22.58203887939453, 23.4382381439209]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 10.0, 10.0, 19.0, 23.0, 36.0, 47.0, 84.0, 131.0, 220.0, 344.0, 588.0, 1214.0, 3084.0, 9930.0, 39117.0, 208120.0, 645837.0, 105324.0, 23598.0, 6437.0, 2199.0, 917.0, 486.0, 288.0, 177.0, 107.0, 78.0, 38.0, 28.0, 14.0, 15.0, 12.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.046875, -26.2587890625, -25.470703125, -24.6826171875, -23.89453125, -23.1064453125, -22.318359375, -21.5302734375, -20.7421875, -19.9541015625, -19.166015625, -18.3779296875, -17.58984375, -16.8017578125, -16.013671875, -15.2255859375, -14.4375, -13.6494140625, -12.861328125, -12.0732421875, -11.28515625, -10.4970703125, -9.708984375, -8.9208984375, -8.1328125, -7.3447265625, -6.556640625, -5.7685546875, -4.98046875, -4.1923828125, -3.404296875, -2.6162109375, -1.828125, -1.0400390625, -0.251953125, 0.5361328125, 1.32421875, 2.1123046875, 2.900390625, 3.6884765625, 4.4765625, 5.2646484375, 6.052734375, 6.8408203125, 7.62890625, 8.4169921875, 9.205078125, 9.9931640625, 10.78125, 11.5693359375, 12.357421875, 13.1455078125, 13.93359375, 14.7216796875, 15.509765625, 16.2978515625, 17.0859375, 17.8740234375, 18.662109375, 19.4501953125, 20.23828125, 21.0263671875, 21.814453125, 22.6025390625, 23.390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 13.0, 27.0, 21.0, 25.0, 32.0, 47.0, 61.0, 75.0, 66.0, 75.0, 69.0, 95.0, 71.0, 44.0, 49.0, 46.0, 48.0, 32.0, 22.0, 20.0, 17.0, 12.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.03607177734375, -3.9119873046875, -3.78790283203125, -3.663818359375, -3.53973388671875, -3.4156494140625, -3.29156494140625, -3.16748046875, -3.04339599609375, -2.9193115234375, -2.79522705078125, -2.671142578125, -2.54705810546875, -2.4229736328125, -2.29888916015625, -2.1748046875, -2.05072021484375, -1.9266357421875, -1.80255126953125, -1.678466796875, -1.55438232421875, -1.4302978515625, -1.30621337890625, -1.18212890625, -1.05804443359375, -0.9339599609375, -0.80987548828125, -0.685791015625, -0.56170654296875, -0.4376220703125, -0.31353759765625, -0.189453125, -0.06536865234375, 0.0587158203125, 0.18280029296875, 0.306884765625, 0.43096923828125, 0.5550537109375, 0.67913818359375, 0.80322265625, 0.92730712890625, 1.0513916015625, 1.17547607421875, 1.299560546875, 1.42364501953125, 1.5477294921875, 1.67181396484375, 1.7958984375, 1.91998291015625, 2.0440673828125, 2.16815185546875, 2.292236328125, 2.41632080078125, 2.5404052734375, 2.66448974609375, 2.78857421875, 2.91265869140625, 3.0367431640625, 3.16082763671875, 3.284912109375, 3.40899658203125, 3.5330810546875, 3.65716552734375, 3.78125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 15.0, 12.0, 29.0, 34.0, 57.0, 71.0, 114.0, 145.0, 289.0, 470.0, 1012.0, 2266.0, 5529.0, 14565.0, 39315.0, 124923.0, 499911.0, 256082.0, 65260.0, 23178.0, 8760.0, 3381.0, 1475.0, 700.0, 319.0, 218.0, 141.0, 89.0, 52.0, 32.0, 27.0, 21.0, 16.0, 8.0, 3.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-13.25, -12.83251953125, -12.4150390625, -11.99755859375, -11.580078125, -11.16259765625, -10.7451171875, -10.32763671875, -9.91015625, -9.49267578125, -9.0751953125, -8.65771484375, -8.240234375, -7.82275390625, -7.4052734375, -6.98779296875, -6.5703125, -6.15283203125, -5.7353515625, -5.31787109375, -4.900390625, -4.48291015625, -4.0654296875, -3.64794921875, -3.23046875, -2.81298828125, -2.3955078125, -1.97802734375, -1.560546875, -1.14306640625, -0.7255859375, -0.30810546875, 0.109375, 0.52685546875, 0.9443359375, 1.36181640625, 1.779296875, 2.19677734375, 2.6142578125, 3.03173828125, 3.44921875, 3.86669921875, 4.2841796875, 4.70166015625, 5.119140625, 5.53662109375, 5.9541015625, 6.37158203125, 6.7890625, 7.20654296875, 7.6240234375, 8.04150390625, 8.458984375, 8.87646484375, 9.2939453125, 9.71142578125, 10.12890625, 10.54638671875, 10.9638671875, 11.38134765625, 11.798828125, 12.21630859375, 12.6337890625, 13.05126953125, 13.46875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 5.0, 9.0, 9.0, 14.0, 7.0, 16.0, 15.0, 19.0, 26.0, 24.0, 32.0, 33.0, 32.0, 32.0, 43.0, 36.0, 32.0, 43.0, 43.0, 45.0, 40.0, 36.0, 38.0, 31.0, 36.0, 32.0, 39.0, 25.0, 21.0, 25.0, 19.0, 21.0, 18.0, 11.0, 4.0, 7.0, 10.0, 11.0, 7.0, 10.0, 10.0, 7.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0], "bins": [-9.640625, -9.3623046875, -9.083984375, -8.8056640625, -8.52734375, -8.2490234375, -7.970703125, -7.6923828125, -7.4140625, -7.1357421875, -6.857421875, -6.5791015625, -6.30078125, -6.0224609375, -5.744140625, -5.4658203125, -5.1875, -4.9091796875, -4.630859375, -4.3525390625, -4.07421875, -3.7958984375, -3.517578125, -3.2392578125, -2.9609375, -2.6826171875, -2.404296875, -2.1259765625, -1.84765625, -1.5693359375, -1.291015625, -1.0126953125, -0.734375, -0.4560546875, -0.177734375, 0.1005859375, 0.37890625, 0.6572265625, 0.935546875, 1.2138671875, 1.4921875, 1.7705078125, 2.048828125, 2.3271484375, 2.60546875, 2.8837890625, 3.162109375, 3.4404296875, 3.71875, 3.9970703125, 4.275390625, 4.5537109375, 4.83203125, 5.1103515625, 5.388671875, 5.6669921875, 5.9453125, 6.2236328125, 6.501953125, 6.7802734375, 7.05859375, 7.3369140625, 7.615234375, 7.8935546875, 8.171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 23.0, 25.0, 29.0, 59.0, 91.0, 121.0, 202.0, 382.0, 770.0, 1789.0, 5011.0, 14403.0, 46850.0, 206716.0, 548339.0, 164702.0, 39265.0, 12432.0, 4174.0, 1620.0, 667.0, 351.0, 176.0, 107.0, 65.0, 47.0, 38.0, 19.0, 16.0, 13.0, 13.0, 10.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.724609375, -3.550811767578125, -3.37701416015625, -3.203216552734375, -3.0294189453125, -2.855621337890625, -2.68182373046875, -2.508026123046875, -2.334228515625, -2.160430908203125, -1.98663330078125, -1.812835693359375, -1.6390380859375, -1.465240478515625, -1.29144287109375, -1.117645263671875, -0.94384765625, -0.770050048828125, -0.59625244140625, -0.422454833984375, -0.2486572265625, -0.074859619140625, 0.09893798828125, 0.272735595703125, 0.446533203125, 0.620330810546875, 0.79412841796875, 0.967926025390625, 1.1417236328125, 1.315521240234375, 1.48931884765625, 1.663116455078125, 1.8369140625, 2.010711669921875, 2.18450927734375, 2.358306884765625, 2.5321044921875, 2.705902099609375, 2.87969970703125, 3.053497314453125, 3.227294921875, 3.401092529296875, 3.57489013671875, 3.748687744140625, 3.9224853515625, 4.096282958984375, 4.27008056640625, 4.443878173828125, 4.61767578125, 4.791473388671875, 4.96527099609375, 5.139068603515625, 5.3128662109375, 5.486663818359375, 5.66046142578125, 5.834259033203125, 6.008056640625, 6.181854248046875, 6.35565185546875, 6.529449462890625, 6.7032470703125, 6.877044677734375, 7.05084228515625, 7.224639892578125, 7.3984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 3.0, 3.0, 11.0, 4.0, 14.0, 6.0, 12.0, 18.0, 10.0, 15.0, 31.0, 61.0, 115.0, 190.0, 204.0, 103.0, 54.0, 34.0, 17.0, 20.0, 16.0, 11.0, 13.0, 10.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0014553070068359375, -0.0014198347926139832, -0.0013843625783920288, -0.0013488903641700745, -0.0013134181499481201, -0.0012779459357261658, -0.0012424737215042114, -0.001207001507282257, -0.0011715292930603027, -0.0011360570788383484, -0.001100584864616394, -0.0010651126503944397, -0.0010296404361724854, -0.000994168221950531, -0.0009586960077285767, -0.0009232237935066223, -0.000887751579284668, -0.0008522793650627136, -0.0008168071508407593, -0.0007813349366188049, -0.0007458627223968506, -0.0007103905081748962, -0.0006749182939529419, -0.0006394460797309875, -0.0006039738655090332, -0.0005685016512870789, -0.0005330294370651245, -0.0004975572228431702, -0.0004620850086212158, -0.0004266127943992615, -0.00039114058017730713, -0.0003556683659553528, -0.00032019615173339844, -0.0002847239375114441, -0.00024925172328948975, -0.0002137795090675354, -0.00017830729484558105, -0.0001428350806236267, -0.00010736286640167236, -7.189065217971802e-05, -3.641843795776367e-05, -9.462237358093262e-07, 3.452599048614502e-05, 6.999820470809937e-05, 0.00010547041893005371, 0.00014094263315200806, 0.0001764148473739624, 0.00021188706159591675, 0.0002473592758178711, 0.00028283149003982544, 0.0003183037042617798, 0.00035377591848373413, 0.0003892481327056885, 0.0004247203469276428, 0.00046019256114959717, 0.0004956647753715515, 0.0005311369895935059, 0.0005666092038154602, 0.0006020814180374146, 0.0006375536322593689, 0.0006730258464813232, 0.0007084980607032776, 0.0007439702749252319, 0.0007794424891471863, 0.0008149147033691406]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 11.0, 15.0, 35.0, 39.0, 90.0, 147.0, 309.0, 600.0, 1585.0, 5553.0, 24556.0, 147404.0, 703635.0, 133823.0, 22859.0, 5208.0, 1433.0, 544.0, 306.0, 174.0, 87.0, 52.0, 27.0, 19.0, 19.0, 9.0, 2.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2578125, -8.03143310546875, -7.8050537109375, -7.57867431640625, -7.352294921875, -7.12591552734375, -6.8995361328125, -6.67315673828125, -6.44677734375, -6.22039794921875, -5.9940185546875, -5.76763916015625, -5.541259765625, -5.31488037109375, -5.0885009765625, -4.86212158203125, -4.6357421875, -4.40936279296875, -4.1829833984375, -3.95660400390625, -3.730224609375, -3.50384521484375, -3.2774658203125, -3.05108642578125, -2.82470703125, -2.59832763671875, -2.3719482421875, -2.14556884765625, -1.919189453125, -1.69281005859375, -1.4664306640625, -1.24005126953125, -1.013671875, -0.78729248046875, -0.5609130859375, -0.33453369140625, -0.108154296875, 0.11822509765625, 0.3446044921875, 0.57098388671875, 0.79736328125, 1.02374267578125, 1.2501220703125, 1.47650146484375, 1.702880859375, 1.92926025390625, 2.1556396484375, 2.38201904296875, 2.6083984375, 2.83477783203125, 3.0611572265625, 3.28753662109375, 3.513916015625, 3.74029541015625, 3.9666748046875, 4.19305419921875, 4.41943359375, 4.64581298828125, 4.8721923828125, 5.09857177734375, 5.324951171875, 5.55133056640625, 5.7777099609375, 6.00408935546875, 6.23046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 9.0, 17.0, 13.0, 26.0, 28.0, 39.0, 49.0, 58.0, 80.0, 93.0, 117.0, 111.0, 73.0, 55.0, 48.0, 40.0, 18.0, 21.0, 16.0, 12.0, 10.0, 11.0, 9.0, 4.0, 7.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.21875, -4.10247802734375, -3.9862060546875, -3.86993408203125, -3.753662109375, -3.63739013671875, -3.5211181640625, -3.40484619140625, -3.28857421875, -3.17230224609375, -3.0560302734375, -2.93975830078125, -2.823486328125, -2.70721435546875, -2.5909423828125, -2.47467041015625, -2.3583984375, -2.24212646484375, -2.1258544921875, -2.00958251953125, -1.893310546875, -1.77703857421875, -1.6607666015625, -1.54449462890625, -1.42822265625, -1.31195068359375, -1.1956787109375, -1.07940673828125, -0.963134765625, -0.84686279296875, -0.7305908203125, -0.61431884765625, -0.498046875, -0.38177490234375, -0.2655029296875, -0.14923095703125, -0.032958984375, 0.08331298828125, 0.1995849609375, 0.31585693359375, 0.43212890625, 0.54840087890625, 0.6646728515625, 0.78094482421875, 0.897216796875, 1.01348876953125, 1.1297607421875, 1.24603271484375, 1.3623046875, 1.47857666015625, 1.5948486328125, 1.71112060546875, 1.827392578125, 1.94366455078125, 2.0599365234375, 2.17620849609375, 2.29248046875, 2.40875244140625, 2.5250244140625, 2.64129638671875, 2.757568359375, 2.87384033203125, 2.9901123046875, 3.10638427734375, 3.22265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 13.0, 18.0, 46.0, 60.0, 79.0, 137.0, 160.0, 164.0, 137.0, 79.0, 48.0, 28.0, 18.0, 10.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.22698974609375, -73.6961669921875, -70.16534423828125, -66.634521484375, -63.10369873046875, -59.5728759765625, -56.042057037353516, -52.511234283447266, -48.980411529541016, -45.449588775634766, -41.918766021728516, -38.38794708251953, -34.85712432861328, -31.3262996673584, -27.79547882080078, -24.26465606689453, -20.73383331298828, -17.20301055908203, -13.672188758850098, -10.141366958618164, -6.610544204711914, -3.079721450805664, 0.4510993957519531, 3.981922149658203, 7.512744903564453, 11.043567657470703, 14.574389457702637, 18.10521125793457, 21.63603401184082, 25.16685676574707, 28.697677612304688, 32.22850036621094, 35.75932312011719, 39.29014587402344, 42.82096862792969, 46.35179138183594, 49.88261413574219, 53.41343688964844, 56.94425582885742, 60.47507858276367, 64.00590515136719, 67.53672790527344, 71.06755065917969, 74.59837341308594, 78.12919616699219, 81.66001892089844, 85.19084167480469, 88.72166442871094, 92.25247955322266, 95.7833023071289, 99.31412506103516, 102.8449478149414, 106.37577056884766, 109.9065933227539, 113.43740844726562, 116.96823120117188, 120.49905395507812, 124.02987670898438, 127.56069946289062, 131.09152221679688, 134.62234497070312, 138.15316772460938, 141.68399047851562, 145.21481323242188, 148.74563598632812]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 12.0, 14.0, 13.0, 13.0, 22.0, 29.0, 30.0, 24.0, 26.0, 30.0, 29.0, 34.0, 47.0, 61.0, 34.0, 47.0, 34.0, 45.0, 34.0, 44.0, 43.0, 39.0, 38.0, 42.0, 25.0, 23.0, 19.0, 20.0, 24.0, 15.0, 14.0, 15.0, 11.0, 8.0, 9.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.173648834228516, -44.74121856689453, -43.30878829956055, -41.87635803222656, -40.44392395019531, -39.01149368286133, -37.579063415527344, -36.14663314819336, -34.714202880859375, -33.28177261352539, -31.849342346191406, -30.41691017150879, -28.984479904174805, -27.55204963684082, -26.119617462158203, -24.68718719482422, -23.254756927490234, -21.82232666015625, -20.389896392822266, -18.95746421813965, -17.525033950805664, -16.09260368347168, -14.660172462463379, -13.227741241455078, -11.795310974121094, -10.36288070678711, -8.930449485778809, -7.498018741607666, -6.065587997436523, -4.633157253265381, -3.2007265090942383, -1.7682952880859375, -0.3358612060546875, 1.096569538116455, 2.5290002822875977, 3.9614310264587402, 5.393861770629883, 6.826292514801025, 8.258723258972168, 9.691154479980469, 11.123584747314453, 12.556015014648438, 13.988446235656738, 15.420877456665039, 16.853307723999023, 18.285737991333008, 19.718170166015625, 21.15060043334961, 22.583030700683594, 24.015460968017578, 25.447891235351562, 26.88032341003418, 28.312753677368164, 29.74518394470215, 31.177616119384766, 32.61004638671875, 34.042476654052734, 35.47490692138672, 36.9073371887207, 38.33976745605469, 39.77220153808594, 41.20463180541992, 42.637062072753906, 44.06949234008789, 45.501922607421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 10.0, 13.0, 20.0, 28.0, 46.0, 67.0, 85.0, 135.0, 158.0, 259.0, 391.0, 717.0, 1466.0, 3344.0, 9662.0, 35301.0, 289809.0, 3707505.0, 112113.0, 21821.0, 6638.0, 2461.0, 1054.0, 524.0, 242.0, 138.0, 82.0, 61.0, 29.0, 30.0, 21.0, 12.0, 13.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.28125, -30.21435546875, -29.1474609375, -28.08056640625, -27.013671875, -25.94677734375, -24.8798828125, -23.81298828125, -22.74609375, -21.67919921875, -20.6123046875, -19.54541015625, -18.478515625, -17.41162109375, -16.3447265625, -15.27783203125, -14.2109375, -13.14404296875, -12.0771484375, -11.01025390625, -9.943359375, -8.87646484375, -7.8095703125, -6.74267578125, -5.67578125, -4.60888671875, -3.5419921875, -2.47509765625, -1.408203125, -0.34130859375, 0.7255859375, 1.79248046875, 2.859375, 3.92626953125, 4.9931640625, 6.06005859375, 7.126953125, 8.19384765625, 9.2607421875, 10.32763671875, 11.39453125, 12.46142578125, 13.5283203125, 14.59521484375, 15.662109375, 16.72900390625, 17.7958984375, 18.86279296875, 19.9296875, 20.99658203125, 22.0634765625, 23.13037109375, 24.197265625, 25.26416015625, 26.3310546875, 27.39794921875, 28.46484375, 29.53173828125, 30.5986328125, 31.66552734375, 32.732421875, 33.79931640625, 34.8662109375, 35.93310546875, 37.0]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 12.0, 16.0, 22.0, 28.0, 23.0, 40.0, 51.0, 49.0, 57.0, 64.0, 74.0, 80.0, 76.0, 70.0, 56.0, 55.0, 43.0, 40.0, 28.0, 32.0, 20.0, 11.0, 9.0, 14.0, 9.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.0472412109375, -3.926513671875, -3.8057861328125, -3.68505859375, -3.5643310546875, -3.443603515625, -3.3228759765625, -3.2021484375, -3.0814208984375, -2.960693359375, -2.8399658203125, -2.71923828125, -2.5985107421875, -2.477783203125, -2.3570556640625, -2.236328125, -2.1156005859375, -1.994873046875, -1.8741455078125, -1.75341796875, -1.6326904296875, -1.511962890625, -1.3912353515625, -1.2705078125, -1.1497802734375, -1.029052734375, -0.9083251953125, -0.78759765625, -0.6668701171875, -0.546142578125, -0.4254150390625, -0.3046875, -0.1839599609375, -0.063232421875, 0.0574951171875, 0.17822265625, 0.2989501953125, 0.419677734375, 0.5404052734375, 0.6611328125, 0.7818603515625, 0.902587890625, 1.0233154296875, 1.14404296875, 1.2647705078125, 1.385498046875, 1.5062255859375, 1.626953125, 1.7476806640625, 1.868408203125, 1.9891357421875, 2.10986328125, 2.2305908203125, 2.351318359375, 2.4720458984375, 2.5927734375, 2.7135009765625, 2.834228515625, 2.9549560546875, 3.07568359375, 3.1964111328125, 3.317138671875, 3.4378662109375, 3.55859375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 11.0, 8.0, 18.0, 19.0, 22.0, 29.0, 39.0, 71.0, 103.0, 144.0, 229.0, 329.0, 483.0, 831.0, 1368.0, 2440.0, 4247.0, 8198.0, 16017.0, 36032.0, 98599.0, 501727.0, 3102140.0, 290089.0, 72813.0, 28927.0, 13417.0, 6817.0, 3714.0, 2075.0, 1232.0, 752.0, 456.0, 281.0, 182.0, 143.0, 86.0, 58.0, 36.0, 26.0, 25.0, 21.0, 7.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.5390625, -13.13330078125, -12.7275390625, -12.32177734375, -11.916015625, -11.51025390625, -11.1044921875, -10.69873046875, -10.29296875, -9.88720703125, -9.4814453125, -9.07568359375, -8.669921875, -8.26416015625, -7.8583984375, -7.45263671875, -7.046875, -6.64111328125, -6.2353515625, -5.82958984375, -5.423828125, -5.01806640625, -4.6123046875, -4.20654296875, -3.80078125, -3.39501953125, -2.9892578125, -2.58349609375, -2.177734375, -1.77197265625, -1.3662109375, -0.96044921875, -0.5546875, -0.14892578125, 0.2568359375, 0.66259765625, 1.068359375, 1.47412109375, 1.8798828125, 2.28564453125, 2.69140625, 3.09716796875, 3.5029296875, 3.90869140625, 4.314453125, 4.72021484375, 5.1259765625, 5.53173828125, 5.9375, 6.34326171875, 6.7490234375, 7.15478515625, 7.560546875, 7.96630859375, 8.3720703125, 8.77783203125, 9.18359375, 9.58935546875, 9.9951171875, 10.40087890625, 10.806640625, 11.21240234375, 11.6181640625, 12.02392578125, 12.4296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 7.0, 9.0, 13.0, 20.0, 20.0, 26.0, 22.0, 55.0, 70.0, 107.0, 173.0, 326.0, 947.0, 1304.0, 377.0, 217.0, 96.0, 66.0, 52.0, 34.0, 27.0, 14.0, 15.0, 20.0, 5.0, 5.0, 5.0, 7.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.8359375, -5.65936279296875, -5.4827880859375, -5.30621337890625, -5.129638671875, -4.95306396484375, -4.7764892578125, -4.59991455078125, -4.42333984375, -4.24676513671875, -4.0701904296875, -3.89361572265625, -3.717041015625, -3.54046630859375, -3.3638916015625, -3.18731689453125, -3.0107421875, -2.83416748046875, -2.6575927734375, -2.48101806640625, -2.304443359375, -2.12786865234375, -1.9512939453125, -1.77471923828125, -1.59814453125, -1.42156982421875, -1.2449951171875, -1.06842041015625, -0.891845703125, -0.71527099609375, -0.5386962890625, -0.36212158203125, -0.185546875, -0.00897216796875, 0.1676025390625, 0.34417724609375, 0.520751953125, 0.69732666015625, 0.8739013671875, 1.05047607421875, 1.22705078125, 1.40362548828125, 1.5802001953125, 1.75677490234375, 1.933349609375, 2.10992431640625, 2.2864990234375, 2.46307373046875, 2.6396484375, 2.81622314453125, 2.9927978515625, 3.16937255859375, 3.345947265625, 3.52252197265625, 3.6990966796875, 3.87567138671875, 4.05224609375, 4.22882080078125, 4.4053955078125, 4.58197021484375, 4.758544921875, 4.93511962890625, 5.1116943359375, 5.28826904296875, 5.46484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 13.0, 34.0, 159.0, 414.0, 297.0, 69.0, 20.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-222.7930908203125, -218.32656860351562, -213.8600311279297, -209.3935089111328, -204.92697143554688, -200.46044921875, -195.99391174316406, -191.5273895263672, -187.06085205078125, -182.59432983398438, -178.12779235839844, -173.66127014160156, -169.19473266601562, -164.72821044921875, -160.2616729736328, -155.79515075683594, -151.32862854003906, -146.8621063232422, -142.39556884765625, -137.92904663085938, -133.46250915527344, -128.99598693847656, -124.52945709228516, -120.06292724609375, -115.59639739990234, -111.12986755371094, -106.66333770751953, -102.19680786132812, -97.73028564453125, -93.26374816894531, -88.79722595214844, -84.33069610595703, -79.86416625976562, -75.39763641357422, -70.93110656738281, -66.4645767211914, -61.998050689697266, -57.53152084350586, -53.06499481201172, -48.59846496582031, -44.13193893432617, -39.665409088134766, -35.198883056640625, -30.73235321044922, -26.265823364257812, -21.799293518066406, -17.332765579223633, -12.86623764038086, -8.399707794189453, -3.9331789016723633, 0.5333499908447266, 4.999878883361816, 9.466407775878906, 13.932937622070312, 18.399465560913086, 22.86599349975586, 27.332523345947266, 31.799053192138672, 36.26557922363281, 40.73210906982422, 45.198638916015625, 49.66516876220703, 54.13169860839844, 58.59822463989258, 63.064754486083984]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 12.0, 7.0, 10.0, 16.0, 15.0, 14.0, 20.0, 25.0, 24.0, 36.0, 30.0, 47.0, 32.0, 48.0, 37.0, 46.0, 49.0, 61.0, 49.0, 43.0, 53.0, 47.0, 32.0, 51.0, 32.0, 43.0, 22.0, 28.0, 21.0, 12.0, 8.0, 7.0, 7.0, 3.0, 6.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.829288482666016, -26.098031997680664, -25.366775512695312, -24.63551902770996, -23.90426254272461, -23.173004150390625, -22.441749572753906, -21.710491180419922, -20.97923469543457, -20.24797821044922, -19.516721725463867, -18.785465240478516, -18.054208755493164, -17.322952270507812, -16.591693878173828, -15.860437393188477, -15.129181861877441, -14.39792537689209, -13.666668891906738, -12.93541145324707, -12.204154968261719, -11.472898483276367, -10.741641998291016, -10.010385513305664, -9.279129028320312, -8.547872543334961, -7.816615581512451, -7.0853590965271, -6.35410213470459, -5.622845649719238, -4.891589164733887, -4.160332202911377, -3.429075241088867, -2.6978185176849365, -1.9665619134902954, -1.2353053092956543, -0.5040485858917236, 0.22720813751220703, 0.9584646224975586, 1.6897215843200684, 2.42097806930542, 3.1522347927093506, 3.8834915161132812, 4.614748001098633, 5.346004486083984, 6.077261447906494, 6.808517932891846, 7.5397748947143555, 8.271031379699707, 9.002287864685059, 9.73354434967041, 10.464801788330078, 11.19605827331543, 11.927314758300781, 12.658571243286133, 13.389827728271484, 14.121084213256836, 14.852340698242188, 15.583597183227539, 16.31485366821289, 17.046110153198242, 17.777366638183594, 18.508625030517578, 19.23988151550293, 19.97113800048828]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 5.0, 6.0, 7.0, 19.0, 27.0, 35.0, 68.0, 88.0, 128.0, 211.0, 315.0, 544.0, 988.0, 1898.0, 4363.0, 13428.0, 49298.0, 187004.0, 530693.0, 188168.0, 49159.0, 13415.0, 4449.0, 1925.0, 875.0, 526.0, 325.0, 177.0, 122.0, 100.0, 59.0, 42.0, 30.0, 16.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.359375, -19.64501953125, -18.9306640625, -18.21630859375, -17.501953125, -16.78759765625, -16.0732421875, -15.35888671875, -14.64453125, -13.93017578125, -13.2158203125, -12.50146484375, -11.787109375, -11.07275390625, -10.3583984375, -9.64404296875, -8.9296875, -8.21533203125, -7.5009765625, -6.78662109375, -6.072265625, -5.35791015625, -4.6435546875, -3.92919921875, -3.21484375, -2.50048828125, -1.7861328125, -1.07177734375, -0.357421875, 0.35693359375, 1.0712890625, 1.78564453125, 2.5, 3.21435546875, 3.9287109375, 4.64306640625, 5.357421875, 6.07177734375, 6.7861328125, 7.50048828125, 8.21484375, 8.92919921875, 9.6435546875, 10.35791015625, 11.072265625, 11.78662109375, 12.5009765625, 13.21533203125, 13.9296875, 14.64404296875, 15.3583984375, 16.07275390625, 16.787109375, 17.50146484375, 18.2158203125, 18.93017578125, 19.64453125, 20.35888671875, 21.0732421875, 21.78759765625, 22.501953125, 23.21630859375, 23.9306640625, 24.64501953125, 25.359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 13.0, 13.0, 39.0, 33.0, 37.0, 47.0, 52.0, 56.0, 64.0, 77.0, 76.0, 76.0, 58.0, 64.0, 39.0, 54.0, 48.0, 36.0, 33.0, 17.0, 12.0, 15.0, 4.0, 9.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3125, -4.187713623046875, -4.06292724609375, -3.938140869140625, -3.8133544921875, -3.688568115234375, -3.56378173828125, -3.438995361328125, -3.314208984375, -3.189422607421875, -3.06463623046875, -2.939849853515625, -2.8150634765625, -2.690277099609375, -2.56549072265625, -2.440704345703125, -2.31591796875, -2.191131591796875, -2.06634521484375, -1.941558837890625, -1.8167724609375, -1.691986083984375, -1.56719970703125, -1.442413330078125, -1.317626953125, -1.192840576171875, -1.06805419921875, -0.943267822265625, -0.8184814453125, -0.693695068359375, -0.56890869140625, -0.444122314453125, -0.3193359375, -0.194549560546875, -0.06976318359375, 0.055023193359375, 0.1798095703125, 0.304595947265625, 0.42938232421875, 0.554168701171875, 0.678955078125, 0.803741455078125, 0.92852783203125, 1.053314208984375, 1.1781005859375, 1.302886962890625, 1.42767333984375, 1.552459716796875, 1.67724609375, 1.802032470703125, 1.92681884765625, 2.051605224609375, 2.1763916015625, 2.301177978515625, 2.42596435546875, 2.550750732421875, 2.675537109375, 2.800323486328125, 2.92510986328125, 3.049896240234375, 3.1746826171875, 3.299468994140625, 3.42425537109375, 3.549041748046875, 3.673828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 3.0, 9.0, 11.0, 17.0, 22.0, 21.0, 32.0, 40.0, 51.0, 67.0, 65.0, 107.0, 136.0, 199.0, 279.0, 432.0, 655.0, 1405.0, 3756.0, 11971.0, 45308.0, 176334.0, 525904.0, 206292.0, 53416.0, 13988.0, 4169.0, 1534.0, 767.0, 467.0, 294.0, 221.0, 148.0, 111.0, 90.0, 66.0, 58.0, 24.0, 29.0, 15.0, 14.0, 6.0, 12.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2109375, -12.7135009765625, -12.216064453125, -11.7186279296875, -11.22119140625, -10.7237548828125, -10.226318359375, -9.7288818359375, -9.2314453125, -8.7340087890625, -8.236572265625, -7.7391357421875, -7.24169921875, -6.7442626953125, -6.246826171875, -5.7493896484375, -5.251953125, -4.7545166015625, -4.257080078125, -3.7596435546875, -3.26220703125, -2.7647705078125, -2.267333984375, -1.7698974609375, -1.2724609375, -0.7750244140625, -0.277587890625, 0.2198486328125, 0.71728515625, 1.2147216796875, 1.712158203125, 2.2095947265625, 2.70703125, 3.2044677734375, 3.701904296875, 4.1993408203125, 4.69677734375, 5.1942138671875, 5.691650390625, 6.1890869140625, 6.6865234375, 7.1839599609375, 7.681396484375, 8.1788330078125, 8.67626953125, 9.1737060546875, 9.671142578125, 10.1685791015625, 10.666015625, 11.1634521484375, 11.660888671875, 12.1583251953125, 12.65576171875, 13.1531982421875, 13.650634765625, 14.1480712890625, 14.6455078125, 15.1429443359375, 15.640380859375, 16.1378173828125, 16.63525390625, 17.1326904296875, 17.630126953125, 18.1275634765625, 18.625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 7.0, 12.0, 6.0, 25.0, 19.0, 24.0, 38.0, 26.0, 37.0, 44.0, 38.0, 36.0, 46.0, 45.0, 54.0, 42.0, 58.0, 50.0, 62.0, 46.0, 37.0, 40.0, 31.0, 30.0, 38.0, 24.0, 23.0, 15.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.78125, -12.375732421875, -11.97021484375, -11.564697265625, -11.1591796875, -10.753662109375, -10.34814453125, -9.942626953125, -9.537109375, -9.131591796875, -8.72607421875, -8.320556640625, -7.9150390625, -7.509521484375, -7.10400390625, -6.698486328125, -6.29296875, -5.887451171875, -5.48193359375, -5.076416015625, -4.6708984375, -4.265380859375, -3.85986328125, -3.454345703125, -3.048828125, -2.643310546875, -2.23779296875, -1.832275390625, -1.4267578125, -1.021240234375, -0.61572265625, -0.210205078125, 0.1953125, 0.600830078125, 1.00634765625, 1.411865234375, 1.8173828125, 2.222900390625, 2.62841796875, 3.033935546875, 3.439453125, 3.844970703125, 4.25048828125, 4.656005859375, 5.0615234375, 5.467041015625, 5.87255859375, 6.278076171875, 6.68359375, 7.089111328125, 7.49462890625, 7.900146484375, 8.3056640625, 8.711181640625, 9.11669921875, 9.522216796875, 9.927734375, 10.333251953125, 10.73876953125, 11.144287109375, 11.5498046875, 11.955322265625, 12.36083984375, 12.766357421875, 13.171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 10.0, 13.0, 13.0, 23.0, 46.0, 53.0, 126.0, 244.0, 557.0, 1156.0, 2919.0, 8514.0, 28333.0, 102194.0, 496694.0, 308627.0, 69141.0, 19686.0, 6263.0, 2216.0, 871.0, 406.0, 208.0, 98.0, 73.0, 35.0, 17.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.8787841796875, -6.640380859375, -6.4019775390625, -6.16357421875, -5.9251708984375, -5.686767578125, -5.4483642578125, -5.2099609375, -4.9715576171875, -4.733154296875, -4.4947509765625, -4.25634765625, -4.0179443359375, -3.779541015625, -3.5411376953125, -3.302734375, -3.0643310546875, -2.825927734375, -2.5875244140625, -2.34912109375, -2.1107177734375, -1.872314453125, -1.6339111328125, -1.3955078125, -1.1571044921875, -0.918701171875, -0.6802978515625, -0.44189453125, -0.2034912109375, 0.034912109375, 0.2733154296875, 0.51171875, 0.7501220703125, 0.988525390625, 1.2269287109375, 1.46533203125, 1.7037353515625, 1.942138671875, 2.1805419921875, 2.4189453125, 2.6573486328125, 2.895751953125, 3.1341552734375, 3.37255859375, 3.6109619140625, 3.849365234375, 4.0877685546875, 4.326171875, 4.5645751953125, 4.802978515625, 5.0413818359375, 5.27978515625, 5.5181884765625, 5.756591796875, 5.9949951171875, 6.2333984375, 6.4718017578125, 6.710205078125, 6.9486083984375, 7.18701171875, 7.4254150390625, 7.663818359375, 7.9022216796875, 8.140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 6.0, 12.0, 12.0, 12.0, 21.0, 16.0, 26.0, 23.0, 35.0, 41.0, 66.0, 85.0, 151.0, 130.0, 76.0, 66.0, 39.0, 31.0, 37.0, 15.0, 26.0, 12.0, 19.0, 11.0, 7.0, 7.0, 1.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007977485656738281, -0.000764213502407074, -0.0007306784391403198, -0.0006971433758735657, -0.0006636083126068115, -0.0006300732493400574, -0.0005965381860733032, -0.0005630031228065491, -0.0005294680595397949, -0.0004959329962730408, -0.0004623979330062866, -0.00042886286973953247, -0.0003953278064727783, -0.00036179274320602417, -0.00032825767993927, -0.00029472261667251587, -0.0002611875534057617, -0.00022765249013900757, -0.00019411742687225342, -0.00016058236360549927, -0.00012704730033874512, -9.351223707199097e-05, -5.9977173805236816e-05, -2.6442110538482666e-05, 7.092952728271484e-06, 4.0628015995025635e-05, 7.416307926177979e-05, 0.00010769814252853394, 0.00014123320579528809, 0.00017476826906204224, 0.0002083033323287964, 0.00024183839559555054, 0.0002753734588623047, 0.00030890852212905884, 0.000342443585395813, 0.00037597864866256714, 0.0004095137119293213, 0.00044304877519607544, 0.0004765838384628296, 0.0005101189017295837, 0.0005436539649963379, 0.000577189028263092, 0.0006107240915298462, 0.0006442591547966003, 0.0006777942180633545, 0.0007113292813301086, 0.0007448643445968628, 0.0007783994078636169, 0.0008119344711303711, 0.0008454695343971252, 0.0008790045976638794, 0.0009125396609306335, 0.0009460747241973877, 0.0009796097874641418, 0.001013144850730896, 0.0010466799139976501, 0.0010802149772644043, 0.0011137500405311584, 0.0011472851037979126, 0.0011808201670646667, 0.001214355230331421, 0.001247890293598175, 0.0012814253568649292, 0.0013149604201316833, 0.0013484954833984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 13.0, 18.0, 28.0, 49.0, 103.0, 164.0, 295.0, 601.0, 1568.0, 6227.0, 45090.0, 547376.0, 404750.0, 34643.0, 5106.0, 1337.0, 562.0, 271.0, 134.0, 87.0, 55.0, 25.0, 26.0, 12.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.8134765625, -8.392578125, -7.9716796875, -7.55078125, -7.1298828125, -6.708984375, -6.2880859375, -5.8671875, -5.4462890625, -5.025390625, -4.6044921875, -4.18359375, -3.7626953125, -3.341796875, -2.9208984375, -2.5, -2.0791015625, -1.658203125, -1.2373046875, -0.81640625, -0.3955078125, 0.025390625, 0.4462890625, 0.8671875, 1.2880859375, 1.708984375, 2.1298828125, 2.55078125, 2.9716796875, 3.392578125, 3.8134765625, 4.234375, 4.6552734375, 5.076171875, 5.4970703125, 5.91796875, 6.3388671875, 6.759765625, 7.1806640625, 7.6015625, 8.0224609375, 8.443359375, 8.8642578125, 9.28515625, 9.7060546875, 10.126953125, 10.5478515625, 10.96875, 11.3896484375, 11.810546875, 12.2314453125, 12.65234375, 13.0732421875, 13.494140625, 13.9150390625, 14.3359375, 14.7568359375, 15.177734375, 15.5986328125, 16.01953125, 16.4404296875, 16.861328125, 17.2822265625, 17.703125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 9.0, 16.0, 16.0, 20.0, 22.0, 34.0, 52.0, 55.0, 81.0, 94.0, 149.0, 115.0, 79.0, 53.0, 42.0, 32.0, 27.0, 18.0, 20.0, 5.0, 12.0, 9.0, 5.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -4.92999267578125, -4.6998291015625, -4.46966552734375, -4.239501953125, -4.00933837890625, -3.7791748046875, -3.54901123046875, -3.31884765625, -3.08868408203125, -2.8585205078125, -2.62835693359375, -2.398193359375, -2.16802978515625, -1.9378662109375, -1.70770263671875, -1.4775390625, -1.24737548828125, -1.0172119140625, -0.78704833984375, -0.556884765625, -0.32672119140625, -0.0965576171875, 0.13360595703125, 0.36376953125, 0.59393310546875, 0.8240966796875, 1.05426025390625, 1.284423828125, 1.51458740234375, 1.7447509765625, 1.97491455078125, 2.205078125, 2.43524169921875, 2.6654052734375, 2.89556884765625, 3.125732421875, 3.35589599609375, 3.5860595703125, 3.81622314453125, 4.04638671875, 4.27655029296875, 4.5067138671875, 4.73687744140625, 4.967041015625, 5.19720458984375, 5.4273681640625, 5.65753173828125, 5.8876953125, 6.11785888671875, 6.3480224609375, 6.57818603515625, 6.808349609375, 7.03851318359375, 7.2686767578125, 7.49884033203125, 7.72900390625, 7.95916748046875, 8.1893310546875, 8.41949462890625, 8.649658203125, 8.87982177734375, 9.1099853515625, 9.34014892578125, 9.5703125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 14.0, 9.0, 25.0, 45.0, 69.0, 61.0, 86.0, 98.0, 111.0, 96.0, 89.0, 88.0, 58.0, 36.0, 35.0, 18.0, 16.0, 12.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.94291687011719, -72.98637390136719, -70.02982330322266, -67.07328033447266, -64.11672973632812, -61.160186767578125, -58.20363998413086, -55.247093200683594, -52.29054641723633, -49.33399963378906, -46.3774528503418, -43.42090606689453, -40.46436309814453, -37.5078125, -34.55126953125, -31.594722747802734, -28.63817596435547, -25.681629180908203, -22.725082397460938, -19.768537521362305, -16.81199073791504, -13.855443954467773, -10.89889907836914, -7.942352294921875, -4.985805511474609, -2.029259204864502, 0.9272871017456055, 3.8838329315185547, 6.84037971496582, 9.796926498413086, 12.753471374511719, 15.710018157958984, 18.66656494140625, 21.623111724853516, 24.57965850830078, 27.536203384399414, 30.49275016784668, 33.44929504394531, 36.40584182739258, 39.362388610839844, 42.31893539428711, 45.275482177734375, 48.23202896118164, 51.188575744628906, 54.145118713378906, 57.10166931152344, 60.05821228027344, 63.0147590637207, 65.97130584716797, 68.92784881591797, 71.8843994140625, 74.8409423828125, 77.79749298095703, 80.75403594970703, 83.71058654785156, 86.66712951660156, 89.62367248535156, 92.58021545410156, 95.5367660522461, 98.4933090209961, 101.44985961914062, 104.40640258789062, 107.36294555664062, 110.31949615478516, 113.27604675292969]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 6.0, 4.0, 10.0, 12.0, 8.0, 9.0, 17.0, 20.0, 20.0, 27.0, 20.0, 25.0, 27.0, 34.0, 45.0, 32.0, 38.0, 47.0, 38.0, 39.0, 41.0, 28.0, 44.0, 40.0, 41.0, 33.0, 35.0, 37.0, 29.0, 32.0, 20.0, 25.0, 18.0, 11.0, 11.0, 12.0, 5.0, 6.0, 14.0, 2.0, 6.0, 5.0, 4.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-55.7684440612793, -54.07344436645508, -52.37844467163086, -50.68344497680664, -48.988441467285156, -47.29344177246094, -45.59844207763672, -43.9034423828125, -42.20844268798828, -40.51344299316406, -38.818443298339844, -37.123443603515625, -35.428443908691406, -33.73344421386719, -32.0384407043457, -30.343441009521484, -28.648441314697266, -26.953441619873047, -25.258441925048828, -23.563440322875977, -21.868440628051758, -20.17344093322754, -18.478439331054688, -16.78343963623047, -15.08843994140625, -13.393440246582031, -11.698439598083496, -10.003438949584961, -8.308439254760742, -6.613439559936523, -4.918438911437988, -3.223438262939453, -1.5284347534179688, 0.1665654182434082, 1.8615655899047852, 3.556565761566162, 5.251565933227539, 6.946565628051758, 8.641566276550293, 10.336566925048828, 12.031566619873047, 13.726566314697266, 15.4215669631958, 17.116567611694336, 18.811567306518555, 20.506567001342773, 22.201568603515625, 23.896568298339844, 25.591567993164062, 27.28656768798828, 28.9815673828125, 30.67656898498535, 32.37156677246094, 34.066566467285156, 35.76156997680664, 37.45656967163086, 39.15156936645508, 40.8465690612793, 42.541568756103516, 44.236568450927734, 45.93157196044922, 47.62657165527344, 49.321571350097656, 51.016571044921875, 52.711570739746094]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 10.0, 11.0, 24.0, 20.0, 37.0, 34.0, 79.0, 91.0, 196.0, 293.0, 572.0, 1149.0, 2903.0, 9999.0, 60796.0, 3335408.0, 735454.0, 36531.0, 7035.0, 2080.0, 755.0, 342.0, 188.0, 102.0, 42.0, 45.0, 28.0, 19.0, 7.0, 10.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.78125, -33.57666015625, -32.3720703125, -31.16748046875, -29.962890625, -28.75830078125, -27.5537109375, -26.34912109375, -25.14453125, -23.93994140625, -22.7353515625, -21.53076171875, -20.326171875, -19.12158203125, -17.9169921875, -16.71240234375, -15.5078125, -14.30322265625, -13.0986328125, -11.89404296875, -10.689453125, -9.48486328125, -8.2802734375, -7.07568359375, -5.87109375, -4.66650390625, -3.4619140625, -2.25732421875, -1.052734375, 0.15185546875, 1.3564453125, 2.56103515625, 3.765625, 4.97021484375, 6.1748046875, 7.37939453125, 8.583984375, 9.78857421875, 10.9931640625, 12.19775390625, 13.40234375, 14.60693359375, 15.8115234375, 17.01611328125, 18.220703125, 19.42529296875, 20.6298828125, 21.83447265625, 23.0390625, 24.24365234375, 25.4482421875, 26.65283203125, 27.857421875, 29.06201171875, 30.2666015625, 31.47119140625, 32.67578125, 33.88037109375, 35.0849609375, 36.28955078125, 37.494140625, 38.69873046875, 39.9033203125, 41.10791015625, 42.3125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 15.0, 9.0, 14.0, 23.0, 24.0, 39.0, 40.0, 64.0, 62.0, 61.0, 69.0, 69.0, 70.0, 77.0, 57.0, 54.0, 49.0, 56.0, 30.0, 21.0, 21.0, 16.0, 24.0, 10.0, 7.0, 9.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28515625, -4.158782958984375, -4.03240966796875, -3.906036376953125, -3.7796630859375, -3.653289794921875, -3.52691650390625, -3.400543212890625, -3.274169921875, -3.147796630859375, -3.02142333984375, -2.895050048828125, -2.7686767578125, -2.642303466796875, -2.51593017578125, -2.389556884765625, -2.26318359375, -2.136810302734375, -2.01043701171875, -1.884063720703125, -1.7576904296875, -1.631317138671875, -1.50494384765625, -1.378570556640625, -1.252197265625, -1.125823974609375, -0.99945068359375, -0.873077392578125, -0.7467041015625, -0.620330810546875, -0.49395751953125, -0.367584228515625, -0.2412109375, -0.114837646484375, 0.01153564453125, 0.137908935546875, 0.2642822265625, 0.390655517578125, 0.51702880859375, 0.643402099609375, 0.769775390625, 0.896148681640625, 1.02252197265625, 1.148895263671875, 1.2752685546875, 1.401641845703125, 1.52801513671875, 1.654388427734375, 1.78076171875, 1.907135009765625, 2.03350830078125, 2.159881591796875, 2.2862548828125, 2.412628173828125, 2.53900146484375, 2.665374755859375, 2.791748046875, 2.918121337890625, 3.04449462890625, 3.170867919921875, 3.2972412109375, 3.423614501953125, 3.54998779296875, 3.676361083984375, 3.802734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 8.0, 8.0, 4.0, 12.0, 9.0, 17.0, 18.0, 20.0, 32.0, 46.0, 66.0, 105.0, 128.0, 211.0, 341.0, 589.0, 1200.0, 3057.0, 9957.0, 49391.0, 657196.0, 3316561.0, 127380.0, 19159.0, 5001.0, 1723.0, 774.0, 451.0, 261.0, 166.0, 122.0, 69.0, 50.0, 36.0, 29.0, 19.0, 19.0, 9.0, 5.0, 11.0, 5.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0], "bins": [-24.890625, -24.163330078125, -23.43603515625, -22.708740234375, -21.9814453125, -21.254150390625, -20.52685546875, -19.799560546875, -19.072265625, -18.344970703125, -17.61767578125, -16.890380859375, -16.1630859375, -15.435791015625, -14.70849609375, -13.981201171875, -13.25390625, -12.526611328125, -11.79931640625, -11.072021484375, -10.3447265625, -9.617431640625, -8.89013671875, -8.162841796875, -7.435546875, -6.708251953125, -5.98095703125, -5.253662109375, -4.5263671875, -3.799072265625, -3.07177734375, -2.344482421875, -1.6171875, -0.889892578125, -0.16259765625, 0.564697265625, 1.2919921875, 2.019287109375, 2.74658203125, 3.473876953125, 4.201171875, 4.928466796875, 5.65576171875, 6.383056640625, 7.1103515625, 7.837646484375, 8.56494140625, 9.292236328125, 10.01953125, 10.746826171875, 11.47412109375, 12.201416015625, 12.9287109375, 13.656005859375, 14.38330078125, 15.110595703125, 15.837890625, 16.565185546875, 17.29248046875, 18.019775390625, 18.7470703125, 19.474365234375, 20.20166015625, 20.928955078125, 21.65625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 15.0, 35.0, 77.0, 107.0, 289.0, 1065.0, 1694.0, 452.0, 174.0, 72.0, 35.0, 23.0, 16.0, 7.0, 8.0, 3.0, 3.0, 1.0], "bins": [-22.8125, -22.37506103515625, -21.9376220703125, -21.50018310546875, -21.062744140625, -20.62530517578125, -20.1878662109375, -19.75042724609375, -19.31298828125, -18.87554931640625, -18.4381103515625, -18.00067138671875, -17.563232421875, -17.12579345703125, -16.6883544921875, -16.25091552734375, -15.8134765625, -15.37603759765625, -14.9385986328125, -14.50115966796875, -14.063720703125, -13.62628173828125, -13.1888427734375, -12.75140380859375, -12.31396484375, -11.87652587890625, -11.4390869140625, -11.00164794921875, -10.564208984375, -10.12677001953125, -9.6893310546875, -9.25189208984375, -8.814453125, -8.37701416015625, -7.9395751953125, -7.50213623046875, -7.064697265625, -6.62725830078125, -6.1898193359375, -5.75238037109375, -5.31494140625, -4.87750244140625, -4.4400634765625, -4.00262451171875, -3.565185546875, -3.12774658203125, -2.6903076171875, -2.25286865234375, -1.8154296875, -1.37799072265625, -0.9405517578125, -0.50311279296875, -0.065673828125, 0.37176513671875, 0.8092041015625, 1.24664306640625, 1.68408203125, 2.12152099609375, 2.5589599609375, 2.99639892578125, 3.433837890625, 3.87127685546875, 4.3087158203125, 4.74615478515625, 5.18359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 19.0, 36.0, 68.0, 154.0, 241.0, 204.0, 143.0, 76.0, 36.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-152.61488342285156, -149.49111938476562, -146.3673553466797, -143.24359130859375, -140.11981201171875, -136.9960479736328, -133.87228393554688, -130.74851989746094, -127.624755859375, -124.50099182128906, -121.3772201538086, -118.25345611572266, -115.12969207763672, -112.00592803955078, -108.88215637207031, -105.75839233398438, -102.63462829589844, -99.5108642578125, -96.38709259033203, -93.2633285522461, -90.13956451416016, -87.01580047607422, -83.89202880859375, -80.76826477050781, -77.64449310302734, -74.5207290649414, -71.39695739746094, -68.273193359375, -65.14942932128906, -62.02566146850586, -58.901893615722656, -55.77812957763672, -52.65436935424805, -49.530601501464844, -46.406837463378906, -43.2830696105957, -40.159305572509766, -37.03553771972656, -33.911773681640625, -30.788005828857422, -27.66423988342285, -24.54047393798828, -21.41670799255371, -18.29294204711914, -15.169175148010254, -12.045409202575684, -8.921642303466797, -5.797876358032227, -2.6741104125976562, 0.44965577125549316, 3.5734219551086426, 6.697188377380371, 9.820954322814941, 12.944720268249512, 16.0684871673584, 19.19225311279297, 22.31601905822754, 25.43978500366211, 28.56355094909668, 31.68731689453125, 34.81108474731445, 37.93484878540039, 41.058616638183594, 44.18238067626953, 47.306148529052734]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 15.0, 15.0, 20.0, 33.0, 27.0, 42.0, 58.0, 76.0, 61.0, 83.0, 77.0, 97.0, 71.0, 77.0, 62.0, 42.0, 43.0, 42.0, 20.0, 12.0, 17.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.415626525878906, -26.04025650024414, -24.664886474609375, -23.289518356323242, -21.914148330688477, -20.53877830505371, -19.163410186767578, -17.788040161132812, -16.412670135498047, -15.037300109863281, -13.661931037902832, -12.286561965942383, -10.911191940307617, -9.535821914672852, -8.160452842712402, -6.785083770751953, -5.4097137451171875, -4.03434419631958, -2.6589746475219727, -1.2836050987243652, 0.09176445007324219, 1.4671339988708496, 2.842503547668457, 4.217872619628906, 5.593242645263672, 6.968612194061279, 8.343981742858887, 9.719350814819336, 11.094720840454102, 12.470090866088867, 13.845459938049316, 15.220829010009766, 16.596195220947266, 17.97156524658203, 19.346935272216797, 20.72230339050293, 22.097673416137695, 23.47304344177246, 24.848411560058594, 26.22378158569336, 27.599151611328125, 28.97452163696289, 30.349891662597656, 31.72525978088379, 33.10063171386719, 34.47599792480469, 35.85136795043945, 37.22673797607422, 38.602108001708984, 39.97747802734375, 41.352848052978516, 42.72821807861328, 44.10358428955078, 45.47895431518555, 46.85432434082031, 48.22969436645508, 49.605064392089844, 50.98043441772461, 52.355804443359375, 53.73117446899414, 55.106544494628906, 56.481910705566406, 57.85728073120117, 59.23265075683594, 60.6080207824707]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 8.0, 9.0, 8.0, 14.0, 24.0, 26.0, 48.0, 50.0, 71.0, 98.0, 136.0, 218.0, 317.0, 441.0, 748.0, 1276.0, 2513.0, 5088.0, 12145.0, 34439.0, 109573.0, 308991.0, 357219.0, 142421.0, 44428.0, 15284.0, 6076.0, 2909.0, 1527.0, 844.0, 519.0, 340.0, 218.0, 155.0, 102.0, 70.0, 52.0, 38.0, 35.0, 16.0, 17.0, 17.0, 9.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 4.0], "bins": [-19.078125, -18.5347900390625, -17.991455078125, -17.4481201171875, -16.90478515625, -16.3614501953125, -15.818115234375, -15.2747802734375, -14.7314453125, -14.1881103515625, -13.644775390625, -13.1014404296875, -12.55810546875, -12.0147705078125, -11.471435546875, -10.9281005859375, -10.384765625, -9.8414306640625, -9.298095703125, -8.7547607421875, -8.21142578125, -7.6680908203125, -7.124755859375, -6.5814208984375, -6.0380859375, -5.4947509765625, -4.951416015625, -4.4080810546875, -3.86474609375, -3.3214111328125, -2.778076171875, -2.2347412109375, -1.69140625, -1.1480712890625, -0.604736328125, -0.0614013671875, 0.48193359375, 1.0252685546875, 1.568603515625, 2.1119384765625, 2.6552734375, 3.1986083984375, 3.741943359375, 4.2852783203125, 4.82861328125, 5.3719482421875, 5.915283203125, 6.4586181640625, 7.001953125, 7.5452880859375, 8.088623046875, 8.6319580078125, 9.17529296875, 9.7186279296875, 10.261962890625, 10.8052978515625, 11.3486328125, 11.8919677734375, 12.435302734375, 12.9786376953125, 13.52197265625, 14.0653076171875, 14.608642578125, 15.1519775390625, 15.6953125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 8.0, 9.0, 14.0, 15.0, 12.0, 28.0, 33.0, 48.0, 55.0, 62.0, 59.0, 73.0, 66.0, 72.0, 63.0, 64.0, 68.0, 45.0, 38.0, 34.0, 30.0, 29.0, 13.0, 18.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2578125, -4.12847900390625, -3.9991455078125, -3.86981201171875, -3.740478515625, -3.61114501953125, -3.4818115234375, -3.35247802734375, -3.22314453125, -3.09381103515625, -2.9644775390625, -2.83514404296875, -2.705810546875, -2.57647705078125, -2.4471435546875, -2.31781005859375, -2.1884765625, -2.05914306640625, -1.9298095703125, -1.80047607421875, -1.671142578125, -1.54180908203125, -1.4124755859375, -1.28314208984375, -1.15380859375, -1.02447509765625, -0.8951416015625, -0.76580810546875, -0.636474609375, -0.50714111328125, -0.3778076171875, -0.24847412109375, -0.119140625, 0.01019287109375, 0.1395263671875, 0.26885986328125, 0.398193359375, 0.52752685546875, 0.6568603515625, 0.78619384765625, 0.91552734375, 1.04486083984375, 1.1741943359375, 1.30352783203125, 1.432861328125, 1.56219482421875, 1.6915283203125, 1.82086181640625, 1.9501953125, 2.07952880859375, 2.2088623046875, 2.33819580078125, 2.467529296875, 2.59686279296875, 2.7261962890625, 2.85552978515625, 2.98486328125, 3.11419677734375, 3.2435302734375, 3.37286376953125, 3.502197265625, 3.63153076171875, 3.7608642578125, 3.89019775390625, 4.01953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 17.0, 9.0, 15.0, 15.0, 37.0, 56.0, 79.0, 180.0, 429.0, 1117.0, 5293.0, 114156.0, 885142.0, 37493.0, 3034.0, 772.0, 289.0, 125.0, 96.0, 57.0, 40.0, 14.0, 23.0, 10.0, 12.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.65625, -49.95458984375, -48.2529296875, -46.55126953125, -44.849609375, -43.14794921875, -41.4462890625, -39.74462890625, -38.04296875, -36.34130859375, -34.6396484375, -32.93798828125, -31.236328125, -29.53466796875, -27.8330078125, -26.13134765625, -24.4296875, -22.72802734375, -21.0263671875, -19.32470703125, -17.623046875, -15.92138671875, -14.2197265625, -12.51806640625, -10.81640625, -9.11474609375, -7.4130859375, -5.71142578125, -4.009765625, -2.30810546875, -0.6064453125, 1.09521484375, 2.796875, 4.49853515625, 6.2001953125, 7.90185546875, 9.603515625, 11.30517578125, 13.0068359375, 14.70849609375, 16.41015625, 18.11181640625, 19.8134765625, 21.51513671875, 23.216796875, 24.91845703125, 26.6201171875, 28.32177734375, 30.0234375, 31.72509765625, 33.4267578125, 35.12841796875, 36.830078125, 38.53173828125, 40.2333984375, 41.93505859375, 43.63671875, 45.33837890625, 47.0400390625, 48.74169921875, 50.443359375, 52.14501953125, 53.8466796875, 55.54833984375, 57.25]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 1.0, 8.0, 6.0, 8.0, 12.0, 10.0, 14.0, 22.0, 23.0, 36.0, 37.0, 45.0, 46.0, 56.0, 56.0, 57.0, 79.0, 60.0, 57.0, 63.0, 46.0, 43.0, 43.0, 30.0, 29.0, 24.0, 18.0, 15.0, 8.0, 11.0, 11.0, 3.0, 9.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.140625, -19.564208984375, -18.98779296875, -18.411376953125, -17.8349609375, -17.258544921875, -16.68212890625, -16.105712890625, -15.529296875, -14.952880859375, -14.37646484375, -13.800048828125, -13.2236328125, -12.647216796875, -12.07080078125, -11.494384765625, -10.91796875, -10.341552734375, -9.76513671875, -9.188720703125, -8.6123046875, -8.035888671875, -7.45947265625, -6.883056640625, -6.306640625, -5.730224609375, -5.15380859375, -4.577392578125, -4.0009765625, -3.424560546875, -2.84814453125, -2.271728515625, -1.6953125, -1.118896484375, -0.54248046875, 0.033935546875, 0.6103515625, 1.186767578125, 1.76318359375, 2.339599609375, 2.916015625, 3.492431640625, 4.06884765625, 4.645263671875, 5.2216796875, 5.798095703125, 6.37451171875, 6.950927734375, 7.52734375, 8.103759765625, 8.68017578125, 9.256591796875, 9.8330078125, 10.409423828125, 10.98583984375, 11.562255859375, 12.138671875, 12.715087890625, 13.29150390625, 13.867919921875, 14.4443359375, 15.020751953125, 15.59716796875, 16.173583984375, 16.75]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 8.0, 6.0, 9.0, 12.0, 10.0, 23.0, 33.0, 41.0, 56.0, 100.0, 243.0, 597.0, 1598.0, 5985.0, 52833.0, 779664.0, 191166.0, 11967.0, 2607.0, 875.0, 313.0, 150.0, 95.0, 32.0, 31.0, 17.0, 15.0, 11.0, 11.0, 12.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.645263671875, -16.10302734375, -15.560791015625, -15.0185546875, -14.476318359375, -13.93408203125, -13.391845703125, -12.849609375, -12.307373046875, -11.76513671875, -11.222900390625, -10.6806640625, -10.138427734375, -9.59619140625, -9.053955078125, -8.51171875, -7.969482421875, -7.42724609375, -6.885009765625, -6.3427734375, -5.800537109375, -5.25830078125, -4.716064453125, -4.173828125, -3.631591796875, -3.08935546875, -2.547119140625, -2.0048828125, -1.462646484375, -0.92041015625, -0.378173828125, 0.1640625, 0.706298828125, 1.24853515625, 1.790771484375, 2.3330078125, 2.875244140625, 3.41748046875, 3.959716796875, 4.501953125, 5.044189453125, 5.58642578125, 6.128662109375, 6.6708984375, 7.213134765625, 7.75537109375, 8.297607421875, 8.83984375, 9.382080078125, 9.92431640625, 10.466552734375, 11.0087890625, 11.551025390625, 12.09326171875, 12.635498046875, 13.177734375, 13.719970703125, 14.26220703125, 14.804443359375, 15.3466796875, 15.888916015625, 16.43115234375, 16.973388671875, 17.515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 11.0, 14.0, 12.0, 22.0, 27.0, 43.0, 61.0, 94.0, 106.0, 118.0, 103.0, 101.0, 98.0, 58.0, 43.0, 25.0, 25.0, 9.0, 12.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014820098876953125, -0.0014367848634719849, -0.0013915598392486572, -0.0013463348150253296, -0.001301109790802002, -0.0012558847665786743, -0.0012106597423553467, -0.001165434718132019, -0.0011202096939086914, -0.0010749846696853638, -0.0010297596454620361, -0.0009845346212387085, -0.0009393095970153809, -0.0008940845727920532, -0.0008488595485687256, -0.000803634524345398, -0.0007584095001220703, -0.0007131844758987427, -0.000667959451675415, -0.0006227344274520874, -0.0005775094032287598, -0.0005322843790054321, -0.0004870593547821045, -0.00044183433055877686, -0.0003966093063354492, -0.0003513842821121216, -0.00030615925788879395, -0.0002609342336654663, -0.00021570920944213867, -0.00017048418521881104, -0.0001252591609954834, -8.003413677215576e-05, -3.4809112548828125e-05, 1.0415911674499512e-05, 5.564093589782715e-05, 0.00010086596012115479, 0.00014609098434448242, 0.00019131600856781006, 0.0002365410327911377, 0.00028176605701446533, 0.00032699108123779297, 0.0003722161054611206, 0.00041744112968444824, 0.0004626661539077759, 0.0005078911781311035, 0.0005531162023544312, 0.0005983412265777588, 0.0006435662508010864, 0.0006887912750244141, 0.0007340162992477417, 0.0007792413234710693, 0.000824466347694397, 0.0008696913719177246, 0.0009149163961410522, 0.0009601414203643799, 0.0010053664445877075, 0.0010505914688110352, 0.0010958164930343628, 0.0011410415172576904, 0.001186266541481018, 0.0012314915657043457, 0.0012767165899276733, 0.001321941614151001, 0.0013671666383743286, 0.0014123916625976562]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 2.0, 18.0, 10.0, 19.0, 26.0, 32.0, 52.0, 73.0, 112.0, 200.0, 326.0, 599.0, 1231.0, 2791.0, 7870.0, 36554.0, 531655.0, 424168.0, 30635.0, 7092.0, 2498.0, 1139.0, 556.0, 326.0, 169.0, 110.0, 74.0, 57.0, 41.0, 23.0, 17.0, 14.0, 10.0, 5.0, 2.0, 9.0, 4.0, 1.0, 1.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.21875, -15.711181640625, -15.20361328125, -14.696044921875, -14.1884765625, -13.680908203125, -13.17333984375, -12.665771484375, -12.158203125, -11.650634765625, -11.14306640625, -10.635498046875, -10.1279296875, -9.620361328125, -9.11279296875, -8.605224609375, -8.09765625, -7.590087890625, -7.08251953125, -6.574951171875, -6.0673828125, -5.559814453125, -5.05224609375, -4.544677734375, -4.037109375, -3.529541015625, -3.02197265625, -2.514404296875, -2.0068359375, -1.499267578125, -0.99169921875, -0.484130859375, 0.0234375, 0.531005859375, 1.03857421875, 1.546142578125, 2.0537109375, 2.561279296875, 3.06884765625, 3.576416015625, 4.083984375, 4.591552734375, 5.09912109375, 5.606689453125, 6.1142578125, 6.621826171875, 7.12939453125, 7.636962890625, 8.14453125, 8.652099609375, 9.15966796875, 9.667236328125, 10.1748046875, 10.682373046875, 11.18994140625, 11.697509765625, 12.205078125, 12.712646484375, 13.22021484375, 13.727783203125, 14.2353515625, 14.742919921875, 15.25048828125, 15.758056640625, 16.265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 7.0, 6.0, 5.0, 7.0, 5.0, 16.0, 30.0, 46.0, 75.0, 115.0, 129.0, 155.0, 149.0, 87.0, 57.0, 28.0, 12.0, 25.0, 11.0, 3.0, 6.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.4453125, -13.04248046875, -12.6396484375, -12.23681640625, -11.833984375, -11.43115234375, -11.0283203125, -10.62548828125, -10.22265625, -9.81982421875, -9.4169921875, -9.01416015625, -8.611328125, -8.20849609375, -7.8056640625, -7.40283203125, -7.0, -6.59716796875, -6.1943359375, -5.79150390625, -5.388671875, -4.98583984375, -4.5830078125, -4.18017578125, -3.77734375, -3.37451171875, -2.9716796875, -2.56884765625, -2.166015625, -1.76318359375, -1.3603515625, -0.95751953125, -0.5546875, -0.15185546875, 0.2509765625, 0.65380859375, 1.056640625, 1.45947265625, 1.8623046875, 2.26513671875, 2.66796875, 3.07080078125, 3.4736328125, 3.87646484375, 4.279296875, 4.68212890625, 5.0849609375, 5.48779296875, 5.890625, 6.29345703125, 6.6962890625, 7.09912109375, 7.501953125, 7.90478515625, 8.3076171875, 8.71044921875, 9.11328125, 9.51611328125, 9.9189453125, 10.32177734375, 10.724609375, 11.12744140625, 11.5302734375, 11.93310546875, 12.3359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 23.0, 154.0, 375.0, 314.0, 105.0, 23.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.13784790039062, -121.69703674316406, -108.2562255859375, -94.8154067993164, -81.37459564208984, -67.93378448486328, -54.49296569824219, -41.052154541015625, -27.611343383789062, -14.170530319213867, -0.7297172546386719, 12.711097717285156, 26.15190887451172, 39.59272003173828, 53.033538818359375, 66.47434997558594, 79.9151611328125, 93.35597229003906, 106.79678344726562, 120.23760223388672, 133.67840576171875, 147.11923217773438, 160.56004333496094, 174.0008544921875, 187.44166564941406, 200.88247680664062, 214.3232879638672, 227.76409912109375, 241.20492553710938, 254.64572143554688, 268.0865478515625, 281.52734375, 294.9681396484375, 308.4089660644531, 321.8497619628906, 335.29058837890625, 348.73138427734375, 362.1722106933594, 375.613037109375, 389.0538330078125, 402.49462890625, 415.9354553222656, 429.3762512207031, 442.81707763671875, 456.25787353515625, 469.6986999511719, 483.1395263671875, 496.580322265625, 510.0211486816406, 523.4619750976562, 536.9027709960938, 550.3435668945312, 563.784423828125, 577.2252197265625, 590.666015625, 604.1068115234375, 617.5476684570312, 630.9884643554688, 644.4293212890625, 657.8701171875, 671.3109130859375, 684.751708984375, 698.1925659179688, 711.6333618164062, 725.0741577148438]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 7.0, 12.0, 10.0, 20.0, 16.0, 24.0, 21.0, 23.0, 21.0, 22.0, 38.0, 46.0, 33.0, 34.0, 45.0, 49.0, 51.0, 39.0, 31.0, 46.0, 32.0, 38.0, 30.0, 39.0, 33.0, 26.0, 28.0, 34.0, 32.0, 21.0, 18.0, 16.0, 15.0, 11.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-74.07373046875, -71.78854370117188, -69.50334930419922, -67.2181625366211, -64.93297576904297, -62.64778518676758, -60.36259460449219, -58.07740783691406, -55.79221725463867, -53.50702667236328, -51.221839904785156, -48.936649322509766, -46.651458740234375, -44.36627197265625, -42.08108139038086, -39.79589080810547, -37.510704040527344, -35.22551345825195, -32.94032669067383, -30.655136108398438, -28.36994743347168, -26.084758758544922, -23.79956817626953, -21.514379501342773, -19.229190826416016, -16.944002151489258, -14.658812522888184, -12.37362289428711, -10.088434219360352, -7.803245544433594, -5.5180559158325195, -3.2328662872314453, -0.9476776123046875, 1.3375115394592285, 3.6227006912231445, 5.9078898429870605, 8.193078994750977, 10.478267669677734, 12.763457298278809, 15.048646926879883, 17.33383560180664, 19.6190242767334, 21.904212951660156, 24.189403533935547, 26.474592208862305, 28.759780883789062, 31.044971466064453, 33.330162048339844, 35.61534881591797, 37.90053939819336, 40.185726165771484, 42.470916748046875, 44.756103515625, 47.04129409790039, 49.32648468017578, 51.611671447753906, 53.8968620300293, 56.18205261230469, 58.46723937988281, 60.7524299621582, 63.037620544433594, 65.32280731201172, 67.60799407958984, 69.8931884765625, 72.17837524414062]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 5.0, 9.0, 20.0, 17.0, 25.0, 55.0, 108.0, 179.0, 354.0, 759.0, 1869.0, 9147.0, 273170.0, 3890646.0, 13847.0, 2356.0, 858.0, 386.0, 216.0, 93.0, 55.0, 25.0, 25.0, 13.0, 6.0, 6.0, 5.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.125, -46.470703125, -44.81640625, -43.162109375, -41.5078125, -39.853515625, -38.19921875, -36.544921875, -34.890625, -33.236328125, -31.58203125, -29.927734375, -28.2734375, -26.619140625, -24.96484375, -23.310546875, -21.65625, -20.001953125, -18.34765625, -16.693359375, -15.0390625, -13.384765625, -11.73046875, -10.076171875, -8.421875, -6.767578125, -5.11328125, -3.458984375, -1.8046875, -0.150390625, 1.50390625, 3.158203125, 4.8125, 6.466796875, 8.12109375, 9.775390625, 11.4296875, 13.083984375, 14.73828125, 16.392578125, 18.046875, 19.701171875, 21.35546875, 23.009765625, 24.6640625, 26.318359375, 27.97265625, 29.626953125, 31.28125, 32.935546875, 34.58984375, 36.244140625, 37.8984375, 39.552734375, 41.20703125, 42.861328125, 44.515625, 46.169921875, 47.82421875, 49.478515625, 51.1328125, 52.787109375, 54.44140625, 56.095703125, 57.75]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 3.0, 9.0, 14.0, 26.0, 30.0, 36.0, 51.0, 50.0, 58.0, 72.0, 67.0, 71.0, 78.0, 69.0, 72.0, 60.0, 47.0, 49.0, 32.0, 27.0, 19.0, 10.0, 11.0, 11.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.328125, -5.16070556640625, -4.9932861328125, -4.82586669921875, -4.658447265625, -4.49102783203125, -4.3236083984375, -4.15618896484375, -3.98876953125, -3.82135009765625, -3.6539306640625, -3.48651123046875, -3.319091796875, -3.15167236328125, -2.9842529296875, -2.81683349609375, -2.6494140625, -2.48199462890625, -2.3145751953125, -2.14715576171875, -1.979736328125, -1.81231689453125, -1.6448974609375, -1.47747802734375, -1.31005859375, -1.14263916015625, -0.9752197265625, -0.80780029296875, -0.640380859375, -0.47296142578125, -0.3055419921875, -0.13812255859375, 0.029296875, 0.19671630859375, 0.3641357421875, 0.53155517578125, 0.698974609375, 0.86639404296875, 1.0338134765625, 1.20123291015625, 1.36865234375, 1.53607177734375, 1.7034912109375, 1.87091064453125, 2.038330078125, 2.20574951171875, 2.3731689453125, 2.54058837890625, 2.7080078125, 2.87542724609375, 3.0428466796875, 3.21026611328125, 3.377685546875, 3.54510498046875, 3.7125244140625, 3.87994384765625, 4.04736328125, 4.21478271484375, 4.3822021484375, 4.54962158203125, 4.717041015625, 4.88446044921875, 5.0518798828125, 5.21929931640625, 5.38671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 11.0, 18.0, 12.0, 23.0, 26.0, 43.0, 56.0, 68.0, 106.0, 137.0, 212.0, 347.0, 538.0, 1005.0, 2040.0, 4972.0, 18397.0, 214571.0, 3882961.0, 52882.0, 9226.0, 3100.0, 1454.0, 744.0, 417.0, 254.0, 193.0, 133.0, 89.0, 58.0, 51.0, 39.0, 22.0, 19.0, 11.0, 8.0, 6.0, 10.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.734375, -21.0810546875, -20.427734375, -19.7744140625, -19.12109375, -18.4677734375, -17.814453125, -17.1611328125, -16.5078125, -15.8544921875, -15.201171875, -14.5478515625, -13.89453125, -13.2412109375, -12.587890625, -11.9345703125, -11.28125, -10.6279296875, -9.974609375, -9.3212890625, -8.66796875, -8.0146484375, -7.361328125, -6.7080078125, -6.0546875, -5.4013671875, -4.748046875, -4.0947265625, -3.44140625, -2.7880859375, -2.134765625, -1.4814453125, -0.828125, -0.1748046875, 0.478515625, 1.1318359375, 1.78515625, 2.4384765625, 3.091796875, 3.7451171875, 4.3984375, 5.0517578125, 5.705078125, 6.3583984375, 7.01171875, 7.6650390625, 8.318359375, 8.9716796875, 9.625, 10.2783203125, 10.931640625, 11.5849609375, 12.23828125, 12.8916015625, 13.544921875, 14.1982421875, 14.8515625, 15.5048828125, 16.158203125, 16.8115234375, 17.46484375, 18.1181640625, 18.771484375, 19.4248046875, 20.078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 5.0, 11.0, 16.0, 28.0, 63.0, 118.0, 272.0, 2840.0, 420.0, 130.0, 60.0, 36.0, 22.0, 13.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.943359375, -3.83880615234375, -3.7342529296875, -3.62969970703125, -3.525146484375, -3.42059326171875, -3.3160400390625, -3.21148681640625, -3.10693359375, -3.00238037109375, -2.8978271484375, -2.79327392578125, -2.688720703125, -2.58416748046875, -2.4796142578125, -2.37506103515625, -2.2705078125, -2.16595458984375, -2.0614013671875, -1.95684814453125, -1.852294921875, -1.74774169921875, -1.6431884765625, -1.53863525390625, -1.43408203125, -1.32952880859375, -1.2249755859375, -1.12042236328125, -1.015869140625, -0.91131591796875, -0.8067626953125, -0.70220947265625, -0.59765625, -0.49310302734375, -0.3885498046875, -0.28399658203125, -0.179443359375, -0.07489013671875, 0.0296630859375, 0.13421630859375, 0.23876953125, 0.34332275390625, 0.4478759765625, 0.55242919921875, 0.656982421875, 0.76153564453125, 0.8660888671875, 0.97064208984375, 1.0751953125, 1.17974853515625, 1.2843017578125, 1.38885498046875, 1.493408203125, 1.59796142578125, 1.7025146484375, 1.80706787109375, 1.91162109375, 2.01617431640625, 2.1207275390625, 2.22528076171875, 2.329833984375, 2.43438720703125, 2.5389404296875, 2.64349365234375, 2.748046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 8.0, 3.0, 9.0, 17.0, 24.0, 28.0, 62.0, 73.0, 118.0, 153.0, 177.0, 147.0, 95.0, 41.0, 31.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.301677703857422, -27.589229583740234, -26.876781463623047, -26.16433334350586, -25.451885223388672, -24.739437103271484, -24.026988983154297, -23.31454086303711, -22.602092742919922, -21.889644622802734, -21.177196502685547, -20.46474838256836, -19.752300262451172, -19.039852142333984, -18.327404022216797, -17.61495590209961, -16.902507781982422, -16.190059661865234, -15.477611541748047, -14.76516342163086, -14.052715301513672, -13.340267181396484, -12.627819061279297, -11.91537094116211, -11.202922821044922, -10.490474700927734, -9.778026580810547, -9.06557846069336, -8.353130340576172, -7.640682220458984, -6.928234100341797, -6.215785980224609, -5.503335952758789, -4.790887832641602, -4.078439712524414, -3.3659915924072266, -2.653543472290039, -1.9410953521728516, -1.228647232055664, -0.5161991119384766, 0.19624900817871094, 0.9086971282958984, 1.621145248413086, 2.3335933685302734, 3.046041488647461, 3.7584896087646484, 4.470937728881836, 5.183385848999023, 5.895833969116211, 6.608282089233398, 7.320730209350586, 8.033178329467773, 8.745626449584961, 9.458074569702148, 10.170522689819336, 10.882970809936523, 11.595418930053711, 12.307867050170898, 13.020315170288086, 13.732763290405273, 14.445211410522461, 15.157659530639648, 15.870107650756836, 16.582555770874023, 17.29500389099121]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 4.0, 12.0, 9.0, 11.0, 17.0, 23.0, 23.0, 18.0, 29.0, 31.0, 38.0, 31.0, 42.0, 35.0, 35.0, 28.0, 42.0, 48.0, 46.0, 43.0, 43.0, 39.0, 50.0, 36.0, 43.0, 16.0, 32.0, 26.0, 35.0, 22.0, 18.0, 13.0, 16.0, 13.0, 9.0, 10.0, 2.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34560775756836, -9.046968460083008, -8.748330116271973, -8.449690818786621, -8.151052474975586, -7.852413177490234, -7.553774356842041, -7.255135536193848, -6.956496238708496, -6.657857418060303, -6.359218597412109, -6.060579299926758, -5.7619404792785645, -5.463301658630371, -5.164662837982178, -4.866024017333984, -4.567385196685791, -4.268746376037598, -3.970107316970825, -3.671468496322632, -3.3728294372558594, -3.074190616607666, -2.7755517959594727, -2.4769127368927, -2.178273916244507, -1.879634976387024, -1.580996036529541, -1.2823572158813477, -0.9837182760238647, -0.6850793361663818, -0.3864405155181885, -0.08780145645141602, 0.21083736419677734, 0.5094763040542603, 0.8081151843070984, 1.1067540645599365, 1.4053930044174194, 1.7040319442749023, 2.0026707649230957, 2.301309823989868, 2.5999486446380615, 2.898587465286255, 3.1972265243530273, 3.4958653450012207, 3.794504165649414, 4.093143463134766, 4.391781806945801, 4.690421104431152, 4.989059925079346, 5.287698745727539, 5.586337566375732, 5.884976387023926, 6.183615684509277, 6.482254505157471, 6.780893325805664, 7.079532623291016, 7.378170967102051, 7.676809787750244, 7.9754486083984375, 8.274087905883789, 8.572726249694824, 8.871365547180176, 9.170003890991211, 9.468643188476562, 9.767282485961914]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 6.0, 4.0, 11.0, 21.0, 26.0, 28.0, 43.0, 37.0, 72.0, 110.0, 179.0, 209.0, 316.0, 472.0, 760.0, 1244.0, 2249.0, 4579.0, 9953.0, 24078.0, 61300.0, 153601.0, 303859.0, 273324.0, 125654.0, 49525.0, 19638.0, 8215.0, 3916.0, 1959.0, 1090.0, 693.0, 438.0, 253.0, 210.0, 129.0, 94.0, 64.0, 48.0, 37.0, 28.0, 25.0, 7.0, 15.0, 9.0, 4.0, 4.0, 9.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.25, -11.825927734375, -11.40185546875, -10.977783203125, -10.5537109375, -10.129638671875, -9.70556640625, -9.281494140625, -8.857421875, -8.433349609375, -8.00927734375, -7.585205078125, -7.1611328125, -6.737060546875, -6.31298828125, -5.888916015625, -5.46484375, -5.040771484375, -4.61669921875, -4.192626953125, -3.7685546875, -3.344482421875, -2.92041015625, -2.496337890625, -2.072265625, -1.648193359375, -1.22412109375, -0.800048828125, -0.3759765625, 0.048095703125, 0.47216796875, 0.896240234375, 1.3203125, 1.744384765625, 2.16845703125, 2.592529296875, 3.0166015625, 3.440673828125, 3.86474609375, 4.288818359375, 4.712890625, 5.136962890625, 5.56103515625, 5.985107421875, 6.4091796875, 6.833251953125, 7.25732421875, 7.681396484375, 8.10546875, 8.529541015625, 8.95361328125, 9.377685546875, 9.8017578125, 10.225830078125, 10.64990234375, 11.073974609375, 11.498046875, 11.922119140625, 12.34619140625, 12.770263671875, 13.1943359375, 13.618408203125, 14.04248046875, 14.466552734375, 14.890625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 4.0, 12.0, 15.0, 19.0, 20.0, 37.0, 47.0, 41.0, 42.0, 70.0, 54.0, 60.0, 70.0, 59.0, 69.0, 65.0, 54.0, 53.0, 40.0, 35.0, 35.0, 23.0, 21.0, 9.0, 12.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.293212890625, -5.12158203125, -4.949951171875, -4.7783203125, -4.606689453125, -4.43505859375, -4.263427734375, -4.091796875, -3.920166015625, -3.74853515625, -3.576904296875, -3.4052734375, -3.233642578125, -3.06201171875, -2.890380859375, -2.71875, -2.547119140625, -2.37548828125, -2.203857421875, -2.0322265625, -1.860595703125, -1.68896484375, -1.517333984375, -1.345703125, -1.174072265625, -1.00244140625, -0.830810546875, -0.6591796875, -0.487548828125, -0.31591796875, -0.144287109375, 0.02734375, 0.198974609375, 0.37060546875, 0.542236328125, 0.7138671875, 0.885498046875, 1.05712890625, 1.228759765625, 1.400390625, 1.572021484375, 1.74365234375, 1.915283203125, 2.0869140625, 2.258544921875, 2.43017578125, 2.601806640625, 2.7734375, 2.945068359375, 3.11669921875, 3.288330078125, 3.4599609375, 3.631591796875, 3.80322265625, 3.974853515625, 4.146484375, 4.318115234375, 4.48974609375, 4.661376953125, 4.8330078125, 5.004638671875, 5.17626953125, 5.347900390625, 5.51953125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 9.0, 13.0, 9.0, 16.0, 17.0, 31.0, 42.0, 45.0, 62.0, 107.0, 168.0, 281.0, 707.0, 2160.0, 16796.0, 866958.0, 153329.0, 5490.0, 1172.0, 426.0, 217.0, 126.0, 94.0, 78.0, 49.0, 31.0, 21.0, 15.0, 12.0, 9.0, 12.0, 6.0, 10.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.0, -62.9541015625, -60.908203125, -58.8623046875, -56.81640625, -54.7705078125, -52.724609375, -50.6787109375, -48.6328125, -46.5869140625, -44.541015625, -42.4951171875, -40.44921875, -38.4033203125, -36.357421875, -34.3115234375, -32.265625, -30.2197265625, -28.173828125, -26.1279296875, -24.08203125, -22.0361328125, -19.990234375, -17.9443359375, -15.8984375, -13.8525390625, -11.806640625, -9.7607421875, -7.71484375, -5.6689453125, -3.623046875, -1.5771484375, 0.46875, 2.5146484375, 4.560546875, 6.6064453125, 8.65234375, 10.6982421875, 12.744140625, 14.7900390625, 16.8359375, 18.8818359375, 20.927734375, 22.9736328125, 25.01953125, 27.0654296875, 29.111328125, 31.1572265625, 33.203125, 35.2490234375, 37.294921875, 39.3408203125, 41.38671875, 43.4326171875, 45.478515625, 47.5244140625, 49.5703125, 51.6162109375, 53.662109375, 55.7080078125, 57.75390625, 59.7998046875, 61.845703125, 63.8916015625, 65.9375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 6.0, 6.0, 10.0, 6.0, 13.0, 20.0, 19.0, 24.0, 45.0, 62.0, 60.0, 89.0, 93.0, 94.0, 82.0, 73.0, 74.0, 56.0, 39.0, 50.0, 20.0, 18.0, 9.0, 10.0, 3.0, 7.0, 3.0, 7.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.71875, -41.548828125, -40.37890625, -39.208984375, -38.0390625, -36.869140625, -35.69921875, -34.529296875, -33.359375, -32.189453125, -31.01953125, -29.849609375, -28.6796875, -27.509765625, -26.33984375, -25.169921875, -24.0, -22.830078125, -21.66015625, -20.490234375, -19.3203125, -18.150390625, -16.98046875, -15.810546875, -14.640625, -13.470703125, -12.30078125, -11.130859375, -9.9609375, -8.791015625, -7.62109375, -6.451171875, -5.28125, -4.111328125, -2.94140625, -1.771484375, -0.6015625, 0.568359375, 1.73828125, 2.908203125, 4.078125, 5.248046875, 6.41796875, 7.587890625, 8.7578125, 9.927734375, 11.09765625, 12.267578125, 13.4375, 14.607421875, 15.77734375, 16.947265625, 18.1171875, 19.287109375, 20.45703125, 21.626953125, 22.796875, 23.966796875, 25.13671875, 26.306640625, 27.4765625, 28.646484375, 29.81640625, 30.986328125, 32.15625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 17.0, 9.0, 15.0, 31.0, 40.0, 71.0, 59.0, 136.0, 314.0, 779.0, 3605.0, 29202.0, 535484.0, 448905.0, 25272.0, 3154.0, 732.0, 311.0, 120.0, 74.0, 45.0, 43.0, 24.0, 16.0, 21.0, 6.0, 9.0, 6.0, 4.0, 7.0, 2.0, 5.0, 10.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.9393310546875, -16.425537109375, -15.9117431640625, -15.39794921875, -14.8841552734375, -14.370361328125, -13.8565673828125, -13.3427734375, -12.8289794921875, -12.315185546875, -11.8013916015625, -11.28759765625, -10.7738037109375, -10.260009765625, -9.7462158203125, -9.232421875, -8.7186279296875, -8.204833984375, -7.6910400390625, -7.17724609375, -6.6634521484375, -6.149658203125, -5.6358642578125, -5.1220703125, -4.6082763671875, -4.094482421875, -3.5806884765625, -3.06689453125, -2.5531005859375, -2.039306640625, -1.5255126953125, -1.01171875, -0.4979248046875, 0.015869140625, 0.5296630859375, 1.04345703125, 1.5572509765625, 2.071044921875, 2.5848388671875, 3.0986328125, 3.6124267578125, 4.126220703125, 4.6400146484375, 5.15380859375, 5.6676025390625, 6.181396484375, 6.6951904296875, 7.208984375, 7.7227783203125, 8.236572265625, 8.7503662109375, 9.26416015625, 9.7779541015625, 10.291748046875, 10.8055419921875, 11.3193359375, 11.8331298828125, 12.346923828125, 12.8607177734375, 13.37451171875, 13.8883056640625, 14.402099609375, 14.9158935546875, 15.4296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 6.0, 6.0, 8.0, 8.0, 15.0, 11.0, 17.0, 25.0, 21.0, 39.0, 39.0, 39.0, 48.0, 50.0, 66.0, 60.0, 62.0, 54.0, 60.0, 60.0, 40.0, 32.0, 43.0, 30.0, 16.0, 31.0, 20.0, 16.0, 8.0, 13.0, 8.0, 5.0, 7.0, 9.0, 3.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.000843048095703125, -0.0008190125226974487, -0.0007949769496917725, -0.0007709413766860962, -0.0007469058036804199, -0.0007228702306747437, -0.0006988346576690674, -0.0006747990846633911, -0.0006507635116577148, -0.0006267279386520386, -0.0006026923656463623, -0.000578656792640686, -0.0005546212196350098, -0.0005305856466293335, -0.0005065500736236572, -0.00048251450061798096, -0.0004584789276123047, -0.0004344433546066284, -0.00041040778160095215, -0.0003863722085952759, -0.0003623366355895996, -0.00033830106258392334, -0.00031426548957824707, -0.0002902299165725708, -0.00026619434356689453, -0.00024215877056121826, -0.000218123197555542, -0.00019408762454986572, -0.00017005205154418945, -0.00014601647853851318, -0.00012198090553283691, -9.794533252716064e-05, -7.390975952148438e-05, -4.9874186515808105e-05, -2.5838613510131836e-05, -1.8030405044555664e-06, 2.2232532501220703e-05, 4.626810550689697e-05, 7.030367851257324e-05, 9.433925151824951e-05, 0.00011837482452392578, 0.00014241039752960205, 0.00016644597053527832, 0.0001904815435409546, 0.00021451711654663086, 0.00023855268955230713, 0.0002625882625579834, 0.00028662383556365967, 0.00031065940856933594, 0.0003346949815750122, 0.0003587305545806885, 0.00038276612758636475, 0.000406801700592041, 0.0004308372735977173, 0.00045487284660339355, 0.0004789084196090698, 0.0005029439926147461, 0.0005269795656204224, 0.0005510151386260986, 0.0005750507116317749, 0.0005990862846374512, 0.0006231218576431274, 0.0006471574306488037, 0.00067119300365448, 0.0006952285766601562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 7.0, 4.0, 13.0, 18.0, 26.0, 67.0, 140.0, 363.0, 1273.0, 10484.0, 894015.0, 137225.0, 3759.0, 703.0, 232.0, 107.0, 42.0, 27.0, 15.0, 8.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.5625, -31.5048828125, -30.447265625, -29.3896484375, -28.33203125, -27.2744140625, -26.216796875, -25.1591796875, -24.1015625, -23.0439453125, -21.986328125, -20.9287109375, -19.87109375, -18.8134765625, -17.755859375, -16.6982421875, -15.640625, -14.5830078125, -13.525390625, -12.4677734375, -11.41015625, -10.3525390625, -9.294921875, -8.2373046875, -7.1796875, -6.1220703125, -5.064453125, -4.0068359375, -2.94921875, -1.8916015625, -0.833984375, 0.2236328125, 1.28125, 2.3388671875, 3.396484375, 4.4541015625, 5.51171875, 6.5693359375, 7.626953125, 8.6845703125, 9.7421875, 10.7998046875, 11.857421875, 12.9150390625, 13.97265625, 15.0302734375, 16.087890625, 17.1455078125, 18.203125, 19.2607421875, 20.318359375, 21.3759765625, 22.43359375, 23.4912109375, 24.548828125, 25.6064453125, 26.6640625, 27.7216796875, 28.779296875, 29.8369140625, 30.89453125, 31.9521484375, 33.009765625, 34.0673828125, 35.125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 4.0, 8.0, 9.0, 17.0, 33.0, 54.0, 81.0, 109.0, 124.0, 142.0, 120.0, 95.0, 66.0, 46.0, 23.0, 20.0, 15.0, 8.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.1221923828125, -12.642822265625, -12.1634521484375, -11.68408203125, -11.2047119140625, -10.725341796875, -10.2459716796875, -9.7666015625, -9.2872314453125, -8.807861328125, -8.3284912109375, -7.84912109375, -7.3697509765625, -6.890380859375, -6.4110107421875, -5.931640625, -5.4522705078125, -4.972900390625, -4.4935302734375, -4.01416015625, -3.5347900390625, -3.055419921875, -2.5760498046875, -2.0966796875, -1.6173095703125, -1.137939453125, -0.6585693359375, -0.17919921875, 0.3001708984375, 0.779541015625, 1.2589111328125, 1.73828125, 2.2176513671875, 2.697021484375, 3.1763916015625, 3.65576171875, 4.1351318359375, 4.614501953125, 5.0938720703125, 5.5732421875, 6.0526123046875, 6.531982421875, 7.0113525390625, 7.49072265625, 7.9700927734375, 8.449462890625, 8.9288330078125, 9.408203125, 9.8875732421875, 10.366943359375, 10.8463134765625, 11.32568359375, 11.8050537109375, 12.284423828125, 12.7637939453125, 13.2431640625, 13.7225341796875, 14.201904296875, 14.6812744140625, 15.16064453125, 15.6400146484375, 16.119384765625, 16.5987548828125, 17.078125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 14.0, 23.0, 61.0, 129.0, 175.0, 219.0, 174.0, 111.0, 46.0, 30.0, 9.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-247.31735229492188, -239.45172119140625, -231.58609008789062, -223.720458984375, -215.8548126220703, -207.9891815185547, -200.12355041503906, -192.25791931152344, -184.3922882080078, -176.5266571044922, -168.66102600097656, -160.79537963867188, -152.92974853515625, -145.06411743164062, -137.198486328125, -129.33285522460938, -121.46721649169922, -113.6015853881836, -105.73594665527344, -97.87031555175781, -90.00468444824219, -82.13905334472656, -74.2734146118164, -66.40778350830078, -58.54214859008789, -50.676513671875, -42.810882568359375, -34.945247650146484, -27.079614639282227, -19.21398162841797, -11.348346710205078, -3.482715606689453, 4.3829193115234375, 12.248552322387695, 20.114185333251953, 27.979820251464844, 35.84545135498047, 43.71108627319336, 51.57672119140625, 59.442352294921875, 67.3079833984375, 75.17361450195312, 83.03925323486328, 90.9048843383789, 98.77051544189453, 106.63615417480469, 114.50178527832031, 122.36741638183594, 130.23306274414062, 138.09869384765625, 145.96432495117188, 153.8299560546875, 161.6956024169922, 169.5612335205078, 177.42686462402344, 185.29249572753906, 193.1581268310547, 201.0237579345703, 208.88938903808594, 216.75503540039062, 224.62066650390625, 232.48629760742188, 240.3519287109375, 248.21755981445312, 256.08319091796875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 3.0, 6.0, 3.0, 13.0, 10.0, 23.0, 12.0, 21.0, 33.0, 31.0, 29.0, 30.0, 56.0, 37.0, 44.0, 36.0, 44.0, 49.0, 55.0, 50.0, 50.0, 53.0, 47.0, 41.0, 40.0, 38.0, 21.0, 32.0, 20.0, 16.0, 9.0, 10.0, 6.0, 10.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-115.8680648803711, -112.44839477539062, -109.02872467041016, -105.60905456542969, -102.18938446044922, -98.76971435546875, -95.35003662109375, -91.93037414550781, -88.51069641113281, -85.09102630615234, -81.67135620117188, -78.2516860961914, -74.83201599121094, -71.41234588623047, -67.99267578125, -64.572998046875, -61.15333557128906, -57.733665466308594, -54.313995361328125, -50.894325256347656, -47.47465515136719, -44.05498504638672, -40.635311126708984, -37.215641021728516, -33.79597091674805, -30.376300811767578, -26.95663070678711, -23.536958694458008, -20.11728858947754, -16.69761848449707, -13.277946472167969, -9.8582763671875, -6.4385986328125, -3.018928050994873, 0.4007425308227539, 3.820413589477539, 7.240083694458008, 10.659753799438477, 14.079425811767578, 17.499095916748047, 20.918766021728516, 24.338436126708984, 27.758106231689453, 31.177778244018555, 34.597450256347656, 38.017120361328125, 41.436790466308594, 44.85646057128906, 48.27613067626953, 51.69580078125, 55.11547088623047, 58.53514099121094, 61.954811096191406, 65.37448120117188, 68.79415893554688, 72.21382141113281, 75.63349914550781, 79.05316925048828, 82.47283935546875, 85.89250946044922, 89.31217956542969, 92.73184967041016, 96.15151977539062, 99.57119750976562, 102.99085998535156]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 11.0, 17.0, 28.0, 17.0, 50.0, 82.0, 134.0, 212.0, 477.0, 1103.0, 3450.0, 15570.0, 3540646.0, 612445.0, 14571.0, 3377.0, 1148.0, 456.0, 210.0, 98.0, 54.0, 28.0, 21.0, 11.0, 16.0, 8.0, 10.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.21875, -38.8310546875, -37.443359375, -36.0556640625, -34.66796875, -33.2802734375, -31.892578125, -30.5048828125, -29.1171875, -27.7294921875, -26.341796875, -24.9541015625, -23.56640625, -22.1787109375, -20.791015625, -19.4033203125, -18.015625, -16.6279296875, -15.240234375, -13.8525390625, -12.46484375, -11.0771484375, -9.689453125, -8.3017578125, -6.9140625, -5.5263671875, -4.138671875, -2.7509765625, -1.36328125, 0.0244140625, 1.412109375, 2.7998046875, 4.1875, 5.5751953125, 6.962890625, 8.3505859375, 9.73828125, 11.1259765625, 12.513671875, 13.9013671875, 15.2890625, 16.6767578125, 18.064453125, 19.4521484375, 20.83984375, 22.2275390625, 23.615234375, 25.0029296875, 26.390625, 27.7783203125, 29.166015625, 30.5537109375, 31.94140625, 33.3291015625, 34.716796875, 36.1044921875, 37.4921875, 38.8798828125, 40.267578125, 41.6552734375, 43.04296875, 44.4306640625, 45.818359375, 47.2060546875, 48.59375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 6.0, 6.0, 14.0, 17.0, 29.0, 43.0, 49.0, 61.0, 62.0, 81.0, 95.0, 78.0, 86.0, 69.0, 81.0, 61.0, 51.0, 36.0, 15.0, 17.0, 13.0, 17.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.06768798828125, -5.8463134765625, -5.62493896484375, -5.403564453125, -5.18218994140625, -4.9608154296875, -4.73944091796875, -4.51806640625, -4.29669189453125, -4.0753173828125, -3.85394287109375, -3.632568359375, -3.41119384765625, -3.1898193359375, -2.96844482421875, -2.7470703125, -2.52569580078125, -2.3043212890625, -2.08294677734375, -1.861572265625, -1.64019775390625, -1.4188232421875, -1.19744873046875, -0.97607421875, -0.75469970703125, -0.5333251953125, -0.31195068359375, -0.090576171875, 0.13079833984375, 0.3521728515625, 0.57354736328125, 0.794921875, 1.01629638671875, 1.2376708984375, 1.45904541015625, 1.680419921875, 1.90179443359375, 2.1231689453125, 2.34454345703125, 2.56591796875, 2.78729248046875, 3.0086669921875, 3.23004150390625, 3.451416015625, 3.67279052734375, 3.8941650390625, 4.11553955078125, 4.3369140625, 4.55828857421875, 4.7796630859375, 5.00103759765625, 5.222412109375, 5.44378662109375, 5.6651611328125, 5.88653564453125, 6.10791015625, 6.32928466796875, 6.5506591796875, 6.77203369140625, 6.993408203125, 7.21478271484375, 7.4361572265625, 7.65753173828125, 7.87890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 7.0, 6.0, 12.0, 6.0, 14.0, 22.0, 25.0, 33.0, 49.0, 55.0, 85.0, 92.0, 134.0, 174.0, 294.0, 399.0, 571.0, 837.0, 1351.0, 2341.0, 4690.0, 10785.0, 32241.0, 213794.0, 3776625.0, 108751.0, 22895.0, 8312.0, 3834.0, 2058.0, 1254.0, 766.0, 477.0, 338.0, 230.0, 182.0, 142.0, 112.0, 72.0, 48.0, 42.0, 28.0, 24.0, 23.0, 22.0, 7.0, 10.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.7109375, -14.27001953125, -13.8291015625, -13.38818359375, -12.947265625, -12.50634765625, -12.0654296875, -11.62451171875, -11.18359375, -10.74267578125, -10.3017578125, -9.86083984375, -9.419921875, -8.97900390625, -8.5380859375, -8.09716796875, -7.65625, -7.21533203125, -6.7744140625, -6.33349609375, -5.892578125, -5.45166015625, -5.0107421875, -4.56982421875, -4.12890625, -3.68798828125, -3.2470703125, -2.80615234375, -2.365234375, -1.92431640625, -1.4833984375, -1.04248046875, -0.6015625, -0.16064453125, 0.2802734375, 0.72119140625, 1.162109375, 1.60302734375, 2.0439453125, 2.48486328125, 2.92578125, 3.36669921875, 3.8076171875, 4.24853515625, 4.689453125, 5.13037109375, 5.5712890625, 6.01220703125, 6.453125, 6.89404296875, 7.3349609375, 7.77587890625, 8.216796875, 8.65771484375, 9.0986328125, 9.53955078125, 9.98046875, 10.42138671875, 10.8623046875, 11.30322265625, 11.744140625, 12.18505859375, 12.6259765625, 13.06689453125, 13.5078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 3.0, 9.0, 8.0, 8.0, 11.0, 27.0, 27.0, 52.0, 99.0, 249.0, 2600.0, 518.0, 187.0, 93.0, 43.0, 35.0, 22.0, 14.0, 11.0, 4.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-3.919921875, -3.8189697265625, -3.718017578125, -3.6170654296875, -3.51611328125, -3.4151611328125, -3.314208984375, -3.2132568359375, -3.1123046875, -3.0113525390625, -2.910400390625, -2.8094482421875, -2.70849609375, -2.6075439453125, -2.506591796875, -2.4056396484375, -2.3046875, -2.2037353515625, -2.102783203125, -2.0018310546875, -1.90087890625, -1.7999267578125, -1.698974609375, -1.5980224609375, -1.4970703125, -1.3961181640625, -1.295166015625, -1.1942138671875, -1.09326171875, -0.9923095703125, -0.891357421875, -0.7904052734375, -0.689453125, -0.5885009765625, -0.487548828125, -0.3865966796875, -0.28564453125, -0.1846923828125, -0.083740234375, 0.0172119140625, 0.1181640625, 0.2191162109375, 0.320068359375, 0.4210205078125, 0.52197265625, 0.6229248046875, 0.723876953125, 0.8248291015625, 0.92578125, 1.0267333984375, 1.127685546875, 1.2286376953125, 1.32958984375, 1.4305419921875, 1.531494140625, 1.6324462890625, 1.7333984375, 1.8343505859375, 1.935302734375, 2.0362548828125, 2.13720703125, 2.2381591796875, 2.339111328125, 2.4400634765625, 2.541015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 7.0, 17.0, 21.0, 32.0, 61.0, 99.0, 136.0, 165.0, 165.0, 131.0, 68.0, 33.0, 22.0, 10.0, 10.0, 8.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.878122329711914, -21.056169509887695, -20.23421859741211, -19.41226577758789, -18.590312957763672, -17.768362045288086, -16.946409225463867, -16.12445831298828, -15.302505493164062, -14.48055362701416, -13.658601760864258, -12.836648941040039, -12.014697074890137, -11.192745208740234, -10.370792388916016, -9.548840522766113, -8.726888656616211, -7.904936790466309, -7.082984447479248, -6.2610321044921875, -5.439080238342285, -4.617128372192383, -3.7951760292053223, -2.9732236862182617, -2.1512718200683594, -1.329319715499878, -0.5073676109313965, 0.31458449363708496, 1.1365365982055664, 1.9584884643554688, 2.7804408073425293, 3.60239315032959, 4.424346923828125, 5.246298789978027, 6.068251132965088, 6.890203475952148, 7.712155342102051, 8.534107208251953, 9.356060028076172, 10.178011894226074, 10.999963760375977, 11.821915626525879, 12.643867492675781, 13.4658203125, 14.287772178649902, 15.109724044799805, 15.931676864624023, 16.75362777709961, 17.575580596923828, 18.397533416748047, 19.219484329223633, 20.04143714904785, 20.863388061523438, 21.685340881347656, 22.507293701171875, 23.329246520996094, 24.15119743347168, 24.9731502532959, 25.795101165771484, 26.617053985595703, 27.439006805419922, 28.260957717895508, 29.082910537719727, 29.904861450195312, 30.72681427001953]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 2.0, 7.0, 10.0, 7.0, 8.0, 17.0, 16.0, 29.0, 25.0, 27.0, 38.0, 47.0, 48.0, 55.0, 60.0, 59.0, 67.0, 47.0, 43.0, 43.0, 50.0, 44.0, 35.0, 41.0, 35.0, 26.0, 21.0, 16.0, 25.0, 10.0, 11.0, 11.0, 6.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.751505851745605, -10.385904312133789, -10.020303726196289, -9.654702186584473, -9.289101600646973, -8.923500061035156, -8.557899475097656, -8.19229793548584, -7.826696872711182, -7.461095809936523, -7.095494747161865, -6.729893684387207, -6.364292144775391, -5.998691558837891, -5.633090019226074, -5.267488956451416, -4.901887893676758, -4.5362868309021, -4.170685768127441, -3.805084466934204, -3.439483404159546, -3.0738823413848877, -2.7082810401916504, -2.342679977416992, -1.977078914642334, -1.6114778518676758, -1.245876669883728, -0.8802754878997803, -0.5146744251251221, -0.14907336235046387, 0.21652793884277344, 0.5821290016174316, 0.9477291107177734, 1.3133301734924316, 1.6789313554763794, 2.044532537460327, 2.4101336002349854, 2.7757346630096436, 3.141335964202881, 3.506937026977539, 3.8725380897521973, 4.2381391525268555, 4.603740215301514, 4.969341278076172, 5.334942817687988, 5.700543403625488, 6.066144943237305, 6.431746006011963, 6.797347068786621, 7.162948131561279, 7.5285491943359375, 7.894150733947754, 8.259751319885254, 8.62535285949707, 8.99095344543457, 9.356554985046387, 9.722156524658203, 10.08775806427002, 10.45335865020752, 10.818960189819336, 11.184560775756836, 11.550162315368652, 11.915763854980469, 12.281364440917969, 12.646965026855469]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 4.0, 7.0, 9.0, 18.0, 18.0, 42.0, 49.0, 67.0, 115.0, 156.0, 244.0, 418.0, 693.0, 1249.0, 2390.0, 5114.0, 12445.0, 34604.0, 111348.0, 309614.0, 353147.0, 144243.0, 44684.0, 15416.0, 6103.0, 2813.0, 1399.0, 761.0, 450.0, 305.0, 182.0, 132.0, 91.0, 53.0, 45.0, 39.0, 18.0, 19.0, 9.0, 9.0, 12.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0], "bins": [-16.96875, -16.4854736328125, -16.002197265625, -15.5189208984375, -15.03564453125, -14.5523681640625, -14.069091796875, -13.5858154296875, -13.1025390625, -12.6192626953125, -12.135986328125, -11.6527099609375, -11.16943359375, -10.6861572265625, -10.202880859375, -9.7196044921875, -9.236328125, -8.7530517578125, -8.269775390625, -7.7864990234375, -7.30322265625, -6.8199462890625, -6.336669921875, -5.8533935546875, -5.3701171875, -4.8868408203125, -4.403564453125, -3.9202880859375, -3.43701171875, -2.9537353515625, -2.470458984375, -1.9871826171875, -1.50390625, -1.0206298828125, -0.537353515625, -0.0540771484375, 0.42919921875, 0.9124755859375, 1.395751953125, 1.8790283203125, 2.3623046875, 2.8455810546875, 3.328857421875, 3.8121337890625, 4.29541015625, 4.7786865234375, 5.261962890625, 5.7452392578125, 6.228515625, 6.7117919921875, 7.195068359375, 7.6783447265625, 8.16162109375, 8.6448974609375, 9.128173828125, 9.6114501953125, 10.0947265625, 10.5780029296875, 11.061279296875, 11.5445556640625, 12.02783203125, 12.5111083984375, 12.994384765625, 13.4776611328125, 13.9609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 5.0, 9.0, 11.0, 20.0, 14.0, 27.0, 34.0, 51.0, 65.0, 79.0, 82.0, 73.0, 94.0, 70.0, 78.0, 62.0, 66.0, 42.0, 40.0, 28.0, 16.0, 16.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.81640625, -6.58367919921875, -6.3509521484375, -6.11822509765625, -5.885498046875, -5.65277099609375, -5.4200439453125, -5.18731689453125, -4.95458984375, -4.72186279296875, -4.4891357421875, -4.25640869140625, -4.023681640625, -3.79095458984375, -3.5582275390625, -3.32550048828125, -3.0927734375, -2.86004638671875, -2.6273193359375, -2.39459228515625, -2.161865234375, -1.92913818359375, -1.6964111328125, -1.46368408203125, -1.23095703125, -0.99822998046875, -0.7655029296875, -0.53277587890625, -0.300048828125, -0.06732177734375, 0.1654052734375, 0.39813232421875, 0.630859375, 0.86358642578125, 1.0963134765625, 1.32904052734375, 1.561767578125, 1.79449462890625, 2.0272216796875, 2.25994873046875, 2.49267578125, 2.72540283203125, 2.9581298828125, 3.19085693359375, 3.423583984375, 3.65631103515625, 3.8890380859375, 4.12176513671875, 4.3544921875, 4.58721923828125, 4.8199462890625, 5.05267333984375, 5.285400390625, 5.51812744140625, 5.7508544921875, 5.98358154296875, 6.21630859375, 6.44903564453125, 6.6817626953125, 6.91448974609375, 7.147216796875, 7.37994384765625, 7.6126708984375, 7.84539794921875, 8.078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 4.0, 7.0, 10.0, 8.0, 25.0, 17.0, 28.0, 42.0, 51.0, 99.0, 226.0, 477.0, 1310.0, 6941.0, 458157.0, 571209.0, 7479.0, 1433.0, 462.0, 209.0, 109.0, 58.0, 38.0, 42.0, 25.0, 17.0, 13.0, 12.0, 7.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.9375, -74.607421875, -72.27734375, -69.947265625, -67.6171875, -65.287109375, -62.95703125, -60.626953125, -58.296875, -55.966796875, -53.63671875, -51.306640625, -48.9765625, -46.646484375, -44.31640625, -41.986328125, -39.65625, -37.326171875, -34.99609375, -32.666015625, -30.3359375, -28.005859375, -25.67578125, -23.345703125, -21.015625, -18.685546875, -16.35546875, -14.025390625, -11.6953125, -9.365234375, -7.03515625, -4.705078125, -2.375, -0.044921875, 2.28515625, 4.615234375, 6.9453125, 9.275390625, 11.60546875, 13.935546875, 16.265625, 18.595703125, 20.92578125, 23.255859375, 25.5859375, 27.916015625, 30.24609375, 32.576171875, 34.90625, 37.236328125, 39.56640625, 41.896484375, 44.2265625, 46.556640625, 48.88671875, 51.216796875, 53.546875, 55.876953125, 58.20703125, 60.537109375, 62.8671875, 65.197265625, 67.52734375, 69.857421875, 72.1875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 4.0, 3.0, 8.0, 6.0, 13.0, 10.0, 25.0, 31.0, 42.0, 51.0, 57.0, 77.0, 95.0, 92.0, 95.0, 86.0, 76.0, 44.0, 48.0, 31.0, 33.0, 11.0, 10.0, 15.0, 6.0, 3.0, 5.0, 5.0, 6.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.09375, -48.83447265625, -47.5751953125, -46.31591796875, -45.056640625, -43.79736328125, -42.5380859375, -41.27880859375, -40.01953125, -38.76025390625, -37.5009765625, -36.24169921875, -34.982421875, -33.72314453125, -32.4638671875, -31.20458984375, -29.9453125, -28.68603515625, -27.4267578125, -26.16748046875, -24.908203125, -23.64892578125, -22.3896484375, -21.13037109375, -19.87109375, -18.61181640625, -17.3525390625, -16.09326171875, -14.833984375, -13.57470703125, -12.3154296875, -11.05615234375, -9.796875, -8.53759765625, -7.2783203125, -6.01904296875, -4.759765625, -3.50048828125, -2.2412109375, -0.98193359375, 0.27734375, 1.53662109375, 2.7958984375, 4.05517578125, 5.314453125, 6.57373046875, 7.8330078125, 9.09228515625, 10.3515625, 11.61083984375, 12.8701171875, 14.12939453125, 15.388671875, 16.64794921875, 17.9072265625, 19.16650390625, 20.42578125, 21.68505859375, 22.9443359375, 24.20361328125, 25.462890625, 26.72216796875, 27.9814453125, 29.24072265625, 30.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 5.0, 8.0, 8.0, 12.0, 28.0, 20.0, 40.0, 43.0, 49.0, 91.0, 160.0, 269.0, 575.0, 2232.0, 27639.0, 931751.0, 80108.0, 3867.0, 805.0, 336.0, 189.0, 82.0, 67.0, 49.0, 36.0, 15.0, 15.0, 11.0, 10.0, 4.0, 9.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34375, -22.581787109375, -21.81982421875, -21.057861328125, -20.2958984375, -19.533935546875, -18.77197265625, -18.010009765625, -17.248046875, -16.486083984375, -15.72412109375, -14.962158203125, -14.2001953125, -13.438232421875, -12.67626953125, -11.914306640625, -11.15234375, -10.390380859375, -9.62841796875, -8.866455078125, -8.1044921875, -7.342529296875, -6.58056640625, -5.818603515625, -5.056640625, -4.294677734375, -3.53271484375, -2.770751953125, -2.0087890625, -1.246826171875, -0.48486328125, 0.277099609375, 1.0390625, 1.801025390625, 2.56298828125, 3.324951171875, 4.0869140625, 4.848876953125, 5.61083984375, 6.372802734375, 7.134765625, 7.896728515625, 8.65869140625, 9.420654296875, 10.1826171875, 10.944580078125, 11.70654296875, 12.468505859375, 13.23046875, 13.992431640625, 14.75439453125, 15.516357421875, 16.2783203125, 17.040283203125, 17.80224609375, 18.564208984375, 19.326171875, 20.088134765625, 20.85009765625, 21.612060546875, 22.3740234375, 23.135986328125, 23.89794921875, 24.659912109375, 25.421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 9.0, 6.0, 11.0, 16.0, 31.0, 50.0, 76.0, 149.0, 200.0, 169.0, 125.0, 68.0, 34.0, 19.0, 16.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0028228759765625, -0.002751663327217102, -0.002680450677871704, -0.002609238028526306, -0.002538025379180908, -0.0024668127298355103, -0.0023956000804901123, -0.0023243874311447144, -0.0022531747817993164, -0.0021819621324539185, -0.0021107494831085205, -0.0020395368337631226, -0.0019683241844177246, -0.0018971115350723267, -0.0018258988857269287, -0.0017546862363815308, -0.0016834735870361328, -0.0016122609376907349, -0.001541048288345337, -0.001469835638999939, -0.001398622989654541, -0.001327410340309143, -0.0012561976909637451, -0.0011849850416183472, -0.0011137723922729492, -0.0010425597429275513, -0.0009713470935821533, -0.0009001344442367554, -0.0008289217948913574, -0.0007577091455459595, -0.0006864964962005615, -0.0006152838468551636, -0.0005440711975097656, -0.0004728585481643677, -0.0004016458988189697, -0.0003304332494735718, -0.00025922060012817383, -0.00018800795078277588, -0.00011679530143737793, -4.558265209197998e-05, 2.562999725341797e-05, 9.684264659881592e-05, 0.00016805529594421387, 0.00023926794528961182, 0.00031048059463500977, 0.0003816932439804077, 0.00045290589332580566, 0.0005241185426712036, 0.0005953311920166016, 0.0006665438413619995, 0.0007377564907073975, 0.0008089691400527954, 0.0008801817893981934, 0.0009513944387435913, 0.0010226070880889893, 0.0010938197374343872, 0.0011650323867797852, 0.001236245036125183, 0.001307457685470581, 0.001378670334815979, 0.001449882984161377, 0.001521095633506775, 0.0015923082828521729, 0.0016635209321975708, 0.0017347335815429688]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 5.0, 2.0, 9.0, 6.0, 14.0, 17.0, 21.0, 35.0, 45.0, 98.0, 151.0, 286.0, 722.0, 3110.0, 38561.0, 951414.0, 48957.0, 3570.0, 816.0, 323.0, 155.0, 75.0, 53.0, 27.0, 25.0, 17.0, 13.0, 10.0, 7.0, 1.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.90625, -28.114990234375, -27.32373046875, -26.532470703125, -25.7412109375, -24.949951171875, -24.15869140625, -23.367431640625, -22.576171875, -21.784912109375, -20.99365234375, -20.202392578125, -19.4111328125, -18.619873046875, -17.82861328125, -17.037353515625, -16.24609375, -15.454833984375, -14.66357421875, -13.872314453125, -13.0810546875, -12.289794921875, -11.49853515625, -10.707275390625, -9.916015625, -9.124755859375, -8.33349609375, -7.542236328125, -6.7509765625, -5.959716796875, -5.16845703125, -4.377197265625, -3.5859375, -2.794677734375, -2.00341796875, -1.212158203125, -0.4208984375, 0.370361328125, 1.16162109375, 1.952880859375, 2.744140625, 3.535400390625, 4.32666015625, 5.117919921875, 5.9091796875, 6.700439453125, 7.49169921875, 8.282958984375, 9.07421875, 9.865478515625, 10.65673828125, 11.447998046875, 12.2392578125, 13.030517578125, 13.82177734375, 14.613037109375, 15.404296875, 16.195556640625, 16.98681640625, 17.778076171875, 18.5693359375, 19.360595703125, 20.15185546875, 20.943115234375, 21.734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 6.0, 1.0, 6.0, 3.0, 10.0, 10.0, 15.0, 10.0, 18.0, 24.0, 41.0, 63.0, 96.0, 123.0, 131.0, 129.0, 97.0, 62.0, 33.0, 28.0, 24.0, 13.0, 14.0, 5.0, 5.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.0792236328125, -10.674072265625, -10.2689208984375, -9.86376953125, -9.4586181640625, -9.053466796875, -8.6483154296875, -8.2431640625, -7.8380126953125, -7.432861328125, -7.0277099609375, -6.62255859375, -6.2174072265625, -5.812255859375, -5.4071044921875, -5.001953125, -4.5968017578125, -4.191650390625, -3.7864990234375, -3.38134765625, -2.9761962890625, -2.571044921875, -2.1658935546875, -1.7607421875, -1.3555908203125, -0.950439453125, -0.5452880859375, -0.14013671875, 0.2650146484375, 0.670166015625, 1.0753173828125, 1.48046875, 1.8856201171875, 2.290771484375, 2.6959228515625, 3.10107421875, 3.5062255859375, 3.911376953125, 4.3165283203125, 4.7216796875, 5.1268310546875, 5.531982421875, 5.9371337890625, 6.34228515625, 6.7474365234375, 7.152587890625, 7.5577392578125, 7.962890625, 8.3680419921875, 8.773193359375, 9.1783447265625, 9.58349609375, 9.9886474609375, 10.393798828125, 10.7989501953125, 11.2041015625, 11.6092529296875, 12.014404296875, 12.4195556640625, 12.82470703125, 13.2298583984375, 13.635009765625, 14.0401611328125, 14.4453125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 23.0, 35.0, 92.0, 164.0, 210.0, 199.0, 134.0, 62.0, 35.0, 20.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.58497619628906, -163.07998657226562, -155.57498168945312, -148.0699920654297, -140.56500244140625, -133.05999755859375, -125.55500793457031, -118.05001068115234, -110.54501342773438, -103.0400161743164, -95.53501892089844, -88.030029296875, -80.52503204345703, -73.02003479003906, -65.51504516601562, -58.010047912597656, -50.50505065917969, -43.00005340576172, -35.495059967041016, -27.99006462097168, -20.485069274902344, -12.980072021484375, -5.475078582763672, 2.0299148559570312, 9.534912109375, 17.039907455444336, 24.544902801513672, 32.049896240234375, 39.554893493652344, 47.05989074707031, 54.564884185791016, 62.06987762451172, 69.57485961914062, 77.0798568725586, 84.58485412597656, 92.08984375, 99.59484100341797, 107.09983825683594, 114.60482788085938, 122.10982513427734, 129.6148223876953, 137.11981201171875, 144.62481689453125, 152.1298065185547, 159.63479614257812, 167.13980102539062, 174.64479064941406, 182.1497802734375, 189.65478515625, 197.15977478027344, 204.66477966308594, 212.16976928710938, 219.67477416992188, 227.1797637939453, 234.68475341796875, 242.18975830078125, 249.6947479248047, 257.1997375488281, 264.7047424316406, 272.2097473144531, 279.7147216796875, 287.2197265625, 294.7247314453125, 302.2297058105469, 309.7347106933594]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 11.0, 10.0, 10.0, 13.0, 10.0, 18.0, 16.0, 18.0, 31.0, 24.0, 23.0, 43.0, 38.0, 28.0, 43.0, 33.0, 41.0, 39.0, 38.0, 53.0, 25.0, 37.0, 35.0, 32.0, 33.0, 36.0, 30.0, 24.0, 23.0, 28.0, 20.0, 20.0, 16.0, 14.0, 14.0, 11.0, 6.0, 8.0, 9.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.84262084960938, -72.40647888183594, -69.9703369140625, -67.53418731689453, -65.0980453491211, -62.661903381347656, -60.22576141357422, -57.789615631103516, -55.35346984863281, -52.917327880859375, -50.48118209838867, -48.045040130615234, -45.60889434814453, -43.172752380371094, -40.736610412597656, -38.30046463012695, -35.864322662353516, -33.42818069458008, -30.992034912109375, -28.555892944335938, -26.119747161865234, -23.683605194091797, -21.247461318969727, -18.811317443847656, -16.375173568725586, -13.939029693603516, -11.502885818481445, -9.066742897033691, -6.630599021911621, -4.194455146789551, -1.7583122253417969, 0.6778316497802734, 3.1139755249023438, 5.550119400024414, 7.986262798309326, 10.422406196594238, 12.858550071716309, 15.294693946838379, 17.730836868286133, 20.166980743408203, 22.603124618530273, 25.039268493652344, 27.475412368774414, 29.911556243896484, 32.34769821166992, 34.783843994140625, 37.21998596191406, 39.6561279296875, 42.0922737121582, 44.52841567993164, 46.964561462402344, 49.40070343017578, 51.836849212646484, 54.27299118041992, 56.709136962890625, 59.14527893066406, 61.5814208984375, 64.01756286621094, 66.45370483398438, 68.88985443115234, 71.32599639892578, 73.76213836669922, 76.19828033447266, 78.63442993164062, 81.07057189941406]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 8.0, 10.0, 19.0, 17.0, 29.0, 35.0, 79.0, 150.0, 267.0, 569.0, 1408.0, 4090.0, 36041.0, 4122154.0, 23625.0, 3482.0, 1245.0, 525.0, 222.0, 114.0, 77.0, 34.0, 22.0, 15.0, 9.0, 14.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.15625, -43.7197265625, -42.283203125, -40.8466796875, -39.41015625, -37.9736328125, -36.537109375, -35.1005859375, -33.6640625, -32.2275390625, -30.791015625, -29.3544921875, -27.91796875, -26.4814453125, -25.044921875, -23.6083984375, -22.171875, -20.7353515625, -19.298828125, -17.8623046875, -16.42578125, -14.9892578125, -13.552734375, -12.1162109375, -10.6796875, -9.2431640625, -7.806640625, -6.3701171875, -4.93359375, -3.4970703125, -2.060546875, -0.6240234375, 0.8125, 2.2490234375, 3.685546875, 5.1220703125, 6.55859375, 7.9951171875, 9.431640625, 10.8681640625, 12.3046875, 13.7412109375, 15.177734375, 16.6142578125, 18.05078125, 19.4873046875, 20.923828125, 22.3603515625, 23.796875, 25.2333984375, 26.669921875, 28.1064453125, 29.54296875, 30.9794921875, 32.416015625, 33.8525390625, 35.2890625, 36.7255859375, 38.162109375, 39.5986328125, 41.03515625, 42.4716796875, 43.908203125, 45.3447265625, 46.78125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 10.0, 11.0, 18.0, 20.0, 38.0, 56.0, 72.0, 73.0, 90.0, 101.0, 107.0, 92.0, 89.0, 76.0, 54.0, 26.0, 27.0, 14.0, 13.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9765625, -7.6802978515625, -7.384033203125, -7.0877685546875, -6.79150390625, -6.4952392578125, -6.198974609375, -5.9027099609375, -5.6064453125, -5.3101806640625, -5.013916015625, -4.7176513671875, -4.42138671875, -4.1251220703125, -3.828857421875, -3.5325927734375, -3.236328125, -2.9400634765625, -2.643798828125, -2.3475341796875, -2.05126953125, -1.7550048828125, -1.458740234375, -1.1624755859375, -0.8662109375, -0.5699462890625, -0.273681640625, 0.0225830078125, 0.31884765625, 0.6151123046875, 0.911376953125, 1.2076416015625, 1.50390625, 1.8001708984375, 2.096435546875, 2.3927001953125, 2.68896484375, 2.9852294921875, 3.281494140625, 3.5777587890625, 3.8740234375, 4.1702880859375, 4.466552734375, 4.7628173828125, 5.05908203125, 5.3553466796875, 5.651611328125, 5.9478759765625, 6.244140625, 6.5404052734375, 6.836669921875, 7.1329345703125, 7.42919921875, 7.7254638671875, 8.021728515625, 8.3179931640625, 8.6142578125, 8.9105224609375, 9.206787109375, 9.5030517578125, 9.79931640625, 10.0955810546875, 10.391845703125, 10.6881103515625, 10.984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 10.0, 11.0, 17.0, 14.0, 15.0, 20.0, 18.0, 34.0, 23.0, 43.0, 67.0, 113.0, 380.0, 1400.0, 6417.0, 3948057.0, 230404.0, 5315.0, 1210.0, 298.0, 113.0, 52.0, 44.0, 28.0, 27.0, 34.0, 19.0, 15.0, 11.0, 14.0, 12.0, 11.0, 7.0, 5.0, 0.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-60.59375, -59.03759765625, -57.4814453125, -55.92529296875, -54.369140625, -52.81298828125, -51.2568359375, -49.70068359375, -48.14453125, -46.58837890625, -45.0322265625, -43.47607421875, -41.919921875, -40.36376953125, -38.8076171875, -37.25146484375, -35.6953125, -34.13916015625, -32.5830078125, -31.02685546875, -29.470703125, -27.91455078125, -26.3583984375, -24.80224609375, -23.24609375, -21.68994140625, -20.1337890625, -18.57763671875, -17.021484375, -15.46533203125, -13.9091796875, -12.35302734375, -10.796875, -9.24072265625, -7.6845703125, -6.12841796875, -4.572265625, -3.01611328125, -1.4599609375, 0.09619140625, 1.65234375, 3.20849609375, 4.7646484375, 6.32080078125, 7.876953125, 9.43310546875, 10.9892578125, 12.54541015625, 14.1015625, 15.65771484375, 17.2138671875, 18.77001953125, 20.326171875, 21.88232421875, 23.4384765625, 24.99462890625, 26.55078125, 28.10693359375, 29.6630859375, 31.21923828125, 32.775390625, 34.33154296875, 35.8876953125, 37.44384765625, 39.0]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 39.0, 168.0, 3617.0, 159.0, 35.0, 15.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.140625, -11.89044189453125, -11.6402587890625, -11.39007568359375, -11.139892578125, -10.88970947265625, -10.6395263671875, -10.38934326171875, -10.13916015625, -9.88897705078125, -9.6387939453125, -9.38861083984375, -9.138427734375, -8.88824462890625, -8.6380615234375, -8.38787841796875, -8.1376953125, -7.88751220703125, -7.6373291015625, -7.38714599609375, -7.136962890625, -6.88677978515625, -6.6365966796875, -6.38641357421875, -6.13623046875, -5.88604736328125, -5.6358642578125, -5.38568115234375, -5.135498046875, -4.88531494140625, -4.6351318359375, -4.38494873046875, -4.134765625, -3.88458251953125, -3.6343994140625, -3.38421630859375, -3.134033203125, -2.88385009765625, -2.6336669921875, -2.38348388671875, -2.13330078125, -1.88311767578125, -1.6329345703125, -1.38275146484375, -1.132568359375, -0.88238525390625, -0.6322021484375, -0.38201904296875, -0.1318359375, 0.11834716796875, 0.3685302734375, 0.61871337890625, 0.868896484375, 1.11907958984375, 1.3692626953125, 1.61944580078125, 1.86962890625, 2.11981201171875, 2.3699951171875, 2.62017822265625, 2.870361328125, 3.12054443359375, 3.3707275390625, 3.62091064453125, 3.87109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 22.0, 36.0, 58.0, 72.0, 116.0, 199.0, 173.0, 123.0, 64.0, 44.0, 26.0, 11.0, 13.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.56570053100586, -23.767024993896484, -22.968351364135742, -22.169675827026367, -21.371002197265625, -20.57232666015625, -19.773651123046875, -18.974977493286133, -18.176301956176758, -17.377626419067383, -16.57895278930664, -15.780277252197266, -14.981602668762207, -14.182928085327148, -13.38425350189209, -12.585578918457031, -11.786904335021973, -10.988229751586914, -10.189555168151855, -9.390880584716797, -8.592205047607422, -7.793530464172363, -6.994855880737305, -6.196180820465088, -5.397506237030029, -4.598831653594971, -3.800156593322754, -3.0014820098876953, -2.2028071880340576, -1.40413236618042, -0.6054577827453613, 0.19321727752685547, 0.9918918609619141, 1.7905666828155518, 2.5892415046691895, 3.387916088104248, 4.186591148376465, 4.985265731811523, 5.783940315246582, 6.582615375518799, 7.381289958953857, 8.179965019226074, 8.978639602661133, 9.777314186096191, 10.57598876953125, 11.374664306640625, 12.173337936401367, 12.972013473510742, 13.7706880569458, 14.56936264038086, 15.368037223815918, 16.166711807250977, 16.96538734436035, 17.764060974121094, 18.56273651123047, 19.361412048339844, 20.160085678100586, 20.95876121520996, 21.757434844970703, 22.556110382080078, 23.35478401184082, 24.153459548950195, 24.952133178710938, 25.750808715820312, 26.549484252929688]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 11.0, 12.0, 7.0, 13.0, 16.0, 14.0, 18.0, 23.0, 31.0, 24.0, 30.0, 25.0, 24.0, 41.0, 35.0, 38.0, 36.0, 29.0, 50.0, 34.0, 48.0, 43.0, 34.0, 36.0, 23.0, 29.0, 26.0, 32.0, 32.0, 25.0, 19.0, 22.0, 11.0, 16.0, 15.0, 14.0, 4.0, 12.0, 9.0, 5.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-8.252778053283691, -8.00320816040039, -7.75363826751709, -7.504068374633789, -7.254498481750488, -7.0049285888671875, -6.755358695983887, -6.505788326263428, -6.256218433380127, -6.006648540496826, -5.757078647613525, -5.507508754730225, -5.257938861846924, -5.008368492126465, -4.758798599243164, -4.509228706359863, -4.2596588134765625, -4.010088920593262, -3.760519027709961, -3.51094913482666, -3.2613790035247803, -3.0118091106414795, -2.7622392177581787, -2.512669086456299, -2.2630996704101562, -2.0135297775268555, -1.7639597654342651, -1.5143898725509644, -1.264819860458374, -1.0152499675750732, -0.7656800746917725, -0.5161100625991821, -0.2665400505065918, -0.016970112919807434, 0.23259982466697693, 0.4821697473526001, 0.7317396998405457, 0.9813096523284912, 1.230879545211792, 1.4804495573043823, 1.730019450187683, 1.9795893430709839, 2.229159355163574, 2.478729248046875, 2.728299140930176, 2.9778690338134766, 3.2274389266967773, 3.4770090579986572, 3.726578950881958, 3.976148843765259, 4.225718975067139, 4.4752888679504395, 4.72485876083374, 4.974428653717041, 5.223998546600342, 5.473568439483643, 5.723138332366943, 5.972708225250244, 6.222278118133545, 6.471848011016846, 6.7214179039001465, 6.9709882736206055, 7.220558166503906, 7.470128059387207, 7.719697952270508]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 14.0, 18.0, 30.0, 55.0, 58.0, 99.0, 171.0, 330.0, 608.0, 1389.0, 3408.0, 11301.0, 54135.0, 296777.0, 520699.0, 126087.0, 23497.0, 5847.0, 2086.0, 865.0, 477.0, 237.0, 129.0, 76.0, 47.0, 36.0, 20.0, 17.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.0625, -21.418212890625, -20.77392578125, -20.129638671875, -19.4853515625, -18.841064453125, -18.19677734375, -17.552490234375, -16.908203125, -16.263916015625, -15.61962890625, -14.975341796875, -14.3310546875, -13.686767578125, -13.04248046875, -12.398193359375, -11.75390625, -11.109619140625, -10.46533203125, -9.821044921875, -9.1767578125, -8.532470703125, -7.88818359375, -7.243896484375, -6.599609375, -5.955322265625, -5.31103515625, -4.666748046875, -4.0224609375, -3.378173828125, -2.73388671875, -2.089599609375, -1.4453125, -0.801025390625, -0.15673828125, 0.487548828125, 1.1318359375, 1.776123046875, 2.42041015625, 3.064697265625, 3.708984375, 4.353271484375, 4.99755859375, 5.641845703125, 6.2861328125, 6.930419921875, 7.57470703125, 8.218994140625, 8.86328125, 9.507568359375, 10.15185546875, 10.796142578125, 11.4404296875, 12.084716796875, 12.72900390625, 13.373291015625, 14.017578125, 14.661865234375, 15.30615234375, 15.950439453125, 16.5947265625, 17.239013671875, 17.88330078125, 18.527587890625, 19.171875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 9.0, 5.0, 9.0, 19.0, 35.0, 33.0, 53.0, 72.0, 89.0, 69.0, 108.0, 92.0, 96.0, 75.0, 81.0, 55.0, 37.0, 14.0, 18.0, 14.0, 8.0, 9.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.86083984375, -7.5576171875, -7.25439453125, -6.951171875, -6.64794921875, -6.3447265625, -6.04150390625, -5.73828125, -5.43505859375, -5.1318359375, -4.82861328125, -4.525390625, -4.22216796875, -3.9189453125, -3.61572265625, -3.3125, -3.00927734375, -2.7060546875, -2.40283203125, -2.099609375, -1.79638671875, -1.4931640625, -1.18994140625, -0.88671875, -0.58349609375, -0.2802734375, 0.02294921875, 0.326171875, 0.62939453125, 0.9326171875, 1.23583984375, 1.5390625, 1.84228515625, 2.1455078125, 2.44873046875, 2.751953125, 3.05517578125, 3.3583984375, 3.66162109375, 3.96484375, 4.26806640625, 4.5712890625, 4.87451171875, 5.177734375, 5.48095703125, 5.7841796875, 6.08740234375, 6.390625, 6.69384765625, 6.9970703125, 7.30029296875, 7.603515625, 7.90673828125, 8.2099609375, 8.51318359375, 8.81640625, 9.11962890625, 9.4228515625, 9.72607421875, 10.029296875, 10.33251953125, 10.6357421875, 10.93896484375, 11.2421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 13.0, 9.0, 15.0, 20.0, 48.0, 69.0, 110.0, 206.0, 440.0, 1180.0, 4682.0, 176166.0, 853914.0, 8768.0, 1656.0, 589.0, 276.0, 159.0, 91.0, 49.0, 27.0, 26.0, 17.0, 8.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.8125, -73.119140625, -70.42578125, -67.732421875, -65.0390625, -62.345703125, -59.65234375, -56.958984375, -54.265625, -51.572265625, -48.87890625, -46.185546875, -43.4921875, -40.798828125, -38.10546875, -35.412109375, -32.71875, -30.025390625, -27.33203125, -24.638671875, -21.9453125, -19.251953125, -16.55859375, -13.865234375, -11.171875, -8.478515625, -5.78515625, -3.091796875, -0.3984375, 2.294921875, 4.98828125, 7.681640625, 10.375, 13.068359375, 15.76171875, 18.455078125, 21.1484375, 23.841796875, 26.53515625, 29.228515625, 31.921875, 34.615234375, 37.30859375, 40.001953125, 42.6953125, 45.388671875, 48.08203125, 50.775390625, 53.46875, 56.162109375, 58.85546875, 61.548828125, 64.2421875, 66.935546875, 69.62890625, 72.322265625, 75.015625, 77.708984375, 80.40234375, 83.095703125, 85.7890625, 88.482421875, 91.17578125, 93.869140625, 96.5625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 14.0, 15.0, 23.0, 39.0, 35.0, 60.0, 82.0, 107.0, 105.0, 122.0, 97.0, 73.0, 71.0, 52.0, 25.0, 19.0, 12.0, 10.0, 2.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.625, -63.5029296875, -61.380859375, -59.2587890625, -57.13671875, -55.0146484375, -52.892578125, -50.7705078125, -48.6484375, -46.5263671875, -44.404296875, -42.2822265625, -40.16015625, -38.0380859375, -35.916015625, -33.7939453125, -31.671875, -29.5498046875, -27.427734375, -25.3056640625, -23.18359375, -21.0615234375, -18.939453125, -16.8173828125, -14.6953125, -12.5732421875, -10.451171875, -8.3291015625, -6.20703125, -4.0849609375, -1.962890625, 0.1591796875, 2.28125, 4.4033203125, 6.525390625, 8.6474609375, 10.76953125, 12.8916015625, 15.013671875, 17.1357421875, 19.2578125, 21.3798828125, 23.501953125, 25.6240234375, 27.74609375, 29.8681640625, 31.990234375, 34.1123046875, 36.234375, 38.3564453125, 40.478515625, 42.6005859375, 44.72265625, 46.8447265625, 48.966796875, 51.0888671875, 53.2109375, 55.3330078125, 57.455078125, 59.5771484375, 61.69921875, 63.8212890625, 65.943359375, 68.0654296875, 70.1875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 10.0, 11.0, 12.0, 19.0, 26.0, 39.0, 47.0, 82.0, 147.0, 262.0, 706.0, 7922.0, 1021597.0, 16037.0, 877.0, 300.0, 162.0, 96.0, 72.0, 27.0, 33.0, 21.0, 17.0, 16.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34375, -49.60791015625, -47.8720703125, -46.13623046875, -44.400390625, -42.66455078125, -40.9287109375, -39.19287109375, -37.45703125, -35.72119140625, -33.9853515625, -32.24951171875, -30.513671875, -28.77783203125, -27.0419921875, -25.30615234375, -23.5703125, -21.83447265625, -20.0986328125, -18.36279296875, -16.626953125, -14.89111328125, -13.1552734375, -11.41943359375, -9.68359375, -7.94775390625, -6.2119140625, -4.47607421875, -2.740234375, -1.00439453125, 0.7314453125, 2.46728515625, 4.203125, 5.93896484375, 7.6748046875, 9.41064453125, 11.146484375, 12.88232421875, 14.6181640625, 16.35400390625, 18.08984375, 19.82568359375, 21.5615234375, 23.29736328125, 25.033203125, 26.76904296875, 28.5048828125, 30.24072265625, 31.9765625, 33.71240234375, 35.4482421875, 37.18408203125, 38.919921875, 40.65576171875, 42.3916015625, 44.12744140625, 45.86328125, 47.59912109375, 49.3349609375, 51.07080078125, 52.806640625, 54.54248046875, 56.2783203125, 58.01416015625, 59.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 7.0, 11.0, 17.0, 7.0, 19.0, 30.0, 35.0, 46.0, 76.0, 115.0, 114.0, 118.0, 98.0, 64.0, 54.0, 36.0, 36.0, 24.0, 13.0, 14.0, 8.0, 7.0, 5.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0016698837280273438, -0.001623407006263733, -0.001576930284500122, -0.0015304535627365112, -0.0014839768409729004, -0.0014375001192092896, -0.0013910233974456787, -0.0013445466756820679, -0.001298069953918457, -0.0012515932321548462, -0.0012051165103912354, -0.0011586397886276245, -0.0011121630668640137, -0.0010656863451004028, -0.001019209623336792, -0.0009727329015731812, -0.0009262561798095703, -0.0008797794580459595, -0.0008333027362823486, -0.0007868260145187378, -0.000740349292755127, -0.0006938725709915161, -0.0006473958492279053, -0.0006009191274642944, -0.0005544424057006836, -0.0005079656839370728, -0.0004614889621734619, -0.0004150122404098511, -0.00036853551864624023, -0.0003220587968826294, -0.00027558207511901855, -0.00022910535335540771, -0.00018262863159179688, -0.00013615190982818604, -8.96751880645752e-05, -4.3198466300964355e-05, 3.2782554626464844e-06, 4.9754977226257324e-05, 9.623169898986816e-05, 0.000142708420753479, 0.00018918514251708984, 0.00023566186428070068, 0.0002821385860443115, 0.00032861530780792236, 0.0003750920295715332, 0.00042156875133514404, 0.0004680454730987549, 0.0005145221948623657, 0.0005609989166259766, 0.0006074756383895874, 0.0006539523601531982, 0.0007004290819168091, 0.0007469058036804199, 0.0007933825254440308, 0.0008398592472076416, 0.0008863359689712524, 0.0009328126907348633, 0.0009792894124984741, 0.001025766134262085, 0.0010722428560256958, 0.0011187195777893066, 0.0011651962995529175, 0.0012116730213165283, 0.0012581497430801392, 0.00130462646484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 10.0, 12.0, 12.0, 9.0, 30.0, 35.0, 54.0, 103.0, 189.0, 356.0, 932.0, 4847.0, 149219.0, 879976.0, 10188.0, 1599.0, 461.0, 207.0, 98.0, 72.0, 51.0, 15.0, 22.0, 16.0, 8.0, 9.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.732666015625, -43.59033203125, -42.447998046875, -41.3056640625, -40.163330078125, -39.02099609375, -37.878662109375, -36.736328125, -35.593994140625, -34.45166015625, -33.309326171875, -32.1669921875, -31.024658203125, -29.88232421875, -28.739990234375, -27.59765625, -26.455322265625, -25.31298828125, -24.170654296875, -23.0283203125, -21.885986328125, -20.74365234375, -19.601318359375, -18.458984375, -17.316650390625, -16.17431640625, -15.031982421875, -13.8896484375, -12.747314453125, -11.60498046875, -10.462646484375, -9.3203125, -8.177978515625, -7.03564453125, -5.893310546875, -4.7509765625, -3.608642578125, -2.46630859375, -1.323974609375, -0.181640625, 0.960693359375, 2.10302734375, 3.245361328125, 4.3876953125, 5.530029296875, 6.67236328125, 7.814697265625, 8.95703125, 10.099365234375, 11.24169921875, 12.384033203125, 13.5263671875, 14.668701171875, 15.81103515625, 16.953369140625, 18.095703125, 19.238037109375, 20.38037109375, 21.522705078125, 22.6650390625, 23.807373046875, 24.94970703125, 26.092041015625, 27.234375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 10.0, 4.0, 9.0, 5.0, 26.0, 51.0, 119.0, 177.0, 240.0, 170.0, 79.0, 37.0, 22.0, 10.0, 6.0, 5.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.8984375, -35.984375, -35.0703125, -34.15625, -33.2421875, -32.328125, -31.4140625, -30.5, -29.5859375, -28.671875, -27.7578125, -26.84375, -25.9296875, -25.015625, -24.1015625, -23.1875, -22.2734375, -21.359375, -20.4453125, -19.53125, -18.6171875, -17.703125, -16.7890625, -15.875, -14.9609375, -14.046875, -13.1328125, -12.21875, -11.3046875, -10.390625, -9.4765625, -8.5625, -7.6484375, -6.734375, -5.8203125, -4.90625, -3.9921875, -3.078125, -2.1640625, -1.25, -0.3359375, 0.578125, 1.4921875, 2.40625, 3.3203125, 4.234375, 5.1484375, 6.0625, 6.9765625, 7.890625, 8.8046875, 9.71875, 10.6328125, 11.546875, 12.4609375, 13.375, 14.2890625, 15.203125, 16.1171875, 17.03125, 17.9453125, 18.859375, 19.7734375, 20.6875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 19.0, 73.0, 231.0, 359.0, 219.0, 64.0, 17.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-643.5451049804688, -629.9508056640625, -616.3564453125, -602.7621459960938, -589.1677856445312, -575.573486328125, -561.9791259765625, -548.3848266601562, -534.79052734375, -521.1962280273438, -507.60186767578125, -494.0075378417969, -480.4132080078125, -466.81890869140625, -453.2245788574219, -439.6302490234375, -426.035888671875, -412.4415588378906, -398.84722900390625, -385.2528991699219, -371.6585693359375, -358.06427001953125, -344.4699401855469, -330.8756103515625, -317.2812805175781, -303.68695068359375, -290.0926208496094, -276.498291015625, -262.90399169921875, -249.3096466064453, -235.71533203125, -222.12100219726562, -208.52670288085938, -194.932373046875, -181.33804321289062, -167.7437286376953, -154.14939880371094, -140.55506896972656, -126.96074676513672, -113.36642456054688, -99.7720947265625, -86.17776489257812, -72.58344268798828, -58.98911666870117, -45.39479064941406, -31.800460815429688, -18.206138610839844, -4.61181640625, 8.982513427734375, 22.576839447021484, 36.171165466308594, 49.7654914855957, 63.35981750488281, 76.95414733886719, 90.54846954345703, 104.14279174804688, 117.73712158203125, 131.33145141601562, 144.92578125, 158.5200958251953, 172.1144256591797, 185.70875549316406, 199.30307006835938, 212.89739990234375, 226.49172973632812]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 5.0, 10.0, 16.0, 7.0, 13.0, 13.0, 18.0, 14.0, 26.0, 30.0, 41.0, 35.0, 44.0, 36.0, 50.0, 50.0, 43.0, 56.0, 45.0, 44.0, 45.0, 49.0, 39.0, 41.0, 42.0, 28.0, 25.0, 19.0, 11.0, 23.0, 16.0, 12.0, 15.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-125.21125030517578, -121.36190795898438, -117.51256561279297, -113.66322326660156, -109.81388092041016, -105.96453857421875, -102.11518859863281, -98.26585388183594, -94.41650390625, -90.5671615600586, -86.71781921386719, -82.86847686767578, -79.01913452148438, -75.16979217529297, -71.32044982910156, -67.47109985351562, -63.62176513671875, -59.772422790527344, -55.92308044433594, -52.07373809814453, -48.224395751953125, -44.37505340576172, -40.52570724487305, -36.67636489868164, -32.827022552490234, -28.977680206298828, -25.128337860107422, -21.278993606567383, -17.429651260375977, -13.58030891418457, -9.730964660644531, -5.881622314453125, -2.0322723388671875, 1.817070484161377, 5.666413307189941, 9.515756607055664, 13.36509895324707, 17.214441299438477, 21.063785552978516, 24.913127899169922, 28.762470245361328, 32.611812591552734, 36.46115493774414, 40.31050109863281, 44.15984344482422, 48.009185791015625, 51.85852813720703, 55.70787048339844, 59.557212829589844, 63.40655517578125, 67.25589752197266, 71.10523986816406, 74.95458221435547, 78.80392456054688, 82.65327453613281, 86.50260925292969, 90.35195922851562, 94.20130157470703, 98.05064392089844, 101.89998626708984, 105.74932861328125, 109.59867095947266, 113.44801330566406, 117.29736328125, 121.14669799804688]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 11.0, 19.0, 49.0, 90.0, 161.0, 370.0, 967.0, 3169.0, 19725.0, 4001239.0, 157140.0, 8285.0, 1820.0, 674.0, 256.0, 123.0, 69.0, 38.0, 25.0, 13.0, 9.0, 9.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.555908203125, -25.43994140625, -24.323974609375, -23.2080078125, -22.092041015625, -20.97607421875, -19.860107421875, -18.744140625, -17.628173828125, -16.51220703125, -15.396240234375, -14.2802734375, -13.164306640625, -12.04833984375, -10.932373046875, -9.81640625, -8.700439453125, -7.58447265625, -6.468505859375, -5.3525390625, -4.236572265625, -3.12060546875, -2.004638671875, -0.888671875, 0.227294921875, 1.34326171875, 2.459228515625, 3.5751953125, 4.691162109375, 5.80712890625, 6.923095703125, 8.0390625, 9.155029296875, 10.27099609375, 11.386962890625, 12.5029296875, 13.618896484375, 14.73486328125, 15.850830078125, 16.966796875, 18.082763671875, 19.19873046875, 20.314697265625, 21.4306640625, 22.546630859375, 23.66259765625, 24.778564453125, 25.89453125, 27.010498046875, 28.12646484375, 29.242431640625, 30.3583984375, 31.474365234375, 32.59033203125, 33.706298828125, 34.822265625, 35.938232421875, 37.05419921875, 38.170166015625, 39.2861328125, 40.402099609375, 41.51806640625, 42.634033203125, 43.75]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 12.0, 21.0, 28.0, 34.0, 48.0, 51.0, 55.0, 92.0, 98.0, 85.0, 90.0, 83.0, 80.0, 70.0, 41.0, 30.0, 16.0, 9.0, 14.0, 4.0, 8.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.5694580078125, -7.271728515625, -6.9739990234375, -6.67626953125, -6.3785400390625, -6.080810546875, -5.7830810546875, -5.4853515625, -5.1876220703125, -4.889892578125, -4.5921630859375, -4.29443359375, -3.9967041015625, -3.698974609375, -3.4012451171875, -3.103515625, -2.8057861328125, -2.508056640625, -2.2103271484375, -1.91259765625, -1.6148681640625, -1.317138671875, -1.0194091796875, -0.7216796875, -0.4239501953125, -0.126220703125, 0.1715087890625, 0.46923828125, 0.7669677734375, 1.064697265625, 1.3624267578125, 1.66015625, 1.9578857421875, 2.255615234375, 2.5533447265625, 2.85107421875, 3.1488037109375, 3.446533203125, 3.7442626953125, 4.0419921875, 4.3397216796875, 4.637451171875, 4.9351806640625, 5.23291015625, 5.5306396484375, 5.828369140625, 6.1260986328125, 6.423828125, 6.7215576171875, 7.019287109375, 7.3170166015625, 7.61474609375, 7.9124755859375, 8.210205078125, 8.5079345703125, 8.8056640625, 9.1033935546875, 9.401123046875, 9.6988525390625, 9.99658203125, 10.2943115234375, 10.592041015625, 10.8897705078125, 11.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 10.0, 7.0, 8.0, 17.0, 23.0, 37.0, 36.0, 55.0, 73.0, 106.0, 142.0, 190.0, 305.0, 574.0, 1507.0, 5560.0, 42947.0, 4076205.0, 56760.0, 6483.0, 1616.0, 604.0, 293.0, 189.0, 145.0, 99.0, 80.0, 52.0, 34.0, 33.0, 24.0, 22.0, 10.0, 11.0, 9.0, 3.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.59375, -31.650146484375, -30.70654296875, -29.762939453125, -28.8193359375, -27.875732421875, -26.93212890625, -25.988525390625, -25.044921875, -24.101318359375, -23.15771484375, -22.214111328125, -21.2705078125, -20.326904296875, -19.38330078125, -18.439697265625, -17.49609375, -16.552490234375, -15.60888671875, -14.665283203125, -13.7216796875, -12.778076171875, -11.83447265625, -10.890869140625, -9.947265625, -9.003662109375, -8.06005859375, -7.116455078125, -6.1728515625, -5.229248046875, -4.28564453125, -3.342041015625, -2.3984375, -1.454833984375, -0.51123046875, 0.432373046875, 1.3759765625, 2.319580078125, 3.26318359375, 4.206787109375, 5.150390625, 6.093994140625, 7.03759765625, 7.981201171875, 8.9248046875, 9.868408203125, 10.81201171875, 11.755615234375, 12.69921875, 13.642822265625, 14.58642578125, 15.530029296875, 16.4736328125, 17.417236328125, 18.36083984375, 19.304443359375, 20.248046875, 21.191650390625, 22.13525390625, 23.078857421875, 24.0224609375, 24.966064453125, 25.90966796875, 26.853271484375, 27.796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 12.0, 10.0, 13.0, 24.0, 42.0, 149.0, 2008.0, 1551.0, 152.0, 51.0, 30.0, 10.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.61376953125, -9.2822265625, -8.95068359375, -8.619140625, -8.28759765625, -7.9560546875, -7.62451171875, -7.29296875, -6.96142578125, -6.6298828125, -6.29833984375, -5.966796875, -5.63525390625, -5.3037109375, -4.97216796875, -4.640625, -4.30908203125, -3.9775390625, -3.64599609375, -3.314453125, -2.98291015625, -2.6513671875, -2.31982421875, -1.98828125, -1.65673828125, -1.3251953125, -0.99365234375, -0.662109375, -0.33056640625, 0.0009765625, 0.33251953125, 0.6640625, 0.99560546875, 1.3271484375, 1.65869140625, 1.990234375, 2.32177734375, 2.6533203125, 2.98486328125, 3.31640625, 3.64794921875, 3.9794921875, 4.31103515625, 4.642578125, 4.97412109375, 5.3056640625, 5.63720703125, 5.96875, 6.30029296875, 6.6318359375, 6.96337890625, 7.294921875, 7.62646484375, 7.9580078125, 8.28955078125, 8.62109375, 8.95263671875, 9.2841796875, 9.61572265625, 9.947265625, 10.27880859375, 10.6103515625, 10.94189453125, 11.2734375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 9.0, 13.0, 25.0, 40.0, 84.0, 143.0, 195.0, 192.0, 126.0, 69.0, 39.0, 28.0, 12.0, 10.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.317665100097656, -45.959861755371094, -44.602054595947266, -43.2442512512207, -41.886444091796875, -40.52864074707031, -39.170833587646484, -37.81303024291992, -36.455223083496094, -35.09741973876953, -33.7396125793457, -32.38180923461914, -31.024002075195312, -29.666196823120117, -28.308391571044922, -26.95058822631836, -25.592782974243164, -24.23497772216797, -22.877172470092773, -21.519367218017578, -20.161561965942383, -18.803756713867188, -17.445953369140625, -16.088146209716797, -14.730341911315918, -13.372536659240723, -12.014731407165527, -10.656927108764648, -9.299121856689453, -7.9413161277771, -6.5835113525390625, -5.225706100463867, -3.867900848388672, -2.5100955963134766, -1.1522905826568604, 0.20551443099975586, 1.5633196830749512, 2.9211249351501465, 4.278929710388184, 5.636734962463379, 6.994540214538574, 8.35234546661377, 9.710150718688965, 11.067955017089844, 12.425760269165039, 13.783565521240234, 15.14137077331543, 16.499176025390625, 17.85698127746582, 19.214786529541016, 20.57259178161621, 21.930397033691406, 23.2882022857666, 24.646007537841797, 26.00381088256836, 27.361618041992188, 28.71942138671875, 30.077226638793945, 31.43503189086914, 32.7928352355957, 34.15064239501953, 35.508445739746094, 36.86625289916992, 38.224056243896484, 39.58186340332031]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 5.0, 8.0, 10.0, 18.0, 16.0, 28.0, 22.0, 26.0, 33.0, 40.0, 40.0, 45.0, 57.0, 62.0, 61.0, 51.0, 54.0, 46.0, 58.0, 40.0, 44.0, 29.0, 26.0, 36.0, 27.0, 19.0, 14.0, 29.0, 6.0, 5.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.488224029541016, -15.883613586425781, -15.279003143310547, -14.674392700195312, -14.069781303405762, -13.465170860290527, -12.860560417175293, -12.255949020385742, -11.651338577270508, -11.046728134155273, -10.442117691040039, -9.837507247924805, -9.232895851135254, -8.62828540802002, -8.023674964904785, -7.419064044952393, -6.814454078674316, -6.209843635559082, -5.6052327156066895, -5.000622272491455, -4.3960113525390625, -3.791400909423828, -3.1867904663085938, -2.582179546356201, -1.9775691032409668, -1.3729584217071533, -0.7683478593826294, -0.16373729705810547, 0.440873384475708, 1.0454840660095215, 1.6500945091247559, 2.2547054290771484, 2.859315872192383, 3.4639265537261963, 4.06853723526001, 4.673147678375244, 5.277758598327637, 5.882369041442871, 6.4869794845581055, 7.091590404510498, 7.696200847625732, 8.300811767578125, 8.90542221069336, 9.510032653808594, 10.114643096923828, 10.719253540039062, 11.323863983154297, 11.928475379943848, 12.533085823059082, 13.137696266174316, 13.74230670928955, 14.346918106079102, 14.951528549194336, 15.55613899230957, 16.160749435424805, 16.76535987854004, 17.369970321655273, 17.974580764770508, 18.579191207885742, 19.183801651000977, 19.78841209411621, 20.393024444580078, 20.997634887695312, 21.602245330810547, 22.20685577392578]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 10.0, 9.0, 20.0, 26.0, 52.0, 76.0, 110.0, 247.0, 532.0, 1228.0, 3895.0, 15979.0, 103154.0, 620606.0, 257729.0, 34396.0, 6892.0, 2089.0, 737.0, 354.0, 147.0, 101.0, 54.0, 40.0, 21.0, 10.0, 3.0, 12.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.75, -32.80517578125, -31.8603515625, -30.91552734375, -29.970703125, -29.02587890625, -28.0810546875, -27.13623046875, -26.19140625, -25.24658203125, -24.3017578125, -23.35693359375, -22.412109375, -21.46728515625, -20.5224609375, -19.57763671875, -18.6328125, -17.68798828125, -16.7431640625, -15.79833984375, -14.853515625, -13.90869140625, -12.9638671875, -12.01904296875, -11.07421875, -10.12939453125, -9.1845703125, -8.23974609375, -7.294921875, -6.35009765625, -5.4052734375, -4.46044921875, -3.515625, -2.57080078125, -1.6259765625, -0.68115234375, 0.263671875, 1.20849609375, 2.1533203125, 3.09814453125, 4.04296875, 4.98779296875, 5.9326171875, 6.87744140625, 7.822265625, 8.76708984375, 9.7119140625, 10.65673828125, 11.6015625, 12.54638671875, 13.4912109375, 14.43603515625, 15.380859375, 16.32568359375, 17.2705078125, 18.21533203125, 19.16015625, 20.10498046875, 21.0498046875, 21.99462890625, 22.939453125, 23.88427734375, 24.8291015625, 25.77392578125, 26.71875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 12.0, 18.0, 23.0, 22.0, 30.0, 36.0, 46.0, 49.0, 69.0, 86.0, 78.0, 83.0, 84.0, 69.0, 72.0, 49.0, 42.0, 33.0, 23.0, 15.0, 12.0, 9.0, 10.0, 6.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.1937255859375, -5.926513671875, -5.6593017578125, -5.39208984375, -5.1248779296875, -4.857666015625, -4.5904541015625, -4.3232421875, -4.0560302734375, -3.788818359375, -3.5216064453125, -3.25439453125, -2.9871826171875, -2.719970703125, -2.4527587890625, -2.185546875, -1.9183349609375, -1.651123046875, -1.3839111328125, -1.11669921875, -0.8494873046875, -0.582275390625, -0.3150634765625, -0.0478515625, 0.2193603515625, 0.486572265625, 0.7537841796875, 1.02099609375, 1.2882080078125, 1.555419921875, 1.8226318359375, 2.08984375, 2.3570556640625, 2.624267578125, 2.8914794921875, 3.15869140625, 3.4259033203125, 3.693115234375, 3.9603271484375, 4.2275390625, 4.4947509765625, 4.761962890625, 5.0291748046875, 5.29638671875, 5.5635986328125, 5.830810546875, 6.0980224609375, 6.365234375, 6.6324462890625, 6.899658203125, 7.1668701171875, 7.43408203125, 7.7012939453125, 7.968505859375, 8.2357177734375, 8.5029296875, 8.7701416015625, 9.037353515625, 9.3045654296875, 9.57177734375, 9.8389892578125, 10.106201171875, 10.3734130859375, 10.640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 8.0, 12.0, 14.0, 24.0, 25.0, 39.0, 59.0, 88.0, 116.0, 245.0, 441.0, 1190.0, 5618.0, 124900.0, 895564.0, 16590.0, 2186.0, 660.0, 304.0, 160.0, 77.0, 63.0, 25.0, 30.0, 37.0, 17.0, 6.0, 12.0, 7.0, 5.0, 2.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-78.75, -76.228515625, -73.70703125, -71.185546875, -68.6640625, -66.142578125, -63.62109375, -61.099609375, -58.578125, -56.056640625, -53.53515625, -51.013671875, -48.4921875, -45.970703125, -43.44921875, -40.927734375, -38.40625, -35.884765625, -33.36328125, -30.841796875, -28.3203125, -25.798828125, -23.27734375, -20.755859375, -18.234375, -15.712890625, -13.19140625, -10.669921875, -8.1484375, -5.626953125, -3.10546875, -0.583984375, 1.9375, 4.458984375, 6.98046875, 9.501953125, 12.0234375, 14.544921875, 17.06640625, 19.587890625, 22.109375, 24.630859375, 27.15234375, 29.673828125, 32.1953125, 34.716796875, 37.23828125, 39.759765625, 42.28125, 44.802734375, 47.32421875, 49.845703125, 52.3671875, 54.888671875, 57.41015625, 59.931640625, 62.453125, 64.974609375, 67.49609375, 70.017578125, 72.5390625, 75.060546875, 77.58203125, 80.103515625, 82.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 8.0, 5.0, 9.0, 24.0, 39.0, 36.0, 47.0, 58.0, 86.0, 74.0, 83.0, 76.0, 82.0, 89.0, 70.0, 60.0, 35.0, 34.0, 22.0, 11.0, 11.0, 2.0, 6.0, 6.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.5625, -41.0576171875, -39.552734375, -38.0478515625, -36.54296875, -35.0380859375, -33.533203125, -32.0283203125, -30.5234375, -29.0185546875, -27.513671875, -26.0087890625, -24.50390625, -22.9990234375, -21.494140625, -19.9892578125, -18.484375, -16.9794921875, -15.474609375, -13.9697265625, -12.46484375, -10.9599609375, -9.455078125, -7.9501953125, -6.4453125, -4.9404296875, -3.435546875, -1.9306640625, -0.42578125, 1.0791015625, 2.583984375, 4.0888671875, 5.59375, 7.0986328125, 8.603515625, 10.1083984375, 11.61328125, 13.1181640625, 14.623046875, 16.1279296875, 17.6328125, 19.1376953125, 20.642578125, 22.1474609375, 23.65234375, 25.1572265625, 26.662109375, 28.1669921875, 29.671875, 31.1767578125, 32.681640625, 34.1865234375, 35.69140625, 37.1962890625, 38.701171875, 40.2060546875, 41.7109375, 43.2158203125, 44.720703125, 46.2255859375, 47.73046875, 49.2353515625, 50.740234375, 52.2451171875, 53.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 7.0, 10.0, 4.0, 6.0, 11.0, 13.0, 20.0, 20.0, 27.0, 32.0, 44.0, 62.0, 72.0, 139.0, 180.0, 304.0, 538.0, 1141.0, 3036.0, 10006.0, 62971.0, 774348.0, 169494.0, 18137.0, 4551.0, 1565.0, 741.0, 355.0, 227.0, 133.0, 102.0, 73.0, 43.0, 25.0, 25.0, 21.0, 10.0, 13.0, 16.0, 14.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-13.7421875, -13.32177734375, -12.9013671875, -12.48095703125, -12.060546875, -11.64013671875, -11.2197265625, -10.79931640625, -10.37890625, -9.95849609375, -9.5380859375, -9.11767578125, -8.697265625, -8.27685546875, -7.8564453125, -7.43603515625, -7.015625, -6.59521484375, -6.1748046875, -5.75439453125, -5.333984375, -4.91357421875, -4.4931640625, -4.07275390625, -3.65234375, -3.23193359375, -2.8115234375, -2.39111328125, -1.970703125, -1.55029296875, -1.1298828125, -0.70947265625, -0.2890625, 0.13134765625, 0.5517578125, 0.97216796875, 1.392578125, 1.81298828125, 2.2333984375, 2.65380859375, 3.07421875, 3.49462890625, 3.9150390625, 4.33544921875, 4.755859375, 5.17626953125, 5.5966796875, 6.01708984375, 6.4375, 6.85791015625, 7.2783203125, 7.69873046875, 8.119140625, 8.53955078125, 8.9599609375, 9.38037109375, 9.80078125, 10.22119140625, 10.6416015625, 11.06201171875, 11.482421875, 11.90283203125, 12.3232421875, 12.74365234375, 13.1640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 6.0, 5.0, 6.0, 10.0, 24.0, 29.0, 30.0, 56.0, 77.0, 128.0, 259.0, 129.0, 79.0, 56.0, 27.0, 23.0, 10.0, 7.0, 12.0, 8.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022411346435546875, -0.0021535754203796387, -0.00206601619720459, -0.001978456974029541, -0.0018908977508544922, -0.0018033385276794434, -0.0017157793045043945, -0.0016282200813293457, -0.0015406608581542969, -0.001453101634979248, -0.0013655424118041992, -0.0012779831886291504, -0.0011904239654541016, -0.0011028647422790527, -0.001015305519104004, -0.0009277462959289551, -0.0008401870727539062, -0.0007526278495788574, -0.0006650686264038086, -0.0005775094032287598, -0.0004899501800537109, -0.0004023909568786621, -0.0003148317337036133, -0.00022727251052856445, -0.00013971328735351562, -5.21540641784668e-05, 3.540515899658203e-05, 0.00012296438217163086, 0.0002105236053466797, 0.0002980828285217285, 0.00038564205169677734, 0.00047320127487182617, 0.000560760498046875, 0.0006483197212219238, 0.0007358789443969727, 0.0008234381675720215, 0.0009109973907470703, 0.0009985566139221191, 0.001086115837097168, 0.0011736750602722168, 0.0012612342834472656, 0.0013487935066223145, 0.0014363527297973633, 0.0015239119529724121, 0.001611471176147461, 0.0016990303993225098, 0.0017865896224975586, 0.0018741488456726074, 0.0019617080688476562, 0.002049267292022705, 0.002136826515197754, 0.0022243857383728027, 0.0023119449615478516, 0.0023995041847229004, 0.0024870634078979492, 0.002574622631072998, 0.002662181854248047, 0.0027497410774230957, 0.0028373003005981445, 0.0029248595237731934, 0.003012418746948242, 0.003099977970123291, 0.00318753719329834, 0.0032750964164733887, 0.0033626556396484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 14.0, 13.0, 28.0, 30.0, 43.0, 62.0, 90.0, 183.0, 253.0, 446.0, 1108.0, 3742.0, 25355.0, 704943.0, 293368.0, 14258.0, 2654.0, 893.0, 422.0, 202.0, 141.0, 98.0, 46.0, 39.0, 24.0, 23.0, 22.0, 15.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.806640625, -19.26953125, -18.732421875, -18.1953125, -17.658203125, -17.12109375, -16.583984375, -16.046875, -15.509765625, -14.97265625, -14.435546875, -13.8984375, -13.361328125, -12.82421875, -12.287109375, -11.75, -11.212890625, -10.67578125, -10.138671875, -9.6015625, -9.064453125, -8.52734375, -7.990234375, -7.453125, -6.916015625, -6.37890625, -5.841796875, -5.3046875, -4.767578125, -4.23046875, -3.693359375, -3.15625, -2.619140625, -2.08203125, -1.544921875, -1.0078125, -0.470703125, 0.06640625, 0.603515625, 1.140625, 1.677734375, 2.21484375, 2.751953125, 3.2890625, 3.826171875, 4.36328125, 4.900390625, 5.4375, 5.974609375, 6.51171875, 7.048828125, 7.5859375, 8.123046875, 8.66015625, 9.197265625, 9.734375, 10.271484375, 10.80859375, 11.345703125, 11.8828125, 12.419921875, 12.95703125, 13.494140625, 14.03125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 6.0, 10.0, 15.0, 20.0, 33.0, 51.0, 83.0, 95.0, 143.0, 165.0, 108.0, 76.0, 52.0, 54.0, 17.0, 13.0, 12.0, 8.0, 5.0, 2.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2734375, -13.7987060546875, -13.323974609375, -12.8492431640625, -12.37451171875, -11.8997802734375, -11.425048828125, -10.9503173828125, -10.4755859375, -10.0008544921875, -9.526123046875, -9.0513916015625, -8.57666015625, -8.1019287109375, -7.627197265625, -7.1524658203125, -6.677734375, -6.2030029296875, -5.728271484375, -5.2535400390625, -4.77880859375, -4.3040771484375, -3.829345703125, -3.3546142578125, -2.8798828125, -2.4051513671875, -1.930419921875, -1.4556884765625, -0.98095703125, -0.5062255859375, -0.031494140625, 0.4432373046875, 0.91796875, 1.3927001953125, 1.867431640625, 2.3421630859375, 2.81689453125, 3.2916259765625, 3.766357421875, 4.2410888671875, 4.7158203125, 5.1905517578125, 5.665283203125, 6.1400146484375, 6.61474609375, 7.0894775390625, 7.564208984375, 8.0389404296875, 8.513671875, 8.9884033203125, 9.463134765625, 9.9378662109375, 10.41259765625, 10.8873291015625, 11.362060546875, 11.8367919921875, 12.3115234375, 12.7862548828125, 13.260986328125, 13.7357177734375, 14.21044921875, 14.6851806640625, 15.159912109375, 15.6346435546875, 16.109375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 10.0, 46.0, 241.0, 384.0, 241.0, 57.0, 12.0, 14.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-919.341064453125, -900.3383178710938, -881.3356323242188, -862.3328857421875, -843.3302001953125, -824.3274536132812, -805.3247680664062, -786.322021484375, -767.3193359375, -748.3165893554688, -729.3139038085938, -710.3111572265625, -691.3084716796875, -672.3057250976562, -653.3030395507812, -634.30029296875, -615.2975463867188, -596.2947998046875, -577.2921142578125, -558.2893676757812, -539.2866821289062, -520.283935546875, -501.2812194824219, -482.27850341796875, -463.2757873535156, -444.2730712890625, -425.2703552246094, -406.26763916015625, -387.264892578125, -368.26220703125, -349.25946044921875, -330.2567443847656, -311.2539978027344, -292.25128173828125, -273.2485656738281, -254.24583435058594, -235.2431182861328, -216.2404022216797, -197.2376708984375, -178.23495483398438, -159.23223876953125, -140.22952270507812, -121.22679901123047, -102.22407531738281, -83.22135925292969, -64.21864318847656, -45.215919494628906, -26.21319580078125, -7.210479736328125, 11.792240142822266, 30.794960021972656, 49.79767990112305, 68.80039978027344, 87.80311584472656, 106.80583953857422, 125.80856323242188, 144.811279296875, 163.81399536132812, 182.81671142578125, 201.81944274902344, 220.82215881347656, 239.8248748779297, 258.8276062011719, 277.830322265625, 296.8330383300781]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 9.0, 9.0, 13.0, 14.0, 9.0, 27.0, 18.0, 29.0, 39.0, 35.0, 50.0, 49.0, 62.0, 58.0, 62.0, 56.0, 53.0, 57.0, 36.0, 40.0, 38.0, 33.0, 36.0, 29.0, 22.0, 23.0, 13.0, 10.0, 11.0, 12.0, 4.0, 11.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.1280517578125, -136.09954833984375, -132.07106018066406, -128.04257202148438, -124.01406860351562, -119.9855728149414, -115.95707702636719, -111.92858123779297, -107.90008544921875, -103.87158966064453, -99.84309387207031, -95.8145980834961, -91.78610229492188, -87.75760650634766, -83.72911071777344, -79.70061492919922, -75.672119140625, -71.64362335205078, -67.61512756347656, -63.586631774902344, -59.558135986328125, -55.529640197753906, -51.50114440917969, -47.47264862060547, -43.44415283203125, -39.41565704345703, -35.38716125488281, -31.358665466308594, -27.330169677734375, -23.301673889160156, -19.273178100585938, -15.244682312011719, -11.216201782226562, -7.187705993652344, -3.159210205078125, 0.8692855834960938, 4.8977813720703125, 8.926277160644531, 12.95477294921875, 16.98326873779297, 21.011764526367188, 25.040260314941406, 29.068756103515625, 33.097251892089844, 37.12574768066406, 41.15424346923828, 45.1827392578125, 49.21123504638672, 53.23973083496094, 57.268226623535156, 61.296722412109375, 65.3252182006836, 69.35371398925781, 73.38220977783203, 77.41070556640625, 81.43920135498047, 85.46769714355469, 89.4961929321289, 93.52468872070312, 97.55318450927734, 101.58168029785156, 105.61017608642578, 109.638671875, 113.66716766357422, 117.69566345214844]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 4.0, 4.0, 7.0, 12.0, 18.0, 22.0, 39.0, 70.0, 113.0, 259.0, 469.0, 1166.0, 2684.0, 7762.0, 32221.0, 647965.0, 3417028.0, 65764.0, 12251.0, 3789.0, 1427.0, 615.0, 276.0, 136.0, 77.0, 33.0, 26.0, 13.0, 9.0, 11.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-27.421875, -26.755859375, -26.08984375, -25.423828125, -24.7578125, -24.091796875, -23.42578125, -22.759765625, -22.09375, -21.427734375, -20.76171875, -20.095703125, -19.4296875, -18.763671875, -18.09765625, -17.431640625, -16.765625, -16.099609375, -15.43359375, -14.767578125, -14.1015625, -13.435546875, -12.76953125, -12.103515625, -11.4375, -10.771484375, -10.10546875, -9.439453125, -8.7734375, -8.107421875, -7.44140625, -6.775390625, -6.109375, -5.443359375, -4.77734375, -4.111328125, -3.4453125, -2.779296875, -2.11328125, -1.447265625, -0.78125, -0.115234375, 0.55078125, 1.216796875, 1.8828125, 2.548828125, 3.21484375, 3.880859375, 4.546875, 5.212890625, 5.87890625, 6.544921875, 7.2109375, 7.876953125, 8.54296875, 9.208984375, 9.875, 10.541015625, 11.20703125, 11.873046875, 12.5390625, 13.205078125, 13.87109375, 14.537109375, 15.203125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 16.0, 16.0, 31.0, 49.0, 57.0, 87.0, 92.0, 101.0, 133.0, 100.0, 87.0, 82.0, 47.0, 31.0, 17.0, 16.0, 4.0, 11.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.98486328125, -9.6416015625, -9.29833984375, -8.955078125, -8.61181640625, -8.2685546875, -7.92529296875, -7.58203125, -7.23876953125, -6.8955078125, -6.55224609375, -6.208984375, -5.86572265625, -5.5224609375, -5.17919921875, -4.8359375, -4.49267578125, -4.1494140625, -3.80615234375, -3.462890625, -3.11962890625, -2.7763671875, -2.43310546875, -2.08984375, -1.74658203125, -1.4033203125, -1.06005859375, -0.716796875, -0.37353515625, -0.0302734375, 0.31298828125, 0.65625, 0.99951171875, 1.3427734375, 1.68603515625, 2.029296875, 2.37255859375, 2.7158203125, 3.05908203125, 3.40234375, 3.74560546875, 4.0888671875, 4.43212890625, 4.775390625, 5.11865234375, 5.4619140625, 5.80517578125, 6.1484375, 6.49169921875, 6.8349609375, 7.17822265625, 7.521484375, 7.86474609375, 8.2080078125, 8.55126953125, 8.89453125, 9.23779296875, 9.5810546875, 9.92431640625, 10.267578125, 10.61083984375, 10.9541015625, 11.29736328125, 11.640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 11.0, 13.0, 15.0, 41.0, 79.0, 107.0, 196.0, 401.0, 918.0, 2791.0, 11505.0, 84784.0, 3812708.0, 253258.0, 21226.0, 4150.0, 1226.0, 421.0, 182.0, 94.0, 56.0, 24.0, 25.0, 10.0, 3.0, 4.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.34375, -18.52685546875, -17.7099609375, -16.89306640625, -16.076171875, -15.25927734375, -14.4423828125, -13.62548828125, -12.80859375, -11.99169921875, -11.1748046875, -10.35791015625, -9.541015625, -8.72412109375, -7.9072265625, -7.09033203125, -6.2734375, -5.45654296875, -4.6396484375, -3.82275390625, -3.005859375, -2.18896484375, -1.3720703125, -0.55517578125, 0.26171875, 1.07861328125, 1.8955078125, 2.71240234375, 3.529296875, 4.34619140625, 5.1630859375, 5.97998046875, 6.796875, 7.61376953125, 8.4306640625, 9.24755859375, 10.064453125, 10.88134765625, 11.6982421875, 12.51513671875, 13.33203125, 14.14892578125, 14.9658203125, 15.78271484375, 16.599609375, 17.41650390625, 18.2333984375, 19.05029296875, 19.8671875, 20.68408203125, 21.5009765625, 22.31787109375, 23.134765625, 23.95166015625, 24.7685546875, 25.58544921875, 26.40234375, 27.21923828125, 28.0361328125, 28.85302734375, 29.669921875, 30.48681640625, 31.3037109375, 32.12060546875, 32.9375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 19.0, 19.0, 23.0, 21.0, 45.0, 76.0, 109.0, 317.0, 1069.0, 1508.0, 479.0, 162.0, 69.0, 57.0, 27.0, 21.0, 19.0, 8.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.234375, -29.5350341796875, -28.835693359375, -28.1363525390625, -27.43701171875, -26.7376708984375, -26.038330078125, -25.3389892578125, -24.6396484375, -23.9403076171875, -23.240966796875, -22.5416259765625, -21.84228515625, -21.1429443359375, -20.443603515625, -19.7442626953125, -19.044921875, -18.3455810546875, -17.646240234375, -16.9468994140625, -16.24755859375, -15.5482177734375, -14.848876953125, -14.1495361328125, -13.4501953125, -12.7508544921875, -12.051513671875, -11.3521728515625, -10.65283203125, -9.9534912109375, -9.254150390625, -8.5548095703125, -7.85546875, -7.1561279296875, -6.456787109375, -5.7574462890625, -5.05810546875, -4.3587646484375, -3.659423828125, -2.9600830078125, -2.2607421875, -1.5614013671875, -0.862060546875, -0.1627197265625, 0.53662109375, 1.2359619140625, 1.935302734375, 2.6346435546875, 3.333984375, 4.0333251953125, 4.732666015625, 5.4320068359375, 6.13134765625, 6.8306884765625, 7.530029296875, 8.2293701171875, 8.9287109375, 9.6280517578125, 10.327392578125, 11.0267333984375, 11.72607421875, 12.4254150390625, 13.124755859375, 13.8240966796875, 14.5234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 11.0, 15.0, 20.0, 52.0, 99.0, 144.0, 171.0, 175.0, 137.0, 69.0, 45.0, 16.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.33547973632812, -142.62643432617188, -137.9174041748047, -133.20835876464844, -128.49932861328125, -123.790283203125, -119.08123779296875, -114.37220001220703, -109.66316223144531, -104.9541244506836, -100.24508666992188, -95.53604125976562, -90.8270034790039, -86.11796569824219, -81.40892028808594, -76.69988250732422, -71.9908447265625, -67.28180694580078, -62.5727653503418, -57.86372375488281, -53.154685974121094, -48.445648193359375, -43.73660659790039, -39.027565002441406, -34.31852722167969, -29.609487533569336, -24.900447845458984, -20.191408157348633, -15.482368469238281, -10.77332878112793, -6.064289093017578, -1.3552474975585938, 3.353790283203125, 8.062829971313477, 12.771869659423828, 17.48090934753418, 22.18994903564453, 26.898988723754883, 31.608028411865234, 36.31707000732422, 41.02610778808594, 45.735145568847656, 50.44418716430664, 55.153228759765625, 59.862266540527344, 64.57130432128906, 69.28034973144531, 73.98938751220703, 78.69842529296875, 83.40746307373047, 88.11650085449219, 92.82554626464844, 97.53458404541016, 102.24362182617188, 106.95266723632812, 111.66170501708984, 116.37074279785156, 121.07978057861328, 125.788818359375, 130.49786376953125, 135.2069091796875, 139.9159393310547, 144.62498474121094, 149.33401489257812, 154.04306030273438]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 11.0, 16.0, 12.0, 22.0, 22.0, 23.0, 31.0, 43.0, 43.0, 41.0, 45.0, 54.0, 49.0, 57.0, 62.0, 49.0, 59.0, 57.0, 43.0, 40.0, 41.0, 41.0, 28.0, 22.0, 25.0, 22.0, 7.0, 8.0, 9.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.73100280761719, -65.34998321533203, -62.96896743774414, -60.587947845458984, -58.206932067871094, -55.82591247558594, -53.44489288330078, -51.063873291015625, -48.682857513427734, -46.30183792114258, -43.92082214355469, -41.53980255126953, -39.158782958984375, -36.777767181396484, -34.39674758911133, -32.01573181152344, -29.63471221923828, -27.253694534301758, -24.872676849365234, -22.491657257080078, -20.110639572143555, -17.72962188720703, -15.348603248596191, -12.967584609985352, -10.586566925048828, -8.205549240112305, -5.824530601501465, -3.443512439727783, -1.0624942779541016, 1.3185234069824219, 3.6995420455932617, 6.080560684204102, 8.461585998535156, 10.84260368347168, 13.22362232208252, 15.60464096069336, 17.985658645629883, 20.366676330566406, 22.747695922851562, 25.128713607788086, 27.50973129272461, 29.890748977661133, 32.271766662597656, 34.65278625488281, 37.03380584716797, 39.41482162475586, 41.795841217041016, 44.176856994628906, 46.55787658691406, 48.93889617919922, 51.31991195678711, 53.700931549072266, 56.081947326660156, 58.46296691894531, 60.84398651123047, 63.225006103515625, 65.60601806640625, 67.9870376586914, 70.36805725097656, 72.74906921386719, 75.13008880615234, 77.5111083984375, 79.89212799072266, 82.27314758300781, 84.65416717529297]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 8.0, 9.0, 5.0, 12.0, 12.0, 19.0, 19.0, 30.0, 49.0, 71.0, 116.0, 181.0, 294.0, 474.0, 868.0, 1636.0, 3736.0, 9049.0, 26684.0, 93580.0, 403866.0, 378594.0, 87790.0, 25208.0, 8894.0, 3631.0, 1634.0, 823.0, 453.0, 285.0, 179.0, 97.0, 76.0, 50.0, 39.0, 25.0, 16.0, 11.0, 8.0, 6.0, 7.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.975830078125, -15.40478515625, -14.833740234375, -14.2626953125, -13.691650390625, -13.12060546875, -12.549560546875, -11.978515625, -11.407470703125, -10.83642578125, -10.265380859375, -9.6943359375, -9.123291015625, -8.55224609375, -7.981201171875, -7.41015625, -6.839111328125, -6.26806640625, -5.697021484375, -5.1259765625, -4.554931640625, -3.98388671875, -3.412841796875, -2.841796875, -2.270751953125, -1.69970703125, -1.128662109375, -0.5576171875, 0.013427734375, 0.58447265625, 1.155517578125, 1.7265625, 2.297607421875, 2.86865234375, 3.439697265625, 4.0107421875, 4.581787109375, 5.15283203125, 5.723876953125, 6.294921875, 6.865966796875, 7.43701171875, 8.008056640625, 8.5791015625, 9.150146484375, 9.72119140625, 10.292236328125, 10.86328125, 11.434326171875, 12.00537109375, 12.576416015625, 13.1474609375, 13.718505859375, 14.28955078125, 14.860595703125, 15.431640625, 16.002685546875, 16.57373046875, 17.144775390625, 17.7158203125, 18.286865234375, 18.85791015625, 19.428955078125, 20.0]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 11.0, 17.0, 16.0, 34.0, 38.0, 45.0, 81.0, 98.0, 121.0, 112.0, 103.0, 96.0, 82.0, 43.0, 38.0, 22.0, 15.0, 12.0, 9.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2139892578125, -9.865478515625, -9.5169677734375, -9.16845703125, -8.8199462890625, -8.471435546875, -8.1229248046875, -7.7744140625, -7.4259033203125, -7.077392578125, -6.7288818359375, -6.38037109375, -6.0318603515625, -5.683349609375, -5.3348388671875, -4.986328125, -4.6378173828125, -4.289306640625, -3.9407958984375, -3.59228515625, -3.2437744140625, -2.895263671875, -2.5467529296875, -2.1982421875, -1.8497314453125, -1.501220703125, -1.1527099609375, -0.80419921875, -0.4556884765625, -0.107177734375, 0.2413330078125, 0.58984375, 0.9383544921875, 1.286865234375, 1.6353759765625, 1.98388671875, 2.3323974609375, 2.680908203125, 3.0294189453125, 3.3779296875, 3.7264404296875, 4.074951171875, 4.4234619140625, 4.77197265625, 5.1204833984375, 5.468994140625, 5.8175048828125, 6.166015625, 6.5145263671875, 6.863037109375, 7.2115478515625, 7.56005859375, 7.9085693359375, 8.257080078125, 8.6055908203125, 8.9541015625, 9.3026123046875, 9.651123046875, 9.9996337890625, 10.34814453125, 10.6966552734375, 11.045166015625, 11.3936767578125, 11.7421875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 11.0, 18.0, 13.0, 19.0, 17.0, 32.0, 48.0, 90.0, 165.0, 263.0, 653.0, 1548.0, 6102.0, 110274.0, 906452.0, 18141.0, 2905.0, 875.0, 388.0, 195.0, 114.0, 70.0, 35.0, 30.0, 21.0, 17.0, 8.0, 8.0, 4.0, 6.0, 3.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-71.75, -69.525390625, -67.30078125, -65.076171875, -62.8515625, -60.626953125, -58.40234375, -56.177734375, -53.953125, -51.728515625, -49.50390625, -47.279296875, -45.0546875, -42.830078125, -40.60546875, -38.380859375, -36.15625, -33.931640625, -31.70703125, -29.482421875, -27.2578125, -25.033203125, -22.80859375, -20.583984375, -18.359375, -16.134765625, -13.91015625, -11.685546875, -9.4609375, -7.236328125, -5.01171875, -2.787109375, -0.5625, 1.662109375, 3.88671875, 6.111328125, 8.3359375, 10.560546875, 12.78515625, 15.009765625, 17.234375, 19.458984375, 21.68359375, 23.908203125, 26.1328125, 28.357421875, 30.58203125, 32.806640625, 35.03125, 37.255859375, 39.48046875, 41.705078125, 43.9296875, 46.154296875, 48.37890625, 50.603515625, 52.828125, 55.052734375, 57.27734375, 59.501953125, 61.7265625, 63.951171875, 66.17578125, 68.400390625, 70.625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 3.0, 10.0, 16.0, 22.0, 36.0, 39.0, 77.0, 93.0, 92.0, 90.0, 109.0, 90.0, 93.0, 68.0, 40.0, 33.0, 26.0, 13.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.875, -46.22705078125, -44.5791015625, -42.93115234375, -41.283203125, -39.63525390625, -37.9873046875, -36.33935546875, -34.69140625, -33.04345703125, -31.3955078125, -29.74755859375, -28.099609375, -26.45166015625, -24.8037109375, -23.15576171875, -21.5078125, -19.85986328125, -18.2119140625, -16.56396484375, -14.916015625, -13.26806640625, -11.6201171875, -9.97216796875, -8.32421875, -6.67626953125, -5.0283203125, -3.38037109375, -1.732421875, -0.08447265625, 1.5634765625, 3.21142578125, 4.859375, 6.50732421875, 8.1552734375, 9.80322265625, 11.451171875, 13.09912109375, 14.7470703125, 16.39501953125, 18.04296875, 19.69091796875, 21.3388671875, 22.98681640625, 24.634765625, 26.28271484375, 27.9306640625, 29.57861328125, 31.2265625, 32.87451171875, 34.5224609375, 36.17041015625, 37.818359375, 39.46630859375, 41.1142578125, 42.76220703125, 44.41015625, 46.05810546875, 47.7060546875, 49.35400390625, 51.001953125, 52.64990234375, 54.2978515625, 55.94580078125, 57.59375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 4.0, 12.0, 11.0, 18.0, 28.0, 50.0, 68.0, 116.0, 254.0, 686.0, 2633.0, 34236.0, 997191.0, 10573.0, 1683.0, 480.0, 169.0, 113.0, 51.0, 44.0, 28.0, 17.0, 19.0, 7.0, 2.0, 11.0, 5.0, 4.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.84375, -31.7958984375, -30.748046875, -29.7001953125, -28.65234375, -27.6044921875, -26.556640625, -25.5087890625, -24.4609375, -23.4130859375, -22.365234375, -21.3173828125, -20.26953125, -19.2216796875, -18.173828125, -17.1259765625, -16.078125, -15.0302734375, -13.982421875, -12.9345703125, -11.88671875, -10.8388671875, -9.791015625, -8.7431640625, -7.6953125, -6.6474609375, -5.599609375, -4.5517578125, -3.50390625, -2.4560546875, -1.408203125, -0.3603515625, 0.6875, 1.7353515625, 2.783203125, 3.8310546875, 4.87890625, 5.9267578125, 6.974609375, 8.0224609375, 9.0703125, 10.1181640625, 11.166015625, 12.2138671875, 13.26171875, 14.3095703125, 15.357421875, 16.4052734375, 17.453125, 18.5009765625, 19.548828125, 20.5966796875, 21.64453125, 22.6923828125, 23.740234375, 24.7880859375, 25.8359375, 26.8837890625, 27.931640625, 28.9794921875, 30.02734375, 31.0751953125, 32.123046875, 33.1708984375, 34.21875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 11.0, 14.0, 45.0, 112.0, 317.0, 313.0, 99.0, 35.0, 22.0, 12.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004207611083984375, -0.004057466983795166, -0.003907322883605957, -0.003757178783416748, -0.003607034683227539, -0.00345689058303833, -0.003306746482849121, -0.003156602382659912, -0.003006458282470703, -0.002856314182281494, -0.002706170082092285, -0.002556025981903076, -0.002405881881713867, -0.002255737781524658, -0.0021055936813354492, -0.0019554495811462402, -0.0018053054809570312, -0.0016551613807678223, -0.0015050172805786133, -0.0013548731803894043, -0.0012047290802001953, -0.0010545849800109863, -0.0009044408798217773, -0.0007542967796325684, -0.0006041526794433594, -0.0004540085792541504, -0.0003038644790649414, -0.00015372037887573242, -3.5762786865234375e-06, 0.00014656782150268555, 0.00029671192169189453, 0.0004468560218811035, 0.0005970001220703125, 0.0007471442222595215, 0.0008972883224487305, 0.0010474324226379395, 0.0011975765228271484, 0.0013477206230163574, 0.0014978647232055664, 0.0016480088233947754, 0.0017981529235839844, 0.0019482970237731934, 0.0020984411239624023, 0.0022485852241516113, 0.0023987293243408203, 0.0025488734245300293, 0.0026990175247192383, 0.0028491616249084473, 0.0029993057250976562, 0.0031494498252868652, 0.0032995939254760742, 0.003449738025665283, 0.003599882125854492, 0.003750026226043701, 0.00390017032623291, 0.004050314426422119, 0.004200458526611328, 0.004350602626800537, 0.004500746726989746, 0.004650890827178955, 0.004801034927368164, 0.004951179027557373, 0.005101323127746582, 0.005251467227935791, 0.005401611328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 16.0, 18.0, 16.0, 21.0, 31.0, 43.0, 79.0, 127.0, 274.0, 668.0, 2277.0, 12299.0, 937215.0, 88487.0, 4761.0, 1224.0, 451.0, 204.0, 101.0, 67.0, 42.0, 30.0, 16.0, 9.0, 12.0, 11.0, 5.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.609375, -23.809326171875, -23.00927734375, -22.209228515625, -21.4091796875, -20.609130859375, -19.80908203125, -19.009033203125, -18.208984375, -17.408935546875, -16.60888671875, -15.808837890625, -15.0087890625, -14.208740234375, -13.40869140625, -12.608642578125, -11.80859375, -11.008544921875, -10.20849609375, -9.408447265625, -8.6083984375, -7.808349609375, -7.00830078125, -6.208251953125, -5.408203125, -4.608154296875, -3.80810546875, -3.008056640625, -2.2080078125, -1.407958984375, -0.60791015625, 0.192138671875, 0.9921875, 1.792236328125, 2.59228515625, 3.392333984375, 4.1923828125, 4.992431640625, 5.79248046875, 6.592529296875, 7.392578125, 8.192626953125, 8.99267578125, 9.792724609375, 10.5927734375, 11.392822265625, 12.19287109375, 12.992919921875, 13.79296875, 14.593017578125, 15.39306640625, 16.193115234375, 16.9931640625, 17.793212890625, 18.59326171875, 19.393310546875, 20.193359375, 20.993408203125, 21.79345703125, 22.593505859375, 23.3935546875, 24.193603515625, 24.99365234375, 25.793701171875, 26.59375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 14.0, 35.0, 51.0, 109.0, 182.0, 236.0, 156.0, 82.0, 54.0, 25.0, 5.0, 8.0, 5.0, 4.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.734375, -16.142822265625, -15.55126953125, -14.959716796875, -14.3681640625, -13.776611328125, -13.18505859375, -12.593505859375, -12.001953125, -11.410400390625, -10.81884765625, -10.227294921875, -9.6357421875, -9.044189453125, -8.45263671875, -7.861083984375, -7.26953125, -6.677978515625, -6.08642578125, -5.494873046875, -4.9033203125, -4.311767578125, -3.72021484375, -3.128662109375, -2.537109375, -1.945556640625, -1.35400390625, -0.762451171875, -0.1708984375, 0.420654296875, 1.01220703125, 1.603759765625, 2.1953125, 2.786865234375, 3.37841796875, 3.969970703125, 4.5615234375, 5.153076171875, 5.74462890625, 6.336181640625, 6.927734375, 7.519287109375, 8.11083984375, 8.702392578125, 9.2939453125, 9.885498046875, 10.47705078125, 11.068603515625, 11.66015625, 12.251708984375, 12.84326171875, 13.434814453125, 14.0263671875, 14.617919921875, 15.20947265625, 15.801025390625, 16.392578125, 16.984130859375, 17.57568359375, 18.167236328125, 18.7587890625, 19.350341796875, 19.94189453125, 20.533447265625, 21.125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 19.0, 34.0, 194.0, 465.0, 240.0, 39.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-807.2546997070312, -790.6134033203125, -773.9721069335938, -757.330810546875, -740.6895141601562, -724.0482177734375, -707.4069213867188, -690.765625, -674.124267578125, -657.4829711914062, -640.8416748046875, -624.2003784179688, -607.55908203125, -590.9177856445312, -574.2764892578125, -557.6351318359375, -540.993896484375, -524.3526000976562, -507.7113037109375, -491.07000732421875, -474.4287109375, -457.78741455078125, -441.1460876464844, -424.5047912597656, -407.8634948730469, -391.2221984863281, -374.5809020996094, -357.9396057128906, -341.29827880859375, -324.656982421875, -308.01568603515625, -291.3743896484375, -274.733154296875, -258.09185791015625, -241.4505615234375, -224.8092498779297, -208.16795349121094, -191.5266571044922, -174.88534545898438, -158.24404907226562, -141.60275268554688, -124.96145629882812, -108.32015228271484, -91.67884826660156, -75.03755187988281, -58.39625549316406, -41.75495147705078, -25.1136474609375, -8.47235107421875, 8.168949127197266, 24.81024932861328, 41.4515495300293, 58.09284973144531, 74.73414611816406, 91.37545013427734, 108.01675415039062, 124.65805053710938, 141.29934692382812, 157.94064331054688, 174.5819549560547, 191.22325134277344, 207.8645477294922, 224.505859375, 241.14715576171875, 257.7884521484375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 13.0, 16.0, 16.0, 27.0, 24.0, 31.0, 39.0, 38.0, 47.0, 73.0, 73.0, 74.0, 70.0, 80.0, 75.0, 49.0, 47.0, 35.0, 36.0, 35.0, 30.0, 25.0, 15.0, 5.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-146.8711700439453, -142.57101440429688, -138.27084350585938, -133.97068786621094, -129.6705322265625, -125.370361328125, -121.07020568847656, -116.7700424194336, -112.46987915039062, -108.16971588134766, -103.86955261230469, -99.56939697265625, -95.26923370361328, -90.96907043457031, -86.66891479492188, -82.3687515258789, -78.06858825683594, -73.76842498779297, -69.46826171875, -65.16810607910156, -60.867942810058594, -56.567779541015625, -52.26762008666992, -47.96746063232422, -43.66729736328125, -39.36713409423828, -35.06697463989258, -30.766813278198242, -26.466651916503906, -22.16649055480957, -17.866329193115234, -13.566167831420898, -9.266021728515625, -4.965860366821289, -0.6656990051269531, 3.634462356567383, 7.934623718261719, 12.234785079956055, 16.53494644165039, 20.835107803344727, 25.135269165039062, 29.4354305267334, 33.735591888427734, 38.03575134277344, 42.335914611816406, 46.636077880859375, 50.93623733520508, 55.23639678955078, 59.53656005859375, 63.83672332763672, 68.13688659667969, 72.43704223632812, 76.7372055053711, 81.03736877441406, 85.3375244140625, 89.63768768310547, 93.93785095214844, 98.2380142211914, 102.53817749023438, 106.83833312988281, 111.13849639892578, 115.43865966796875, 119.73881530761719, 124.03897857666016, 128.33914184570312]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 9.0, 38.0, 64.0, 130.0, 419.0, 1794.0, 12020.0, 930025.0, 3228996.0, 17687.0, 2252.0, 526.0, 166.0, 66.0, 29.0, 16.0, 4.0, 10.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.328125, -19.363525390625, -18.39892578125, -17.434326171875, -16.4697265625, -15.505126953125, -14.54052734375, -13.575927734375, -12.611328125, -11.646728515625, -10.68212890625, -9.717529296875, -8.7529296875, -7.788330078125, -6.82373046875, -5.859130859375, -4.89453125, -3.929931640625, -2.96533203125, -2.000732421875, -1.0361328125, -0.071533203125, 0.89306640625, 1.857666015625, 2.822265625, 3.786865234375, 4.75146484375, 5.716064453125, 6.6806640625, 7.645263671875, 8.60986328125, 9.574462890625, 10.5390625, 11.503662109375, 12.46826171875, 13.432861328125, 14.3974609375, 15.362060546875, 16.32666015625, 17.291259765625, 18.255859375, 19.220458984375, 20.18505859375, 21.149658203125, 22.1142578125, 23.078857421875, 24.04345703125, 25.008056640625, 25.97265625, 26.937255859375, 27.90185546875, 28.866455078125, 29.8310546875, 30.795654296875, 31.76025390625, 32.724853515625, 33.689453125, 34.654052734375, 35.61865234375, 36.583251953125, 37.5478515625, 38.512451171875, 39.47705078125, 40.441650390625, 41.40625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 11.0, 14.0, 21.0, 24.0, 24.0, 38.0, 40.0, 61.0, 57.0, 65.0, 74.0, 68.0, 88.0, 76.0, 66.0, 60.0, 51.0, 39.0, 30.0, 35.0, 11.0, 12.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.49066162109375, -4.2508544921875, -4.01104736328125, -3.771240234375, -3.53143310546875, -3.2916259765625, -3.05181884765625, -2.81201171875, -2.57220458984375, -2.3323974609375, -2.09259033203125, -1.852783203125, -1.61297607421875, -1.3731689453125, -1.13336181640625, -0.8935546875, -0.65374755859375, -0.4139404296875, -0.17413330078125, 0.065673828125, 0.30548095703125, 0.5452880859375, 0.78509521484375, 1.02490234375, 1.26470947265625, 1.5045166015625, 1.74432373046875, 1.984130859375, 2.22393798828125, 2.4637451171875, 2.70355224609375, 2.943359375, 3.18316650390625, 3.4229736328125, 3.66278076171875, 3.902587890625, 4.14239501953125, 4.3822021484375, 4.62200927734375, 4.86181640625, 5.10162353515625, 5.3414306640625, 5.58123779296875, 5.821044921875, 6.06085205078125, 6.3006591796875, 6.54046630859375, 6.7802734375, 7.02008056640625, 7.2598876953125, 7.49969482421875, 7.739501953125, 7.97930908203125, 8.2191162109375, 8.45892333984375, 8.69873046875, 8.93853759765625, 9.1783447265625, 9.41815185546875, 9.657958984375, 9.89776611328125, 10.1375732421875, 10.37738037109375, 10.6171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 10.0, 11.0, 28.0, 44.0, 78.0, 115.0, 213.0, 464.0, 901.0, 2109.0, 5627.0, 19596.0, 105030.0, 3259506.0, 733368.0, 49406.0, 11544.0, 3617.0, 1351.0, 604.0, 305.0, 152.0, 81.0, 52.0, 23.0, 17.0, 6.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2890625, -12.7532958984375, -12.217529296875, -11.6817626953125, -11.14599609375, -10.6102294921875, -10.074462890625, -9.5386962890625, -9.0029296875, -8.4671630859375, -7.931396484375, -7.3956298828125, -6.85986328125, -6.3240966796875, -5.788330078125, -5.2525634765625, -4.716796875, -4.1810302734375, -3.645263671875, -3.1094970703125, -2.57373046875, -2.0379638671875, -1.502197265625, -0.9664306640625, -0.4306640625, 0.1051025390625, 0.640869140625, 1.1766357421875, 1.71240234375, 2.2481689453125, 2.783935546875, 3.3197021484375, 3.85546875, 4.3912353515625, 4.927001953125, 5.4627685546875, 5.99853515625, 6.5343017578125, 7.070068359375, 7.6058349609375, 8.1416015625, 8.6773681640625, 9.213134765625, 9.7489013671875, 10.28466796875, 10.8204345703125, 11.356201171875, 11.8919677734375, 12.427734375, 12.9635009765625, 13.499267578125, 14.0350341796875, 14.57080078125, 15.1065673828125, 15.642333984375, 16.1781005859375, 16.7138671875, 17.2496337890625, 17.785400390625, 18.3211669921875, 18.85693359375, 19.3927001953125, 19.928466796875, 20.4642333984375, 21.0]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 18.0, 17.0, 19.0, 33.0, 60.0, 58.0, 149.0, 268.0, 674.0, 1257.0, 771.0, 340.0, 142.0, 83.0, 58.0, 32.0, 31.0, 15.0, 12.0, 6.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.625, -18.1295166015625, -17.634033203125, -17.1385498046875, -16.64306640625, -16.1475830078125, -15.652099609375, -15.1566162109375, -14.6611328125, -14.1656494140625, -13.670166015625, -13.1746826171875, -12.67919921875, -12.1837158203125, -11.688232421875, -11.1927490234375, -10.697265625, -10.2017822265625, -9.706298828125, -9.2108154296875, -8.71533203125, -8.2198486328125, -7.724365234375, -7.2288818359375, -6.7333984375, -6.2379150390625, -5.742431640625, -5.2469482421875, -4.75146484375, -4.2559814453125, -3.760498046875, -3.2650146484375, -2.76953125, -2.2740478515625, -1.778564453125, -1.2830810546875, -0.78759765625, -0.2921142578125, 0.203369140625, 0.6988525390625, 1.1943359375, 1.6898193359375, 2.185302734375, 2.6807861328125, 3.17626953125, 3.6717529296875, 4.167236328125, 4.6627197265625, 5.158203125, 5.6536865234375, 6.149169921875, 6.6446533203125, 7.14013671875, 7.6356201171875, 8.131103515625, 8.6265869140625, 9.1220703125, 9.6175537109375, 10.113037109375, 10.6085205078125, 11.10400390625, 11.5994873046875, 12.094970703125, 12.5904541015625, 13.0859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 14.0, 37.0, 151.0, 390.0, 284.0, 80.0, 20.0, 8.0, 9.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-347.1724853515625, -339.01263427734375, -330.852783203125, -322.6929626464844, -314.5331115722656, -306.3732604980469, -298.2134094238281, -290.0535888671875, -281.89373779296875, -273.73388671875, -265.57403564453125, -257.4142150878906, -249.25436401367188, -241.09451293945312, -232.93466186523438, -224.7748260498047, -216.61497497558594, -208.4551239013672, -200.2952880859375, -192.13543701171875, -183.97560119628906, -175.8157501220703, -167.65591430664062, -159.49606323242188, -151.33621215820312, -143.17636108398438, -135.0165252685547, -126.85667419433594, -118.69683837890625, -110.5369873046875, -102.37714385986328, -94.21730041503906, -86.05746459960938, -77.89762115478516, -69.73777770996094, -61.57793045043945, -53.418087005615234, -45.258243560791016, -37.09839630126953, -28.938552856445312, -20.778709411621094, -12.618865013122559, -4.459020614624023, 3.700824737548828, 11.860668182373047, 20.020511627197266, 28.18035888671875, 36.34020233154297, 44.50004577636719, 52.659889221191406, 60.819732666015625, 68.97958374023438, 77.13941955566406, 85.29927062988281, 93.45911407470703, 101.61895751953125, 109.77880096435547, 117.93864440917969, 126.0984878540039, 134.25833129882812, 142.41818237304688, 150.57801818847656, 158.7378692626953, 166.897705078125, 175.05755615234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 19.0, 10.0, 15.0, 16.0, 21.0, 35.0, 38.0, 29.0, 38.0, 63.0, 51.0, 48.0, 61.0, 62.0, 52.0, 63.0, 64.0, 48.0, 44.0, 45.0, 35.0, 35.0, 19.0, 18.0, 11.0, 13.0, 8.0, 5.0, 4.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.07528305053711, -54.089576721191406, -52.10386657714844, -50.11815643310547, -48.132450103759766, -46.14674377441406, -44.161033630371094, -42.175323486328125, -40.18961715698242, -38.20391082763672, -36.21820068359375, -34.23249053955078, -32.24678421020508, -30.261075973510742, -28.275367736816406, -26.28965950012207, -24.303951263427734, -22.3182430267334, -20.332534790039062, -18.346826553344727, -16.36111831665039, -14.375410079956055, -12.389701843261719, -10.403993606567383, -8.418285369873047, -6.432577133178711, -4.446868896484375, -2.461160659790039, -0.4754524230957031, 1.5102558135986328, 3.4959640502929688, 5.481672286987305, 7.467376708984375, 9.453084945678711, 11.438793182373047, 13.424501419067383, 15.410209655761719, 17.395917892456055, 19.38162612915039, 21.367334365844727, 23.353042602539062, 25.3387508392334, 27.324459075927734, 29.31016731262207, 31.295875549316406, 33.281585693359375, 35.26729202270508, 37.25299835205078, 39.23870849609375, 41.22441864013672, 43.21012496948242, 45.195831298828125, 47.181541442871094, 49.16725158691406, 51.152957916259766, 53.13866424560547, 55.12437438964844, 57.110084533691406, 59.09579086303711, 61.08149719238281, 63.06720733642578, 65.05291748046875, 67.03861999511719, 69.02433013916016, 71.01004028320312]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 13.0, 9.0, 17.0, 19.0, 30.0, 68.0, 89.0, 148.0, 238.0, 412.0, 799.0, 1843.0, 3891.0, 9525.0, 26699.0, 83307.0, 303480.0, 430414.0, 126674.0, 38068.0, 13058.0, 5158.0, 2233.0, 1083.0, 535.0, 266.0, 183.0, 102.0, 62.0, 32.0, 23.0, 20.0, 19.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5703125, -14.102783203125, -13.63525390625, -13.167724609375, -12.7001953125, -12.232666015625, -11.76513671875, -11.297607421875, -10.830078125, -10.362548828125, -9.89501953125, -9.427490234375, -8.9599609375, -8.492431640625, -8.02490234375, -7.557373046875, -7.08984375, -6.622314453125, -6.15478515625, -5.687255859375, -5.2197265625, -4.752197265625, -4.28466796875, -3.817138671875, -3.349609375, -2.882080078125, -2.41455078125, -1.947021484375, -1.4794921875, -1.011962890625, -0.54443359375, -0.076904296875, 0.390625, 0.858154296875, 1.32568359375, 1.793212890625, 2.2607421875, 2.728271484375, 3.19580078125, 3.663330078125, 4.130859375, 4.598388671875, 5.06591796875, 5.533447265625, 6.0009765625, 6.468505859375, 6.93603515625, 7.403564453125, 7.87109375, 8.338623046875, 8.80615234375, 9.273681640625, 9.7412109375, 10.208740234375, 10.67626953125, 11.143798828125, 11.611328125, 12.078857421875, 12.54638671875, 13.013916015625, 13.4814453125, 13.948974609375, 14.41650390625, 14.884033203125, 15.3515625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 14.0, 9.0, 15.0, 20.0, 21.0, 18.0, 22.0, 27.0, 29.0, 36.0, 39.0, 34.0, 37.0, 53.0, 54.0, 49.0, 43.0, 35.0, 51.0, 50.0, 44.0, 37.0, 43.0, 35.0, 18.0, 30.0, 23.0, 25.0, 19.0, 14.0, 13.0, 10.0, 5.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.87109375, -4.71514892578125, -4.5592041015625, -4.40325927734375, -4.247314453125, -4.09136962890625, -3.9354248046875, -3.77947998046875, -3.62353515625, -3.46759033203125, -3.3116455078125, -3.15570068359375, -2.999755859375, -2.84381103515625, -2.6878662109375, -2.53192138671875, -2.3759765625, -2.22003173828125, -2.0640869140625, -1.90814208984375, -1.752197265625, -1.59625244140625, -1.4403076171875, -1.28436279296875, -1.12841796875, -0.97247314453125, -0.8165283203125, -0.66058349609375, -0.504638671875, -0.34869384765625, -0.1927490234375, -0.03680419921875, 0.119140625, 0.27508544921875, 0.4310302734375, 0.58697509765625, 0.742919921875, 0.89886474609375, 1.0548095703125, 1.21075439453125, 1.36669921875, 1.52264404296875, 1.6785888671875, 1.83453369140625, 1.990478515625, 2.14642333984375, 2.3023681640625, 2.45831298828125, 2.6142578125, 2.77020263671875, 2.9261474609375, 3.08209228515625, 3.238037109375, 3.39398193359375, 3.5499267578125, 3.70587158203125, 3.86181640625, 4.01776123046875, 4.1737060546875, 4.32965087890625, 4.485595703125, 4.64154052734375, 4.7974853515625, 4.95343017578125, 5.109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 5.0, 8.0, 14.0, 12.0, 21.0, 13.0, 28.0, 64.0, 73.0, 120.0, 240.0, 459.0, 902.0, 2246.0, 8007.0, 50135.0, 670115.0, 281432.0, 26343.0, 5071.0, 1662.0, 697.0, 330.0, 201.0, 109.0, 73.0, 53.0, 33.0, 26.0, 15.0, 6.0, 1.0, 12.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.78125, -27.84814453125, -26.9150390625, -25.98193359375, -25.048828125, -24.11572265625, -23.1826171875, -22.24951171875, -21.31640625, -20.38330078125, -19.4501953125, -18.51708984375, -17.583984375, -16.65087890625, -15.7177734375, -14.78466796875, -13.8515625, -12.91845703125, -11.9853515625, -11.05224609375, -10.119140625, -9.18603515625, -8.2529296875, -7.31982421875, -6.38671875, -5.45361328125, -4.5205078125, -3.58740234375, -2.654296875, -1.72119140625, -0.7880859375, 0.14501953125, 1.078125, 2.01123046875, 2.9443359375, 3.87744140625, 4.810546875, 5.74365234375, 6.6767578125, 7.60986328125, 8.54296875, 9.47607421875, 10.4091796875, 11.34228515625, 12.275390625, 13.20849609375, 14.1416015625, 15.07470703125, 16.0078125, 16.94091796875, 17.8740234375, 18.80712890625, 19.740234375, 20.67333984375, 21.6064453125, 22.53955078125, 23.47265625, 24.40576171875, 25.3388671875, 26.27197265625, 27.205078125, 28.13818359375, 29.0712890625, 30.00439453125, 30.9375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 3.0, 5.0, 8.0, 6.0, 11.0, 16.0, 12.0, 19.0, 20.0, 25.0, 30.0, 33.0, 40.0, 37.0, 33.0, 42.0, 50.0, 50.0, 49.0, 53.0, 52.0, 35.0, 46.0, 38.0, 39.0, 36.0, 35.0, 34.0, 15.0, 18.0, 25.0, 29.0, 13.0, 9.0, 7.0, 2.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -17.949462890625, -17.33642578125, -16.723388671875, -16.1103515625, -15.497314453125, -14.88427734375, -14.271240234375, -13.658203125, -13.045166015625, -12.43212890625, -11.819091796875, -11.2060546875, -10.593017578125, -9.97998046875, -9.366943359375, -8.75390625, -8.140869140625, -7.52783203125, -6.914794921875, -6.3017578125, -5.688720703125, -5.07568359375, -4.462646484375, -3.849609375, -3.236572265625, -2.62353515625, -2.010498046875, -1.3974609375, -0.784423828125, -0.17138671875, 0.441650390625, 1.0546875, 1.667724609375, 2.28076171875, 2.893798828125, 3.5068359375, 4.119873046875, 4.73291015625, 5.345947265625, 5.958984375, 6.572021484375, 7.18505859375, 7.798095703125, 8.4111328125, 9.024169921875, 9.63720703125, 10.250244140625, 10.86328125, 11.476318359375, 12.08935546875, 12.702392578125, 13.3154296875, 13.928466796875, 14.54150390625, 15.154541015625, 15.767578125, 16.380615234375, 16.99365234375, 17.606689453125, 18.2197265625, 18.832763671875, 19.44580078125, 20.058837890625, 20.671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 11.0, 29.0, 52.0, 117.0, 368.0, 1774.0, 58438.0, 981286.0, 5342.0, 720.0, 228.0, 96.0, 30.0, 14.0, 14.0, 5.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.875, -41.723388671875, -40.57177734375, -39.420166015625, -38.2685546875, -37.116943359375, -35.96533203125, -34.813720703125, -33.662109375, -32.510498046875, -31.35888671875, -30.207275390625, -29.0556640625, -27.904052734375, -26.75244140625, -25.600830078125, -24.44921875, -23.297607421875, -22.14599609375, -20.994384765625, -19.8427734375, -18.691162109375, -17.53955078125, -16.387939453125, -15.236328125, -14.084716796875, -12.93310546875, -11.781494140625, -10.6298828125, -9.478271484375, -8.32666015625, -7.175048828125, -6.0234375, -4.871826171875, -3.72021484375, -2.568603515625, -1.4169921875, -0.265380859375, 0.88623046875, 2.037841796875, 3.189453125, 4.341064453125, 5.49267578125, 6.644287109375, 7.7958984375, 8.947509765625, 10.09912109375, 11.250732421875, 12.40234375, 13.553955078125, 14.70556640625, 15.857177734375, 17.0087890625, 18.160400390625, 19.31201171875, 20.463623046875, 21.615234375, 22.766845703125, 23.91845703125, 25.070068359375, 26.2216796875, 27.373291015625, 28.52490234375, 29.676513671875, 30.828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 26.0, 16.0, 35.0, 36.0, 64.0, 108.0, 159.0, 200.0, 100.0, 64.0, 41.0, 29.0, 35.0, 11.0, 17.0, 13.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.002227783203125, -0.0021677911281585693, -0.0021077990531921387, -0.002047806978225708, -0.0019878149032592773, -0.0019278228282928467, -0.001867830753326416, -0.0018078386783599854, -0.0017478466033935547, -0.001687854528427124, -0.0016278624534606934, -0.0015678703784942627, -0.001507878303527832, -0.0014478862285614014, -0.0013878941535949707, -0.00132790207862854, -0.0012679100036621094, -0.0012079179286956787, -0.001147925853729248, -0.0010879337787628174, -0.0010279417037963867, -0.0009679496288299561, -0.0009079575538635254, -0.0008479654788970947, -0.0007879734039306641, -0.0007279813289642334, -0.0006679892539978027, -0.0006079971790313721, -0.0005480051040649414, -0.00048801302909851074, -0.0004280209541320801, -0.0003680288791656494, -0.00030803680419921875, -0.0002480447292327881, -0.00018805265426635742, -0.00012806057929992676, -6.80685043334961e-05, -8.07642936706543e-06, 5.1915645599365234e-05, 0.0001119077205657959, 0.00017189979553222656, 0.00023189187049865723, 0.0002918839454650879, 0.00035187602043151855, 0.0004118680953979492, 0.0004718601703643799, 0.0005318522453308105, 0.0005918443202972412, 0.0006518363952636719, 0.0007118284702301025, 0.0007718205451965332, 0.0008318126201629639, 0.0008918046951293945, 0.0009517967700958252, 0.0010117888450622559, 0.0010717809200286865, 0.0011317729949951172, 0.0011917650699615479, 0.0012517571449279785, 0.0013117492198944092, 0.0013717412948608398, 0.0014317333698272705, 0.0014917254447937012, 0.0015517175197601318, 0.0016117095947265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 2.0, 12.0, 15.0, 13.0, 24.0, 34.0, 43.0, 101.0, 174.0, 311.0, 794.0, 2122.0, 8077.0, 72049.0, 887544.0, 65930.0, 7702.0, 2081.0, 796.0, 342.0, 150.0, 81.0, 42.0, 34.0, 27.0, 17.0, 6.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.70458984375, -9.2529296875, -8.80126953125, -8.349609375, -7.89794921875, -7.4462890625, -6.99462890625, -6.54296875, -6.09130859375, -5.6396484375, -5.18798828125, -4.736328125, -4.28466796875, -3.8330078125, -3.38134765625, -2.9296875, -2.47802734375, -2.0263671875, -1.57470703125, -1.123046875, -0.67138671875, -0.2197265625, 0.23193359375, 0.68359375, 1.13525390625, 1.5869140625, 2.03857421875, 2.490234375, 2.94189453125, 3.3935546875, 3.84521484375, 4.296875, 4.74853515625, 5.2001953125, 5.65185546875, 6.103515625, 6.55517578125, 7.0068359375, 7.45849609375, 7.91015625, 8.36181640625, 8.8134765625, 9.26513671875, 9.716796875, 10.16845703125, 10.6201171875, 11.07177734375, 11.5234375, 11.97509765625, 12.4267578125, 12.87841796875, 13.330078125, 13.78173828125, 14.2333984375, 14.68505859375, 15.13671875, 15.58837890625, 16.0400390625, 16.49169921875, 16.943359375, 17.39501953125, 17.8466796875, 18.29833984375, 18.75]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 9.0, 8.0, 18.0, 26.0, 30.0, 43.0, 64.0, 93.0, 92.0, 118.0, 139.0, 90.0, 91.0, 53.0, 36.0, 26.0, 10.0, 14.0, 10.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.93359375, -5.63214111328125, -5.3306884765625, -5.02923583984375, -4.727783203125, -4.42633056640625, -4.1248779296875, -3.82342529296875, -3.52197265625, -3.22052001953125, -2.9190673828125, -2.61761474609375, -2.316162109375, -2.01470947265625, -1.7132568359375, -1.41180419921875, -1.1103515625, -0.80889892578125, -0.5074462890625, -0.20599365234375, 0.095458984375, 0.39691162109375, 0.6983642578125, 0.99981689453125, 1.30126953125, 1.60272216796875, 1.9041748046875, 2.20562744140625, 2.507080078125, 2.80853271484375, 3.1099853515625, 3.41143798828125, 3.712890625, 4.01434326171875, 4.3157958984375, 4.61724853515625, 4.918701171875, 5.22015380859375, 5.5216064453125, 5.82305908203125, 6.12451171875, 6.42596435546875, 6.7274169921875, 7.02886962890625, 7.330322265625, 7.63177490234375, 7.9332275390625, 8.23468017578125, 8.5361328125, 8.83758544921875, 9.1390380859375, 9.44049072265625, 9.741943359375, 10.04339599609375, 10.3448486328125, 10.64630126953125, 10.94775390625, 11.24920654296875, 11.5506591796875, 11.85211181640625, 12.153564453125, 12.45501708984375, 12.7564697265625, 13.05792236328125, 13.359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 12.0, 30.0, 128.0, 375.0, 300.0, 100.0, 29.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-378.58331298828125, -368.02154541015625, -357.4598083496094, -346.8980407714844, -336.3362731933594, -325.7745361328125, -315.2127685546875, -304.6510009765625, -294.0892333984375, -283.5274658203125, -272.9657287597656, -262.4039611816406, -251.84219360351562, -241.2804412841797, -230.71868896484375, -220.15692138671875, -209.59518432617188, -199.03343200683594, -188.47166442871094, -177.909912109375, -167.34814453125, -156.78639221191406, -146.22463989257812, -135.66287231445312, -125.10111999511719, -114.53936004638672, -103.97760009765625, -93.41584777832031, -82.85408782958984, -72.29232788085938, -61.73057174682617, -51.16881561279297, -40.6070556640625, -30.045297622680664, -19.483539581298828, -8.921781539916992, 1.6399765014648438, 12.201736450195312, 22.763492584228516, 33.32524871826172, 43.88700866699219, 54.448768615722656, 65.01052856445312, 75.57228088378906, 86.13404083251953, 96.69580078125, 107.25755310058594, 117.8193130493164, 128.38107299804688, 138.9428253173828, 149.5045928955078, 160.06634521484375, 170.62811279296875, 181.1898651123047, 191.75161743164062, 202.31338500976562, 212.87513732910156, 223.4368896484375, 233.9986572265625, 244.56040954589844, 255.12216186523438, 265.6839294433594, 276.2456970214844, 286.80743408203125, 297.36920166015625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 7.0, 11.0, 7.0, 11.0, 12.0, 11.0, 20.0, 24.0, 20.0, 31.0, 43.0, 36.0, 36.0, 34.0, 35.0, 54.0, 54.0, 63.0, 70.0, 47.0, 43.0, 35.0, 37.0, 38.0, 38.0, 24.0, 23.0, 20.0, 25.0, 14.0, 16.0, 11.0, 14.0, 7.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-89.90695190429688, -87.3105239868164, -84.71410369873047, -82.11767578125, -79.52125549316406, -76.9248275756836, -74.32839965820312, -71.73197937011719, -69.13555145263672, -66.53912353515625, -63.94270324707031, -61.346275329589844, -58.74985122680664, -56.15342712402344, -53.55699920654297, -50.960575103759766, -48.36415100097656, -45.76772689819336, -43.171302795410156, -40.57487487792969, -37.978450775146484, -35.38202667236328, -32.78559875488281, -30.18917465209961, -27.592750549316406, -24.996326446533203, -22.399900436401367, -19.80347442626953, -17.207050323486328, -14.610625267028809, -12.014200210571289, -9.417774200439453, -6.82135009765625, -4.2249250411987305, -1.628499984741211, 0.9679250717163086, 3.564350128173828, 6.160775184631348, 8.757200241088867, 11.353626251220703, 13.950050354003906, 16.54647445678711, 19.142900466918945, 21.73932647705078, 24.335750579833984, 26.932174682617188, 29.528600692749023, 32.12502670288086, 34.72145080566406, 37.317874908447266, 39.91429901123047, 42.51072692871094, 45.10715103149414, 47.703575134277344, 50.30000305175781, 52.896427154541016, 55.49285125732422, 58.08927536010742, 60.685699462890625, 63.282127380371094, 65.87855529785156, 68.4749755859375, 71.07140350341797, 73.66783142089844, 76.26425170898438]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 10.0, 17.0, 13.0, 29.0, 30.0, 68.0, 133.0, 267.0, 644.0, 1866.0, 7167.0, 39501.0, 608260.0, 3368869.0, 144042.0, 17760.0, 3789.0, 1072.0, 361.0, 141.0, 80.0, 39.0, 40.0, 16.0, 12.0, 13.0, 3.0, 6.0, 5.0, 2.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -11.8878173828125, -11.377197265625, -10.8665771484375, -10.35595703125, -9.8453369140625, -9.334716796875, -8.8240966796875, -8.3134765625, -7.8028564453125, -7.292236328125, -6.7816162109375, -6.27099609375, -5.7603759765625, -5.249755859375, -4.7391357421875, -4.228515625, -3.7178955078125, -3.207275390625, -2.6966552734375, -2.18603515625, -1.6754150390625, -1.164794921875, -0.6541748046875, -0.1435546875, 0.3670654296875, 0.877685546875, 1.3883056640625, 1.89892578125, 2.4095458984375, 2.920166015625, 3.4307861328125, 3.94140625, 4.4520263671875, 4.962646484375, 5.4732666015625, 5.98388671875, 6.4945068359375, 7.005126953125, 7.5157470703125, 8.0263671875, 8.5369873046875, 9.047607421875, 9.5582275390625, 10.06884765625, 10.5794677734375, 11.090087890625, 11.6007080078125, 12.111328125, 12.6219482421875, 13.132568359375, 13.6431884765625, 14.15380859375, 14.6644287109375, 15.175048828125, 15.6856689453125, 16.1962890625, 16.7069091796875, 17.217529296875, 17.7281494140625, 18.23876953125, 18.7493896484375, 19.260009765625, 19.7706298828125, 20.28125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 8.0, 8.0, 12.0, 11.0, 13.0, 14.0, 17.0, 30.0, 31.0, 34.0, 37.0, 40.0, 32.0, 37.0, 60.0, 45.0, 52.0, 50.0, 51.0, 49.0, 48.0, 35.0, 34.0, 21.0, 29.0, 35.0, 32.0, 24.0, 17.0, 15.0, 15.0, 7.0, 10.0, 12.0, 4.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.2340087890625, -4.096923828125, -3.9598388671875, -3.82275390625, -3.6856689453125, -3.548583984375, -3.4114990234375, -3.2744140625, -3.1373291015625, -3.000244140625, -2.8631591796875, -2.72607421875, -2.5889892578125, -2.451904296875, -2.3148193359375, -2.177734375, -2.0406494140625, -1.903564453125, -1.7664794921875, -1.62939453125, -1.4923095703125, -1.355224609375, -1.2181396484375, -1.0810546875, -0.9439697265625, -0.806884765625, -0.6697998046875, -0.53271484375, -0.3956298828125, -0.258544921875, -0.1214599609375, 0.015625, 0.1527099609375, 0.289794921875, 0.4268798828125, 0.56396484375, 0.7010498046875, 0.838134765625, 0.9752197265625, 1.1123046875, 1.2493896484375, 1.386474609375, 1.5235595703125, 1.66064453125, 1.7977294921875, 1.934814453125, 2.0718994140625, 2.208984375, 2.3460693359375, 2.483154296875, 2.6202392578125, 2.75732421875, 2.8944091796875, 3.031494140625, 3.1685791015625, 3.3056640625, 3.4427490234375, 3.579833984375, 3.7169189453125, 3.85400390625, 3.9910888671875, 4.128173828125, 4.2652587890625, 4.40234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 14.0, 12.0, 25.0, 34.0, 48.0, 75.0, 113.0, 238.0, 517.0, 1108.0, 2711.0, 8606.0, 31532.0, 165629.0, 2442358.0, 1394796.0, 112209.0, 23416.0, 6685.0, 2264.0, 911.0, 430.0, 212.0, 116.0, 72.0, 48.0, 22.0, 19.0, 17.0, 10.0, 5.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0546875, -12.657958984375, -12.26123046875, -11.864501953125, -11.4677734375, -11.071044921875, -10.67431640625, -10.277587890625, -9.880859375, -9.484130859375, -9.08740234375, -8.690673828125, -8.2939453125, -7.897216796875, -7.50048828125, -7.103759765625, -6.70703125, -6.310302734375, -5.91357421875, -5.516845703125, -5.1201171875, -4.723388671875, -4.32666015625, -3.929931640625, -3.533203125, -3.136474609375, -2.73974609375, -2.343017578125, -1.9462890625, -1.549560546875, -1.15283203125, -0.756103515625, -0.359375, 0.037353515625, 0.43408203125, 0.830810546875, 1.2275390625, 1.624267578125, 2.02099609375, 2.417724609375, 2.814453125, 3.211181640625, 3.60791015625, 4.004638671875, 4.4013671875, 4.798095703125, 5.19482421875, 5.591552734375, 5.98828125, 6.385009765625, 6.78173828125, 7.178466796875, 7.5751953125, 7.971923828125, 8.36865234375, 8.765380859375, 9.162109375, 9.558837890625, 9.95556640625, 10.352294921875, 10.7490234375, 11.145751953125, 11.54248046875, 11.939208984375, 12.3359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 5.0, 6.0, 11.0, 8.0, 18.0, 23.0, 26.0, 27.0, 39.0, 68.0, 75.0, 95.0, 136.0, 187.0, 274.0, 421.0, 619.0, 600.0, 446.0, 272.0, 209.0, 130.0, 77.0, 70.0, 58.0, 38.0, 28.0, 25.0, 15.0, 15.0, 8.0, 6.0, 8.0, 4.0, 5.0, 5.0, 7.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8125, -10.4749755859375, -10.137451171875, -9.7999267578125, -9.46240234375, -9.1248779296875, -8.787353515625, -8.4498291015625, -8.1123046875, -7.7747802734375, -7.437255859375, -7.0997314453125, -6.76220703125, -6.4246826171875, -6.087158203125, -5.7496337890625, -5.412109375, -5.0745849609375, -4.737060546875, -4.3995361328125, -4.06201171875, -3.7244873046875, -3.386962890625, -3.0494384765625, -2.7119140625, -2.3743896484375, -2.036865234375, -1.6993408203125, -1.36181640625, -1.0242919921875, -0.686767578125, -0.3492431640625, -0.01171875, 0.3258056640625, 0.663330078125, 1.0008544921875, 1.33837890625, 1.6759033203125, 2.013427734375, 2.3509521484375, 2.6884765625, 3.0260009765625, 3.363525390625, 3.7010498046875, 4.03857421875, 4.3760986328125, 4.713623046875, 5.0511474609375, 5.388671875, 5.7261962890625, 6.063720703125, 6.4012451171875, 6.73876953125, 7.0762939453125, 7.413818359375, 7.7513427734375, 8.0888671875, 8.4263916015625, 8.763916015625, 9.1014404296875, 9.43896484375, 9.7764892578125, 10.114013671875, 10.4515380859375, 10.7890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 8.0, 14.0, 32.0, 68.0, 154.0, 215.0, 204.0, 162.0, 66.0, 26.0, 14.0, 5.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.7950439453125, -124.1967544555664, -118.59846496582031, -113.00017547607422, -107.40188598632812, -101.80359649658203, -96.20530700683594, -90.60701751708984, -85.00872802734375, -79.41043853759766, -73.81214904785156, -68.21385955810547, -62.615570068359375, -57.01728057861328, -51.41899108886719, -45.820701599121094, -40.222412109375, -34.624122619628906, -29.025833129882812, -23.42754364013672, -17.829254150390625, -12.230964660644531, -6.6326751708984375, -1.0343856811523438, 4.56390380859375, 10.162193298339844, 15.760482788085938, 21.35877227783203, 26.957061767578125, 32.55535125732422, 38.15364074707031, 43.751930236816406, 49.3502197265625, 54.948509216308594, 60.54679870605469, 66.14508819580078, 71.74337768554688, 77.34166717529297, 82.93995666503906, 88.53824615478516, 94.13653564453125, 99.73482513427734, 105.33311462402344, 110.93140411376953, 116.52969360351562, 122.12798309326172, 127.72627258300781, 133.32455444335938, 138.9228515625, 144.52114868164062, 150.1194305419922, 155.71771240234375, 161.31600952148438, 166.914306640625, 172.51258850097656, 178.11087036132812, 183.70916748046875, 189.30746459960938, 194.90574645996094, 200.5040283203125, 206.10232543945312, 211.70062255859375, 217.2989044189453, 222.89718627929688, 228.4954833984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 3.0, 10.0, 14.0, 20.0, 15.0, 21.0, 23.0, 31.0, 35.0, 18.0, 27.0, 47.0, 39.0, 43.0, 49.0, 54.0, 51.0, 44.0, 45.0, 43.0, 50.0, 50.0, 31.0, 30.0, 33.0, 30.0, 26.0, 20.0, 14.0, 22.0, 11.0, 12.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.21015548706055, -58.33202362060547, -56.453887939453125, -54.57575607299805, -52.69762420654297, -50.81949234008789, -48.94136047363281, -47.06322479248047, -45.18509292602539, -43.30696105957031, -41.42882537841797, -39.55069351196289, -37.67256164550781, -35.794429779052734, -33.916297912597656, -32.03816223144531, -30.160030364990234, -28.281898498535156, -26.403764724731445, -24.525630950927734, -22.647499084472656, -20.769367218017578, -18.891233444213867, -17.013099670410156, -15.134967803955078, -13.256834983825684, -11.378702163696289, -9.500569343566895, -7.6224365234375, -5.7443037033081055, -3.866170883178711, -1.9880380630493164, -0.1099090576171875, 1.768223762512207, 3.6463565826416016, 5.524489402770996, 7.402622222900391, 9.280755043029785, 11.15888786315918, 13.037020683288574, 14.915153503417969, 16.793285369873047, 18.671419143676758, 20.54955291748047, 22.427684783935547, 24.305816650390625, 26.183950424194336, 28.062084197998047, 29.940216064453125, 31.818347930908203, 33.69647979736328, 35.574615478515625, 37.4527473449707, 39.33087921142578, 41.209014892578125, 43.0871467590332, 44.96527862548828, 46.84341049194336, 48.72154235839844, 50.59967803955078, 52.47780990600586, 54.35594177246094, 56.23407745361328, 58.11220932006836, 59.99034118652344]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 6.0, 7.0, 6.0, 6.0, 14.0, 14.0, 21.0, 32.0, 48.0, 104.0, 135.0, 258.0, 454.0, 1024.0, 2326.0, 6576.0, 21979.0, 83647.0, 318753.0, 439683.0, 125516.0, 32892.0, 9201.0, 3208.0, 1336.0, 576.0, 282.0, 158.0, 95.0, 58.0, 47.0, 26.0, 24.0, 13.0, 9.0, 2.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.53125, -16.01708984375, -15.5029296875, -14.98876953125, -14.474609375, -13.96044921875, -13.4462890625, -12.93212890625, -12.41796875, -11.90380859375, -11.3896484375, -10.87548828125, -10.361328125, -9.84716796875, -9.3330078125, -8.81884765625, -8.3046875, -7.79052734375, -7.2763671875, -6.76220703125, -6.248046875, -5.73388671875, -5.2197265625, -4.70556640625, -4.19140625, -3.67724609375, -3.1630859375, -2.64892578125, -2.134765625, -1.62060546875, -1.1064453125, -0.59228515625, -0.078125, 0.43603515625, 0.9501953125, 1.46435546875, 1.978515625, 2.49267578125, 3.0068359375, 3.52099609375, 4.03515625, 4.54931640625, 5.0634765625, 5.57763671875, 6.091796875, 6.60595703125, 7.1201171875, 7.63427734375, 8.1484375, 8.66259765625, 9.1767578125, 9.69091796875, 10.205078125, 10.71923828125, 11.2333984375, 11.74755859375, 12.26171875, 12.77587890625, 13.2900390625, 13.80419921875, 14.318359375, 14.83251953125, 15.3466796875, 15.86083984375, 16.375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 2.0, 5.0, 7.0, 9.0, 8.0, 13.0, 9.0, 13.0, 21.0, 22.0, 25.0, 28.0, 28.0, 41.0, 31.0, 39.0, 43.0, 40.0, 43.0, 48.0, 42.0, 39.0, 55.0, 43.0, 52.0, 43.0, 38.0, 33.0, 23.0, 23.0, 19.0, 18.0, 18.0, 15.0, 16.0, 9.0, 9.0, 8.0, 9.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.13641357421875, -4.0032958984375, -3.87017822265625, -3.737060546875, -3.60394287109375, -3.4708251953125, -3.33770751953125, -3.20458984375, -3.07147216796875, -2.9383544921875, -2.80523681640625, -2.672119140625, -2.53900146484375, -2.4058837890625, -2.27276611328125, -2.1396484375, -2.00653076171875, -1.8734130859375, -1.74029541015625, -1.607177734375, -1.47406005859375, -1.3409423828125, -1.20782470703125, -1.07470703125, -0.94158935546875, -0.8084716796875, -0.67535400390625, -0.542236328125, -0.40911865234375, -0.2760009765625, -0.14288330078125, -0.009765625, 0.12335205078125, 0.2564697265625, 0.38958740234375, 0.522705078125, 0.65582275390625, 0.7889404296875, 0.92205810546875, 1.05517578125, 1.18829345703125, 1.3214111328125, 1.45452880859375, 1.587646484375, 1.72076416015625, 1.8538818359375, 1.98699951171875, 2.1201171875, 2.25323486328125, 2.3863525390625, 2.51947021484375, 2.652587890625, 2.78570556640625, 2.9188232421875, 3.05194091796875, 3.18505859375, 3.31817626953125, 3.4512939453125, 3.58441162109375, 3.717529296875, 3.85064697265625, 3.9837646484375, 4.11688232421875, 4.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 10.0, 14.0, 21.0, 25.0, 26.0, 49.0, 80.0, 138.0, 263.0, 436.0, 873.0, 2041.0, 7720.0, 113225.0, 877504.0, 38205.0, 4793.0, 1570.0, 668.0, 360.0, 203.0, 106.0, 56.0, 45.0, 35.0, 16.0, 20.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.375, -41.02294921875, -39.6708984375, -38.31884765625, -36.966796875, -35.61474609375, -34.2626953125, -32.91064453125, -31.55859375, -30.20654296875, -28.8544921875, -27.50244140625, -26.150390625, -24.79833984375, -23.4462890625, -22.09423828125, -20.7421875, -19.39013671875, -18.0380859375, -16.68603515625, -15.333984375, -13.98193359375, -12.6298828125, -11.27783203125, -9.92578125, -8.57373046875, -7.2216796875, -5.86962890625, -4.517578125, -3.16552734375, -1.8134765625, -0.46142578125, 0.890625, 2.24267578125, 3.5947265625, 4.94677734375, 6.298828125, 7.65087890625, 9.0029296875, 10.35498046875, 11.70703125, 13.05908203125, 14.4111328125, 15.76318359375, 17.115234375, 18.46728515625, 19.8193359375, 21.17138671875, 22.5234375, 23.87548828125, 25.2275390625, 26.57958984375, 27.931640625, 29.28369140625, 30.6357421875, 31.98779296875, 33.33984375, 34.69189453125, 36.0439453125, 37.39599609375, 38.748046875, 40.10009765625, 41.4521484375, 42.80419921875, 44.15625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 3.0, 8.0, 13.0, 16.0, 16.0, 19.0, 24.0, 19.0, 40.0, 44.0, 30.0, 49.0, 41.0, 66.0, 61.0, 68.0, 61.0, 71.0, 50.0, 41.0, 48.0, 40.0, 31.0, 28.0, 27.0, 16.0, 16.0, 15.0, 12.0, 9.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.953125, -20.19189453125, -19.4306640625, -18.66943359375, -17.908203125, -17.14697265625, -16.3857421875, -15.62451171875, -14.86328125, -14.10205078125, -13.3408203125, -12.57958984375, -11.818359375, -11.05712890625, -10.2958984375, -9.53466796875, -8.7734375, -8.01220703125, -7.2509765625, -6.48974609375, -5.728515625, -4.96728515625, -4.2060546875, -3.44482421875, -2.68359375, -1.92236328125, -1.1611328125, -0.39990234375, 0.361328125, 1.12255859375, 1.8837890625, 2.64501953125, 3.40625, 4.16748046875, 4.9287109375, 5.68994140625, 6.451171875, 7.21240234375, 7.9736328125, 8.73486328125, 9.49609375, 10.25732421875, 11.0185546875, 11.77978515625, 12.541015625, 13.30224609375, 14.0634765625, 14.82470703125, 15.5859375, 16.34716796875, 17.1083984375, 17.86962890625, 18.630859375, 19.39208984375, 20.1533203125, 20.91455078125, 21.67578125, 22.43701171875, 23.1982421875, 23.95947265625, 24.720703125, 25.48193359375, 26.2431640625, 27.00439453125, 27.765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 12.0, 8.0, 6.0, 7.0, 15.0, 20.0, 16.0, 29.0, 79.0, 108.0, 204.0, 560.0, 2611.0, 26913.0, 909966.0, 100956.0, 5455.0, 940.0, 312.0, 137.0, 63.0, 43.0, 25.0, 19.0, 13.0, 5.0, 4.0, 4.0, 2.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1875, -12.711181640625, -12.23486328125, -11.758544921875, -11.2822265625, -10.805908203125, -10.32958984375, -9.853271484375, -9.376953125, -8.900634765625, -8.42431640625, -7.947998046875, -7.4716796875, -6.995361328125, -6.51904296875, -6.042724609375, -5.56640625, -5.090087890625, -4.61376953125, -4.137451171875, -3.6611328125, -3.184814453125, -2.70849609375, -2.232177734375, -1.755859375, -1.279541015625, -0.80322265625, -0.326904296875, 0.1494140625, 0.625732421875, 1.10205078125, 1.578369140625, 2.0546875, 2.531005859375, 3.00732421875, 3.483642578125, 3.9599609375, 4.436279296875, 4.91259765625, 5.388916015625, 5.865234375, 6.341552734375, 6.81787109375, 7.294189453125, 7.7705078125, 8.246826171875, 8.72314453125, 9.199462890625, 9.67578125, 10.152099609375, 10.62841796875, 11.104736328125, 11.5810546875, 12.057373046875, 12.53369140625, 13.010009765625, 13.486328125, 13.962646484375, 14.43896484375, 14.915283203125, 15.3916015625, 15.867919921875, 16.34423828125, 16.820556640625, 17.296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 11.0, 4.0, 9.0, 16.0, 12.0, 19.0, 28.0, 34.0, 38.0, 45.0, 67.0, 85.0, 146.0, 130.0, 78.0, 49.0, 33.0, 34.0, 27.0, 23.0, 15.0, 15.0, 20.0, 7.0, 9.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0018224716186523438, -0.0017727762460708618, -0.0017230808734893799, -0.001673385500907898, -0.001623690128326416, -0.001573994755744934, -0.0015242993831634521, -0.0014746040105819702, -0.0014249086380004883, -0.0013752132654190063, -0.0013255178928375244, -0.0012758225202560425, -0.0012261271476745605, -0.0011764317750930786, -0.0011267364025115967, -0.0010770410299301147, -0.0010273456573486328, -0.0009776502847671509, -0.0009279549121856689, -0.000878259539604187, -0.0008285641670227051, -0.0007788687944412231, -0.0007291734218597412, -0.0006794780492782593, -0.0006297826766967773, -0.0005800873041152954, -0.0005303919315338135, -0.00048069655895233154, -0.0004310011863708496, -0.0003813058137893677, -0.00033161044120788574, -0.0002819150686264038, -0.00023221969604492188, -0.00018252432346343994, -0.000132828950881958, -8.313357830047607e-05, -3.343820571899414e-05, 1.6257166862487793e-05, 6.595253944396973e-05, 0.00011564791202545166, 0.0001653432846069336, 0.00021503865718841553, 0.00026473402976989746, 0.0003144294023513794, 0.00036412477493286133, 0.00041382014751434326, 0.0004635155200958252, 0.0005132108926773071, 0.0005629062652587891, 0.000612601637840271, 0.0006622970104217529, 0.0007119923830032349, 0.0007616877555847168, 0.0008113831281661987, 0.0008610785007476807, 0.0009107738733291626, 0.0009604692459106445, 0.0010101646184921265, 0.0010598599910736084, 0.0011095553636550903, 0.0011592507362365723, 0.0012089461088180542, 0.0012586414813995361, 0.001308336853981018, 0.0013580322265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 5.0, 4.0, 10.0, 9.0, 8.0, 14.0, 26.0, 40.0, 73.0, 94.0, 144.0, 264.0, 494.0, 1081.0, 2598.0, 8852.0, 54876.0, 828631.0, 130613.0, 14125.0, 3809.0, 1317.0, 637.0, 299.0, 180.0, 111.0, 64.0, 41.0, 30.0, 32.0, 13.0, 15.0, 9.0, 5.0, 7.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-10.9375, -10.6307373046875, -10.323974609375, -10.0172119140625, -9.71044921875, -9.4036865234375, -9.096923828125, -8.7901611328125, -8.4833984375, -8.1766357421875, -7.869873046875, -7.5631103515625, -7.25634765625, -6.9495849609375, -6.642822265625, -6.3360595703125, -6.029296875, -5.7225341796875, -5.415771484375, -5.1090087890625, -4.80224609375, -4.4954833984375, -4.188720703125, -3.8819580078125, -3.5751953125, -3.2684326171875, -2.961669921875, -2.6549072265625, -2.34814453125, -2.0413818359375, -1.734619140625, -1.4278564453125, -1.12109375, -0.8143310546875, -0.507568359375, -0.2008056640625, 0.10595703125, 0.4127197265625, 0.719482421875, 1.0262451171875, 1.3330078125, 1.6397705078125, 1.946533203125, 2.2532958984375, 2.56005859375, 2.8668212890625, 3.173583984375, 3.4803466796875, 3.787109375, 4.0938720703125, 4.400634765625, 4.7073974609375, 5.01416015625, 5.3209228515625, 5.627685546875, 5.9344482421875, 6.2412109375, 6.5479736328125, 6.854736328125, 7.1614990234375, 7.46826171875, 7.7750244140625, 8.081787109375, 8.3885498046875, 8.6953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 7.0, 7.0, 15.0, 15.0, 27.0, 33.0, 43.0, 56.0, 64.0, 94.0, 131.0, 122.0, 106.0, 83.0, 49.0, 37.0, 33.0, 13.0, 15.0, 7.0, 6.0, 3.0, 7.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.58984375, -6.34527587890625, -6.1007080078125, -5.85614013671875, -5.611572265625, -5.36700439453125, -5.1224365234375, -4.87786865234375, -4.63330078125, -4.38873291015625, -4.1441650390625, -3.89959716796875, -3.655029296875, -3.41046142578125, -3.1658935546875, -2.92132568359375, -2.6767578125, -2.43218994140625, -2.1876220703125, -1.94305419921875, -1.698486328125, -1.45391845703125, -1.2093505859375, -0.96478271484375, -0.72021484375, -0.47564697265625, -0.2310791015625, 0.01348876953125, 0.258056640625, 0.50262451171875, 0.7471923828125, 0.99176025390625, 1.236328125, 1.48089599609375, 1.7254638671875, 1.97003173828125, 2.214599609375, 2.45916748046875, 2.7037353515625, 2.94830322265625, 3.19287109375, 3.43743896484375, 3.6820068359375, 3.92657470703125, 4.171142578125, 4.41571044921875, 4.6602783203125, 4.90484619140625, 5.1494140625, 5.39398193359375, 5.6385498046875, 5.88311767578125, 6.127685546875, 6.37225341796875, 6.6168212890625, 6.86138916015625, 7.10595703125, 7.35052490234375, 7.5950927734375, 7.83966064453125, 8.084228515625, 8.32879638671875, 8.5733642578125, 8.81793212890625, 9.0625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 10.0, 21.0, 34.0, 63.0, 115.0, 204.0, 232.0, 134.0, 87.0, 40.0, 18.0, 10.0, 5.0, 1.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.42556762695312, -152.39869689941406, -147.371826171875, -142.34495544433594, -137.31808471679688, -132.29119873046875, -127.26433563232422, -122.23745727539062, -117.21058654785156, -112.1837158203125, -107.15684509277344, -102.12997436523438, -97.10309600830078, -92.07622528076172, -87.04935455322266, -82.02247619628906, -76.99561309814453, -71.96874237060547, -66.9418716430664, -61.91499710083008, -56.88812255859375, -51.86125183105469, -46.834381103515625, -41.8075065612793, -36.780635833740234, -31.75376319885254, -26.726890563964844, -21.70001983642578, -16.673147201538086, -11.64627456665039, -6.619403839111328, -1.592529296875, 3.4343414306640625, 8.461214065551758, 13.488085746765137, 18.514957427978516, 23.54183006286621, 28.568702697753906, 33.59557342529297, 38.6224479675293, 43.64931869506836, 48.67618942260742, 53.70306396484375, 58.72993469238281, 63.756805419921875, 68.78367614746094, 73.810546875, 78.8374252319336, 83.86429595947266, 88.89116668701172, 93.91803741455078, 98.94491577148438, 103.97178649902344, 108.9986572265625, 114.02552795410156, 119.05239868164062, 124.07926940917969, 129.10614013671875, 134.1330108642578, 139.15988159179688, 144.18675231933594, 149.213623046875, 154.24050903320312, 159.2673797607422, 164.29425048828125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 12.0, 10.0, 11.0, 7.0, 18.0, 20.0, 32.0, 26.0, 28.0, 29.0, 30.0, 33.0, 37.0, 39.0, 49.0, 64.0, 55.0, 45.0, 56.0, 51.0, 44.0, 25.0, 36.0, 37.0, 24.0, 20.0, 20.0, 14.0, 14.0, 10.0, 16.0, 12.0, 8.0, 6.0, 11.0, 8.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-68.70359802246094, -66.64787292480469, -64.5921401977539, -62.53641128540039, -60.480682373046875, -58.42495346069336, -56.369224548339844, -54.31349563598633, -52.25776672363281, -50.2020378112793, -48.14630889892578, -46.090579986572266, -44.03485107421875, -41.979122161865234, -39.92339324951172, -37.8676643371582, -35.81193542480469, -33.75620651245117, -31.700477600097656, -29.64474868774414, -27.589019775390625, -25.53329086303711, -23.477561950683594, -21.421833038330078, -19.366104125976562, -17.310375213623047, -15.254646301269531, -13.198917388916016, -11.1431884765625, -9.087459564208984, -7.031730651855469, -4.976001739501953, -2.920276641845703, -0.8645477294921875, 1.1911811828613281, 3.2469100952148438, 5.302639007568359, 7.358367919921875, 9.41409683227539, 11.469825744628906, 13.525554656982422, 15.581283569335938, 17.637012481689453, 19.69274139404297, 21.748470306396484, 23.80419921875, 25.859928131103516, 27.91565704345703, 29.971385955810547, 32.02711486816406, 34.08284378051758, 36.138572692871094, 38.19430160522461, 40.250030517578125, 42.30575942993164, 44.361488342285156, 46.41721725463867, 48.47294616699219, 50.5286750793457, 52.58440399169922, 54.640132904052734, 56.69586181640625, 58.751590728759766, 60.80731964111328, 62.8630485534668]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 27.0, 23.0, 68.0, 186.0, 597.0, 2652.0, 26282.0, 3200767.0, 946646.0, 14620.0, 1704.0, 407.0, 147.0, 62.0, 25.0, 19.0, 10.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.5, -16.735595703125, -15.97119140625, -15.206787109375, -14.4423828125, -13.677978515625, -12.91357421875, -12.149169921875, -11.384765625, -10.620361328125, -9.85595703125, -9.091552734375, -8.3271484375, -7.562744140625, -6.79833984375, -6.033935546875, -5.26953125, -4.505126953125, -3.74072265625, -2.976318359375, -2.2119140625, -1.447509765625, -0.68310546875, 0.081298828125, 0.845703125, 1.610107421875, 2.37451171875, 3.138916015625, 3.9033203125, 4.667724609375, 5.43212890625, 6.196533203125, 6.9609375, 7.725341796875, 8.48974609375, 9.254150390625, 10.0185546875, 10.782958984375, 11.54736328125, 12.311767578125, 13.076171875, 13.840576171875, 14.60498046875, 15.369384765625, 16.1337890625, 16.898193359375, 17.66259765625, 18.427001953125, 19.19140625, 19.955810546875, 20.72021484375, 21.484619140625, 22.2490234375, 23.013427734375, 23.77783203125, 24.542236328125, 25.306640625, 26.071044921875, 26.83544921875, 27.599853515625, 28.3642578125, 29.128662109375, 29.89306640625, 30.657470703125, 31.421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 6.0, 11.0, 22.0, 14.0, 26.0, 19.0, 27.0, 22.0, 32.0, 39.0, 37.0, 41.0, 59.0, 51.0, 49.0, 49.0, 45.0, 49.0, 47.0, 52.0, 58.0, 46.0, 34.0, 29.0, 26.0, 24.0, 11.0, 17.0, 13.0, 7.0, 6.0, 9.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-5.37890625, -5.230712890625, -5.08251953125, -4.934326171875, -4.7861328125, -4.637939453125, -4.48974609375, -4.341552734375, -4.193359375, -4.045166015625, -3.89697265625, -3.748779296875, -3.6005859375, -3.452392578125, -3.30419921875, -3.156005859375, -3.0078125, -2.859619140625, -2.71142578125, -2.563232421875, -2.4150390625, -2.266845703125, -2.11865234375, -1.970458984375, -1.822265625, -1.674072265625, -1.52587890625, -1.377685546875, -1.2294921875, -1.081298828125, -0.93310546875, -0.784912109375, -0.63671875, -0.488525390625, -0.34033203125, -0.192138671875, -0.0439453125, 0.104248046875, 0.25244140625, 0.400634765625, 0.548828125, 0.697021484375, 0.84521484375, 0.993408203125, 1.1416015625, 1.289794921875, 1.43798828125, 1.586181640625, 1.734375, 1.882568359375, 2.03076171875, 2.178955078125, 2.3271484375, 2.475341796875, 2.62353515625, 2.771728515625, 2.919921875, 3.068115234375, 3.21630859375, 3.364501953125, 3.5126953125, 3.660888671875, 3.80908203125, 3.957275390625, 4.10546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 8.0, 15.0, 19.0, 24.0, 61.0, 96.0, 213.0, 501.0, 1199.0, 4702.0, 31956.0, 772040.0, 3303798.0, 68517.0, 8172.0, 1854.0, 615.0, 254.0, 122.0, 48.0, 27.0, 17.0, 9.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1171875, -14.4915771484375, -13.865966796875, -13.2403564453125, -12.61474609375, -11.9891357421875, -11.363525390625, -10.7379150390625, -10.1123046875, -9.4866943359375, -8.861083984375, -8.2354736328125, -7.60986328125, -6.9842529296875, -6.358642578125, -5.7330322265625, -5.107421875, -4.4818115234375, -3.856201171875, -3.2305908203125, -2.60498046875, -1.9793701171875, -1.353759765625, -0.7281494140625, -0.1025390625, 0.5230712890625, 1.148681640625, 1.7742919921875, 2.39990234375, 3.0255126953125, 3.651123046875, 4.2767333984375, 4.90234375, 5.5279541015625, 6.153564453125, 6.7791748046875, 7.40478515625, 8.0303955078125, 8.656005859375, 9.2816162109375, 9.9072265625, 10.5328369140625, 11.158447265625, 11.7840576171875, 12.40966796875, 13.0352783203125, 13.660888671875, 14.2864990234375, 14.912109375, 15.5377197265625, 16.163330078125, 16.7889404296875, 17.41455078125, 18.0401611328125, 18.665771484375, 19.2913818359375, 19.9169921875, 20.5426025390625, 21.168212890625, 21.7938232421875, 22.41943359375, 23.0450439453125, 23.670654296875, 24.2962646484375, 24.921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 14.0, 27.0, 31.0, 43.0, 67.0, 109.0, 232.0, 490.0, 921.0, 1026.0, 522.0, 242.0, 124.0, 67.0, 39.0, 28.0, 16.0, 17.0, 12.0, 15.0, 10.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.46875, -19.9586181640625, -19.448486328125, -18.9383544921875, -18.42822265625, -17.9180908203125, -17.407958984375, -16.8978271484375, -16.3876953125, -15.8775634765625, -15.367431640625, -14.8572998046875, -14.34716796875, -13.8370361328125, -13.326904296875, -12.8167724609375, -12.306640625, -11.7965087890625, -11.286376953125, -10.7762451171875, -10.26611328125, -9.7559814453125, -9.245849609375, -8.7357177734375, -8.2255859375, -7.7154541015625, -7.205322265625, -6.6951904296875, -6.18505859375, -5.6749267578125, -5.164794921875, -4.6546630859375, -4.14453125, -3.6343994140625, -3.124267578125, -2.6141357421875, -2.10400390625, -1.5938720703125, -1.083740234375, -0.5736083984375, -0.0634765625, 0.4466552734375, 0.956787109375, 1.4669189453125, 1.97705078125, 2.4871826171875, 2.997314453125, 3.5074462890625, 4.017578125, 4.5277099609375, 5.037841796875, 5.5479736328125, 6.05810546875, 6.5682373046875, 7.078369140625, 7.5885009765625, 8.0986328125, 8.6087646484375, 9.118896484375, 9.6290283203125, 10.13916015625, 10.6492919921875, 11.159423828125, 11.6695556640625, 12.1796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 15.0, 73.0, 330.0, 401.0, 138.0, 27.0, 6.0, 1.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-307.48004150390625, -298.24835205078125, -289.01666259765625, -279.78497314453125, -270.55328369140625, -261.32159423828125, -252.08990478515625, -242.85821533203125, -233.62652587890625, -224.39483642578125, -215.16314697265625, -205.93145751953125, -196.69976806640625, -187.46807861328125, -178.23638916015625, -169.00469970703125, -159.77301025390625, -150.54132080078125, -141.30963134765625, -132.07794189453125, -122.84625244140625, -113.61456298828125, -104.38287353515625, -95.15118408203125, -85.91949462890625, -76.68780517578125, -67.45611572265625, -58.22442626953125, -48.99273681640625, -39.76104736328125, -30.52935791015625, -21.29766845703125, -12.06597900390625, -2.83428955078125, 6.39739990234375, 15.62908935546875, 24.86077880859375, 34.09246826171875, 43.32415771484375, 52.55584716796875, 61.78753662109375, 71.01922607421875, 80.25091552734375, 89.48260498046875, 98.71429443359375, 107.94598388671875, 117.17767333984375, 126.40936279296875, 135.64105224609375, 144.87274169921875, 154.10443115234375, 163.33612060546875, 172.56781005859375, 181.79949951171875, 191.03118896484375, 200.26287841796875, 209.49456787109375, 218.72625732421875, 227.95794677734375, 237.18963623046875, 246.42132568359375, 255.65301513671875, 264.88470458984375, 274.11639404296875, 283.34808349609375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 13.0, 14.0, 13.0, 26.0, 37.0, 40.0, 39.0, 62.0, 55.0, 58.0, 70.0, 68.0, 80.0, 77.0, 64.0, 56.0, 50.0, 49.0, 39.0, 22.0, 28.0, 9.0, 10.0, 12.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-105.33206176757812, -102.91027069091797, -100.48847961425781, -98.06668090820312, -95.64488983154297, -93.22309875488281, -90.80130767822266, -88.3795166015625, -85.95771789550781, -83.53592681884766, -81.1141357421875, -78.69233703613281, -76.27054595947266, -73.8487548828125, -71.42696380615234, -69.00517272949219, -66.5833740234375, -64.16158294677734, -61.73978805541992, -59.317996978759766, -56.896202087402344, -54.47441101074219, -52.05261993408203, -49.63082504272461, -47.20903778076172, -44.78724670410156, -42.36545181274414, -39.943660736083984, -37.52186584472656, -35.100074768066406, -32.67828369140625, -30.256488800048828, -27.834693908691406, -25.412900924682617, -22.991107940673828, -20.569316864013672, -18.14752197265625, -15.725729942321777, -13.303937911987305, -10.882144927978516, -8.460351943969727, -6.0385589599609375, -3.6167664527893066, -1.1949739456176758, 1.2268190383911133, 3.6486120223999023, 6.070404052734375, 8.492197036743164, 10.913990020751953, 13.335783004760742, 15.757575988769531, 18.179367065429688, 20.60116195678711, 23.022953033447266, 25.444746017456055, 27.866539001464844, 30.288331985473633, 32.71012496948242, 35.13191604614258, 37.5537109375, 39.975502014160156, 42.39729690551758, 44.819087982177734, 47.240882873535156, 49.66267395019531]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 2.0, 4.0, 8.0, 7.0, 10.0, 21.0, 24.0, 36.0, 57.0, 106.0, 162.0, 328.0, 771.0, 1683.0, 4439.0, 14097.0, 53101.0, 254758.0, 550649.0, 125396.0, 29212.0, 8419.0, 2976.0, 1170.0, 521.0, 235.0, 120.0, 71.0, 46.0, 36.0, 26.0, 13.0, 13.0, 7.0, 6.0, 3.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.9453125, -15.4188232421875, -14.892333984375, -14.3658447265625, -13.83935546875, -13.3128662109375, -12.786376953125, -12.2598876953125, -11.7333984375, -11.2069091796875, -10.680419921875, -10.1539306640625, -9.62744140625, -9.1009521484375, -8.574462890625, -8.0479736328125, -7.521484375, -6.9949951171875, -6.468505859375, -5.9420166015625, -5.41552734375, -4.8890380859375, -4.362548828125, -3.8360595703125, -3.3095703125, -2.7830810546875, -2.256591796875, -1.7301025390625, -1.20361328125, -0.6771240234375, -0.150634765625, 0.3758544921875, 0.90234375, 1.4288330078125, 1.955322265625, 2.4818115234375, 3.00830078125, 3.5347900390625, 4.061279296875, 4.5877685546875, 5.1142578125, 5.6407470703125, 6.167236328125, 6.6937255859375, 7.22021484375, 7.7467041015625, 8.273193359375, 8.7996826171875, 9.326171875, 9.8526611328125, 10.379150390625, 10.9056396484375, 11.43212890625, 11.9586181640625, 12.485107421875, 13.0115966796875, 13.5380859375, 14.0645751953125, 14.591064453125, 15.1175537109375, 15.64404296875, 16.1705322265625, 16.697021484375, 17.2235107421875, 17.75]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 5.0, 5.0, 14.0, 13.0, 21.0, 10.0, 23.0, 25.0, 31.0, 34.0, 29.0, 36.0, 37.0, 41.0, 45.0, 50.0, 42.0, 57.0, 57.0, 55.0, 36.0, 40.0, 43.0, 53.0, 32.0, 37.0, 23.0, 20.0, 10.0, 15.0, 8.0, 14.0, 8.0, 4.0, 7.0, 0.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.2890625, -5.1422119140625, -4.995361328125, -4.8485107421875, -4.70166015625, -4.5548095703125, -4.407958984375, -4.2611083984375, -4.1142578125, -3.9674072265625, -3.820556640625, -3.6737060546875, -3.52685546875, -3.3800048828125, -3.233154296875, -3.0863037109375, -2.939453125, -2.7926025390625, -2.645751953125, -2.4989013671875, -2.35205078125, -2.2052001953125, -2.058349609375, -1.9114990234375, -1.7646484375, -1.6177978515625, -1.470947265625, -1.3240966796875, -1.17724609375, -1.0303955078125, -0.883544921875, -0.7366943359375, -0.58984375, -0.4429931640625, -0.296142578125, -0.1492919921875, -0.00244140625, 0.1444091796875, 0.291259765625, 0.4381103515625, 0.5849609375, 0.7318115234375, 0.878662109375, 1.0255126953125, 1.17236328125, 1.3192138671875, 1.466064453125, 1.6129150390625, 1.759765625, 1.9066162109375, 2.053466796875, 2.2003173828125, 2.34716796875, 2.4940185546875, 2.640869140625, 2.7877197265625, 2.9345703125, 3.0814208984375, 3.228271484375, 3.3751220703125, 3.52197265625, 3.6688232421875, 3.815673828125, 3.9625244140625, 4.109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 13.0, 13.0, 11.0, 27.0, 24.0, 56.0, 68.0, 141.0, 251.0, 456.0, 1013.0, 2874.0, 16097.0, 639129.0, 370442.0, 13393.0, 2568.0, 942.0, 422.0, 229.0, 120.0, 73.0, 48.0, 28.0, 20.0, 22.0, 17.0, 14.0, 7.0, 6.0, 1.0, 4.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.77880859375, -37.5263671875, -36.27392578125, -35.021484375, -33.76904296875, -32.5166015625, -31.26416015625, -30.01171875, -28.75927734375, -27.5068359375, -26.25439453125, -25.001953125, -23.74951171875, -22.4970703125, -21.24462890625, -19.9921875, -18.73974609375, -17.4873046875, -16.23486328125, -14.982421875, -13.72998046875, -12.4775390625, -11.22509765625, -9.97265625, -8.72021484375, -7.4677734375, -6.21533203125, -4.962890625, -3.71044921875, -2.4580078125, -1.20556640625, 0.046875, 1.29931640625, 2.5517578125, 3.80419921875, 5.056640625, 6.30908203125, 7.5615234375, 8.81396484375, 10.06640625, 11.31884765625, 12.5712890625, 13.82373046875, 15.076171875, 16.32861328125, 17.5810546875, 18.83349609375, 20.0859375, 21.33837890625, 22.5908203125, 23.84326171875, 25.095703125, 26.34814453125, 27.6005859375, 28.85302734375, 30.10546875, 31.35791015625, 32.6103515625, 33.86279296875, 35.115234375, 36.36767578125, 37.6201171875, 38.87255859375, 40.125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 4.0, 1.0, 9.0, 11.0, 16.0, 19.0, 22.0, 16.0, 22.0, 18.0, 30.0, 27.0, 39.0, 40.0, 39.0, 42.0, 55.0, 46.0, 52.0, 46.0, 47.0, 49.0, 36.0, 51.0, 33.0, 29.0, 26.0, 27.0, 16.0, 21.0, 19.0, 14.0, 12.0, 12.0, 11.0, 8.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.1875, -16.658203125, -16.12890625, -15.599609375, -15.0703125, -14.541015625, -14.01171875, -13.482421875, -12.953125, -12.423828125, -11.89453125, -11.365234375, -10.8359375, -10.306640625, -9.77734375, -9.248046875, -8.71875, -8.189453125, -7.66015625, -7.130859375, -6.6015625, -6.072265625, -5.54296875, -5.013671875, -4.484375, -3.955078125, -3.42578125, -2.896484375, -2.3671875, -1.837890625, -1.30859375, -0.779296875, -0.25, 0.279296875, 0.80859375, 1.337890625, 1.8671875, 2.396484375, 2.92578125, 3.455078125, 3.984375, 4.513671875, 5.04296875, 5.572265625, 6.1015625, 6.630859375, 7.16015625, 7.689453125, 8.21875, 8.748046875, 9.27734375, 9.806640625, 10.3359375, 10.865234375, 11.39453125, 11.923828125, 12.453125, 12.982421875, 13.51171875, 14.041015625, 14.5703125, 15.099609375, 15.62890625, 16.158203125, 16.6875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 22.0, 10.0, 11.0, 24.0, 29.0, 48.0, 67.0, 80.0, 140.0, 176.0, 286.0, 523.0, 1155.0, 3074.0, 11471.0, 79161.0, 812112.0, 118939.0, 14749.0, 3660.0, 1298.0, 586.0, 294.0, 188.0, 123.0, 81.0, 56.0, 31.0, 43.0, 23.0, 13.0, 11.0, 14.0, 13.0, 6.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-8.2109375, -7.98016357421875, -7.7493896484375, -7.51861572265625, -7.287841796875, -7.05706787109375, -6.8262939453125, -6.59552001953125, -6.36474609375, -6.13397216796875, -5.9031982421875, -5.67242431640625, -5.441650390625, -5.21087646484375, -4.9801025390625, -4.74932861328125, -4.5185546875, -4.28778076171875, -4.0570068359375, -3.82623291015625, -3.595458984375, -3.36468505859375, -3.1339111328125, -2.90313720703125, -2.67236328125, -2.44158935546875, -2.2108154296875, -1.98004150390625, -1.749267578125, -1.51849365234375, -1.2877197265625, -1.05694580078125, -0.826171875, -0.59539794921875, -0.3646240234375, -0.13385009765625, 0.096923828125, 0.32769775390625, 0.5584716796875, 0.78924560546875, 1.02001953125, 1.25079345703125, 1.4815673828125, 1.71234130859375, 1.943115234375, 2.17388916015625, 2.4046630859375, 2.63543701171875, 2.8662109375, 3.09698486328125, 3.3277587890625, 3.55853271484375, 3.789306640625, 4.02008056640625, 4.2508544921875, 4.48162841796875, 4.71240234375, 4.94317626953125, 5.1739501953125, 5.40472412109375, 5.635498046875, 5.86627197265625, 6.0970458984375, 6.32781982421875, 6.55859375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 3.0, 8.0, 8.0, 15.0, 15.0, 14.0, 19.0, 31.0, 31.0, 56.0, 76.0, 104.0, 140.0, 140.0, 96.0, 70.0, 40.0, 15.0, 25.0, 18.0, 13.0, 10.0, 10.0, 5.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012922286987304688, -0.0012472718954086304, -0.001202315092086792, -0.0011573582887649536, -0.0011124014854431152, -0.0010674446821212769, -0.0010224878787994385, -0.0009775310754776, -0.0009325742721557617, -0.0008876174688339233, -0.000842660665512085, -0.0007977038621902466, -0.0007527470588684082, -0.0007077902555465698, -0.0006628334522247314, -0.0006178766489028931, -0.0005729198455810547, -0.0005279630422592163, -0.00048300623893737793, -0.00043804943561553955, -0.00039309263229370117, -0.0003481358289718628, -0.0003031790256500244, -0.00025822222232818604, -0.00021326541900634766, -0.00016830861568450928, -0.0001233518123626709, -7.839500904083252e-05, -3.343820571899414e-05, 1.1518597602844238e-05, 5.647540092468262e-05, 0.000101432204246521, 0.00014638900756835938, 0.00019134581089019775, 0.00023630261421203613, 0.0002812594175338745, 0.0003262162208557129, 0.00037117302417755127, 0.00041612982749938965, 0.00046108663082122803, 0.0005060434341430664, 0.0005510002374649048, 0.0005959570407867432, 0.0006409138441085815, 0.0006858706474304199, 0.0007308274507522583, 0.0007757842540740967, 0.0008207410573959351, 0.0008656978607177734, 0.0009106546640396118, 0.0009556114673614502, 0.0010005682706832886, 0.001045525074005127, 0.0010904818773269653, 0.0011354386806488037, 0.001180395483970642, 0.0012253522872924805, 0.0012703090906143188, 0.0013152658939361572, 0.0013602226972579956, 0.001405179500579834, 0.0014501363039016724, 0.0014950931072235107, 0.0015400499105453491, 0.0015850067138671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 4.0, 4.0, 8.0, 3.0, 2.0, 7.0, 17.0, 21.0, 27.0, 35.0, 48.0, 67.0, 106.0, 183.0, 272.0, 440.0, 863.0, 1754.0, 4283.0, 13872.0, 88268.0, 768827.0, 141379.0, 18408.0, 5227.0, 2069.0, 985.0, 500.0, 315.0, 183.0, 110.0, 77.0, 64.0, 40.0, 22.0, 17.0, 12.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3671875, -5.17950439453125, -4.9918212890625, -4.80413818359375, -4.616455078125, -4.42877197265625, -4.2410888671875, -4.05340576171875, -3.86572265625, -3.67803955078125, -3.4903564453125, -3.30267333984375, -3.114990234375, -2.92730712890625, -2.7396240234375, -2.55194091796875, -2.3642578125, -2.17657470703125, -1.9888916015625, -1.80120849609375, -1.613525390625, -1.42584228515625, -1.2381591796875, -1.05047607421875, -0.86279296875, -0.67510986328125, -0.4874267578125, -0.29974365234375, -0.112060546875, 0.07562255859375, 0.2633056640625, 0.45098876953125, 0.638671875, 0.82635498046875, 1.0140380859375, 1.20172119140625, 1.389404296875, 1.57708740234375, 1.7647705078125, 1.95245361328125, 2.14013671875, 2.32781982421875, 2.5155029296875, 2.70318603515625, 2.890869140625, 3.07855224609375, 3.2662353515625, 3.45391845703125, 3.6416015625, 3.82928466796875, 4.0169677734375, 4.20465087890625, 4.392333984375, 4.58001708984375, 4.7677001953125, 4.95538330078125, 5.14306640625, 5.33074951171875, 5.5184326171875, 5.70611572265625, 5.893798828125, 6.08148193359375, 6.2691650390625, 6.45684814453125, 6.64453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 14.0, 5.0, 27.0, 28.0, 25.0, 33.0, 50.0, 79.0, 108.0, 112.0, 94.0, 102.0, 75.0, 62.0, 34.0, 35.0, 24.0, 19.0, 12.0, 11.0, 8.0, 8.0, 5.0, 4.0, 0.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.4296875, -6.25689697265625, -6.0841064453125, -5.91131591796875, -5.738525390625, -5.56573486328125, -5.3929443359375, -5.22015380859375, -5.04736328125, -4.87457275390625, -4.7017822265625, -4.52899169921875, -4.356201171875, -4.18341064453125, -4.0106201171875, -3.83782958984375, -3.6650390625, -3.49224853515625, -3.3194580078125, -3.14666748046875, -2.973876953125, -2.80108642578125, -2.6282958984375, -2.45550537109375, -2.28271484375, -2.10992431640625, -1.9371337890625, -1.76434326171875, -1.591552734375, -1.41876220703125, -1.2459716796875, -1.07318115234375, -0.900390625, -0.72760009765625, -0.5548095703125, -0.38201904296875, -0.209228515625, -0.03643798828125, 0.1363525390625, 0.30914306640625, 0.48193359375, 0.65472412109375, 0.8275146484375, 1.00030517578125, 1.173095703125, 1.34588623046875, 1.5186767578125, 1.69146728515625, 1.8642578125, 2.03704833984375, 2.2098388671875, 2.38262939453125, 2.555419921875, 2.72821044921875, 2.9010009765625, 3.07379150390625, 3.24658203125, 3.41937255859375, 3.5921630859375, 3.76495361328125, 3.937744140625, 4.11053466796875, 4.2833251953125, 4.45611572265625, 4.62890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 12.0, 45.0, 129.0, 360.0, 287.0, 101.0, 38.0, 10.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-319.18878173828125, -311.5707702636719, -303.9527587890625, -296.3347473144531, -288.71673583984375, -281.0987243652344, -273.480712890625, -265.86273193359375, -258.2447204589844, -250.626708984375, -243.00869750976562, -235.39068603515625, -227.77268981933594, -220.15467834472656, -212.5366668701172, -204.9186553955078, -197.30062866210938, -189.6826171875, -182.06460571289062, -174.44659423828125, -166.82859802246094, -159.21058654785156, -151.5925750732422, -143.9745635986328, -136.3565673828125, -128.73855590820312, -121.12055206298828, -113.5025405883789, -105.88452911376953, -98.26652526855469, -90.64851379394531, -83.03050231933594, -75.41249084472656, -67.79447937011719, -60.17647171020508, -52.55846405029297, -44.940452575683594, -37.322444915771484, -29.704437255859375, -22.08642578125, -14.46841812133789, -6.850409030914307, 0.7676000595092773, 8.385608673095703, 16.003618240356445, 23.621627807617188, 31.239635467529297, 38.85764694213867, 46.47565460205078, 54.09366226196289, 61.711673736572266, 69.32968139648438, 76.94769287109375, 84.56570434570312, 92.18370819091797, 99.80171966552734, 107.41972351074219, 115.03773498535156, 122.6557388305664, 130.27374267578125, 137.89175415039062, 145.509765625, 153.12777709960938, 160.74578857421875, 168.36380004882812]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 2.0, 10.0, 12.0, 19.0, 18.0, 21.0, 30.0, 26.0, 37.0, 29.0, 36.0, 40.0, 50.0, 49.0, 56.0, 89.0, 73.0, 58.0, 44.0, 50.0, 30.0, 25.0, 27.0, 27.0, 21.0, 14.0, 16.0, 19.0, 9.0, 11.0, 7.0, 11.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.75736999511719, -58.3917350769043, -56.026100158691406, -53.66046905517578, -51.29483413696289, -48.92919921875, -46.563568115234375, -44.197933197021484, -41.832298278808594, -39.4666633605957, -37.10102844238281, -34.73539733886719, -32.3697624206543, -30.004127502441406, -27.63849449157715, -25.27286148071289, -22.9072265625, -20.54159164428711, -18.17595863342285, -15.810324668884277, -13.444690704345703, -11.079056739807129, -8.713422775268555, -6.347789764404297, -3.9821548461914062, -1.616520881652832, 0.7491130828857422, 3.1147470474243164, 5.480381011962891, 7.846014976501465, 10.211648941040039, 12.577281951904297, 14.942916870117188, 17.308551788330078, 19.674184799194336, 22.039817810058594, 24.405452728271484, 26.771087646484375, 29.136720657348633, 31.50235366821289, 33.86798858642578, 36.23362350463867, 38.59925842285156, 40.96488952636719, 43.33052444458008, 45.69615936279297, 48.061790466308594, 50.427425384521484, 52.793060302734375, 55.158695220947266, 57.524330139160156, 59.88996124267578, 62.25559616088867, 64.62123107910156, 66.98686218261719, 69.35249328613281, 71.71813201904297, 74.0837631225586, 76.44940185546875, 78.81503295898438, 81.1806640625, 83.54630279541016, 85.91193389892578, 88.27757263183594, 90.64320373535156]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 15.0, 15.0, 26.0, 50.0, 99.0, 229.0, 624.0, 2703.0, 21372.0, 2990472.0, 1161992.0, 13782.0, 1984.0, 523.0, 182.0, 93.0, 48.0, 35.0, 9.0, 14.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.29248046875, -16.5380859375, -15.78369140625, -15.029296875, -14.27490234375, -13.5205078125, -12.76611328125, -12.01171875, -11.25732421875, -10.5029296875, -9.74853515625, -8.994140625, -8.23974609375, -7.4853515625, -6.73095703125, -5.9765625, -5.22216796875, -4.4677734375, -3.71337890625, -2.958984375, -2.20458984375, -1.4501953125, -0.69580078125, 0.05859375, 0.81298828125, 1.5673828125, 2.32177734375, 3.076171875, 3.83056640625, 4.5849609375, 5.33935546875, 6.09375, 6.84814453125, 7.6025390625, 8.35693359375, 9.111328125, 9.86572265625, 10.6201171875, 11.37451171875, 12.12890625, 12.88330078125, 13.6376953125, 14.39208984375, 15.146484375, 15.90087890625, 16.6552734375, 17.40966796875, 18.1640625, 18.91845703125, 19.6728515625, 20.42724609375, 21.181640625, 21.93603515625, 22.6904296875, 23.44482421875, 24.19921875, 24.95361328125, 25.7080078125, 26.46240234375, 27.216796875, 27.97119140625, 28.7255859375, 29.47998046875, 30.234375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 10.0, 8.0, 8.0, 15.0, 18.0, 29.0, 27.0, 25.0, 27.0, 39.0, 35.0, 41.0, 44.0, 53.0, 55.0, 68.0, 70.0, 62.0, 48.0, 50.0, 40.0, 41.0, 42.0, 25.0, 31.0, 20.0, 14.0, 13.0, 8.0, 9.0, 7.0, 9.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.38067626953125, -4.2222900390625, -4.06390380859375, -3.905517578125, -3.74713134765625, -3.5887451171875, -3.43035888671875, -3.27197265625, -3.11358642578125, -2.9552001953125, -2.79681396484375, -2.638427734375, -2.48004150390625, -2.3216552734375, -2.16326904296875, -2.0048828125, -1.84649658203125, -1.6881103515625, -1.52972412109375, -1.371337890625, -1.21295166015625, -1.0545654296875, -0.89617919921875, -0.73779296875, -0.57940673828125, -0.4210205078125, -0.26263427734375, -0.104248046875, 0.05413818359375, 0.2125244140625, 0.37091064453125, 0.529296875, 0.68768310546875, 0.8460693359375, 1.00445556640625, 1.162841796875, 1.32122802734375, 1.4796142578125, 1.63800048828125, 1.79638671875, 1.95477294921875, 2.1131591796875, 2.27154541015625, 2.429931640625, 2.58831787109375, 2.7467041015625, 2.90509033203125, 3.0634765625, 3.22186279296875, 3.3802490234375, 3.53863525390625, 3.697021484375, 3.85540771484375, 4.0137939453125, 4.17218017578125, 4.33056640625, 4.48895263671875, 4.6473388671875, 4.80572509765625, 4.964111328125, 5.12249755859375, 5.2808837890625, 5.43927001953125, 5.59765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 10.0, 31.0, 38.0, 76.0, 129.0, 351.0, 880.0, 2810.0, 12946.0, 201809.0, 3885976.0, 75863.0, 9307.0, 2516.0, 816.0, 364.0, 162.0, 82.0, 44.0, 22.0, 6.0, 12.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.453125, -17.753173828125, -17.05322265625, -16.353271484375, -15.6533203125, -14.953369140625, -14.25341796875, -13.553466796875, -12.853515625, -12.153564453125, -11.45361328125, -10.753662109375, -10.0537109375, -9.353759765625, -8.65380859375, -7.953857421875, -7.25390625, -6.553955078125, -5.85400390625, -5.154052734375, -4.4541015625, -3.754150390625, -3.05419921875, -2.354248046875, -1.654296875, -0.954345703125, -0.25439453125, 0.445556640625, 1.1455078125, 1.845458984375, 2.54541015625, 3.245361328125, 3.9453125, 4.645263671875, 5.34521484375, 6.045166015625, 6.7451171875, 7.445068359375, 8.14501953125, 8.844970703125, 9.544921875, 10.244873046875, 10.94482421875, 11.644775390625, 12.3447265625, 13.044677734375, 13.74462890625, 14.444580078125, 15.14453125, 15.844482421875, 16.54443359375, 17.244384765625, 17.9443359375, 18.644287109375, 19.34423828125, 20.044189453125, 20.744140625, 21.444091796875, 22.14404296875, 22.843994140625, 23.5439453125, 24.243896484375, 24.94384765625, 25.643798828125, 26.34375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 15.0, 9.0, 27.0, 39.0, 64.0, 112.0, 243.0, 634.0, 1455.0, 846.0, 309.0, 132.0, 55.0, 49.0, 19.0, 13.0, 10.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.36865234375, -17.7685546875, -17.16845703125, -16.568359375, -15.96826171875, -15.3681640625, -14.76806640625, -14.16796875, -13.56787109375, -12.9677734375, -12.36767578125, -11.767578125, -11.16748046875, -10.5673828125, -9.96728515625, -9.3671875, -8.76708984375, -8.1669921875, -7.56689453125, -6.966796875, -6.36669921875, -5.7666015625, -5.16650390625, -4.56640625, -3.96630859375, -3.3662109375, -2.76611328125, -2.166015625, -1.56591796875, -0.9658203125, -0.36572265625, 0.234375, 0.83447265625, 1.4345703125, 2.03466796875, 2.634765625, 3.23486328125, 3.8349609375, 4.43505859375, 5.03515625, 5.63525390625, 6.2353515625, 6.83544921875, 7.435546875, 8.03564453125, 8.6357421875, 9.23583984375, 9.8359375, 10.43603515625, 11.0361328125, 11.63623046875, 12.236328125, 12.83642578125, 13.4365234375, 14.03662109375, 14.63671875, 15.23681640625, 15.8369140625, 16.43701171875, 17.037109375, 17.63720703125, 18.2373046875, 18.83740234375, 19.4375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 12.0, 70.0, 411.0, 397.0, 54.0, 30.0, 9.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-325.65704345703125, -315.499267578125, -305.34149169921875, -295.1836853027344, -285.0259094238281, -274.8681335449219, -264.7103271484375, -254.55255126953125, -244.394775390625, -234.23699951171875, -224.07920837402344, -213.92141723632812, -203.76364135742188, -193.60586547851562, -183.4480743408203, -173.290283203125, -163.13250732421875, -152.9747314453125, -142.8169403076172, -132.65914916992188, -122.50137329101562, -112.34358978271484, -102.18580627441406, -92.02802276611328, -81.8702392578125, -71.71245574951172, -61.55467224121094, -51.396888732910156, -41.239105224609375, -31.081321716308594, -20.923538208007812, -10.765754699707031, -0.608001708984375, 9.549781799316406, 19.707565307617188, 29.86534881591797, 40.02313232421875, 50.18091583251953, 60.33869934082031, 70.4964828491211, 80.65426635742188, 90.81204986572266, 100.96983337402344, 111.12761688232422, 121.285400390625, 131.44317626953125, 141.60096740722656, 151.75875854492188, 161.91653442382812, 172.07431030273438, 182.2321014404297, 192.389892578125, 202.54766845703125, 212.7054443359375, 222.8632354736328, 233.02102661132812, 243.17880249023438, 253.33657836914062, 263.494384765625, 273.65216064453125, 283.8099365234375, 293.96771240234375, 304.12548828125, 314.2832946777344, 324.4410705566406]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 9.0, 15.0, 20.0, 20.0, 32.0, 59.0, 62.0, 78.0, 86.0, 111.0, 113.0, 108.0, 97.0, 55.0, 46.0, 32.0, 23.0, 19.0, 10.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-160.99249267578125, -157.40968322753906, -153.82688903808594, -150.24407958984375, -146.66127014160156, -143.07847595214844, -139.49566650390625, -135.91287231445312, -132.33006286621094, -128.74725341796875, -125.1644515991211, -121.58164978027344, -117.99884796142578, -114.41604614257812, -110.83323669433594, -107.25043487548828, -103.66763305664062, -100.08483123779297, -96.50202178955078, -92.91921997070312, -89.33641815185547, -85.75361633300781, -82.17080688476562, -78.58800506591797, -75.00519561767578, -71.42239379882812, -67.83958435058594, -64.25678253173828, -60.673980712890625, -57.0911750793457, -53.50836944580078, -49.925567626953125, -46.34276580810547, -42.75996017456055, -39.17715835571289, -35.59435272216797, -32.01155090332031, -28.42874526977539, -24.8459415435791, -21.263137817382812, -17.680334091186523, -14.097530364990234, -10.514726638793945, -6.93192195892334, -3.349118232727051, 0.2336864471435547, 3.8164901733398438, 7.399293899536133, 10.982097625732422, 14.564901351928711, 18.147705078125, 21.730510711669922, 25.313312530517578, 28.8961181640625, 32.478919982910156, 36.06172561645508, 39.64453125, 43.22733688354492, 46.81013870239258, 50.3929443359375, 53.975746154785156, 57.55855178833008, 61.141357421875, 64.72415924072266, 68.30696105957031]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 6.0, 12.0, 26.0, 32.0, 40.0, 53.0, 101.0, 222.0, 363.0, 682.0, 1467.0, 3389.0, 8772.0, 25536.0, 84058.0, 297797.0, 420862.0, 142378.0, 40413.0, 13283.0, 5017.0, 2025.0, 899.0, 464.0, 228.0, 155.0, 85.0, 46.0, 29.0, 27.0, 15.0, 14.0, 10.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.3046875, -10.011962890625, -9.71923828125, -9.426513671875, -9.1337890625, -8.841064453125, -8.54833984375, -8.255615234375, -7.962890625, -7.670166015625, -7.37744140625, -7.084716796875, -6.7919921875, -6.499267578125, -6.20654296875, -5.913818359375, -5.62109375, -5.328369140625, -5.03564453125, -4.742919921875, -4.4501953125, -4.157470703125, -3.86474609375, -3.572021484375, -3.279296875, -2.986572265625, -2.69384765625, -2.401123046875, -2.1083984375, -1.815673828125, -1.52294921875, -1.230224609375, -0.9375, -0.644775390625, -0.35205078125, -0.059326171875, 0.2333984375, 0.526123046875, 0.81884765625, 1.111572265625, 1.404296875, 1.697021484375, 1.98974609375, 2.282470703125, 2.5751953125, 2.867919921875, 3.16064453125, 3.453369140625, 3.74609375, 4.038818359375, 4.33154296875, 4.624267578125, 4.9169921875, 5.209716796875, 5.50244140625, 5.795166015625, 6.087890625, 6.380615234375, 6.67333984375, 6.966064453125, 7.2587890625, 7.551513671875, 7.84423828125, 8.136962890625, 8.4296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 10.0, 21.0, 18.0, 28.0, 31.0, 48.0, 44.0, 43.0, 79.0, 75.0, 86.0, 82.0, 68.0, 74.0, 65.0, 56.0, 43.0, 32.0, 26.0, 20.0, 13.0, 10.0, 10.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.1102294921875, -8.876708984375, -8.6431884765625, -8.40966796875, -8.1761474609375, -7.942626953125, -7.7091064453125, -7.4755859375, -7.2420654296875, -7.008544921875, -6.7750244140625, -6.54150390625, -6.3079833984375, -6.074462890625, -5.8409423828125, -5.607421875, -5.3739013671875, -5.140380859375, -4.9068603515625, -4.67333984375, -4.4398193359375, -4.206298828125, -3.9727783203125, -3.7392578125, -3.5057373046875, -3.272216796875, -3.0386962890625, -2.80517578125, -2.5716552734375, -2.338134765625, -2.1046142578125, -1.87109375, -1.6375732421875, -1.404052734375, -1.1705322265625, -0.93701171875, -0.7034912109375, -0.469970703125, -0.2364501953125, -0.0029296875, 0.2305908203125, 0.464111328125, 0.6976318359375, 0.93115234375, 1.1646728515625, 1.398193359375, 1.6317138671875, 1.865234375, 2.0987548828125, 2.332275390625, 2.5657958984375, 2.79931640625, 3.0328369140625, 3.266357421875, 3.4998779296875, 3.7333984375, 3.9669189453125, 4.200439453125, 4.4339599609375, 4.66748046875, 4.9010009765625, 5.134521484375, 5.3680419921875, 5.6015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 4.0, 5.0, 1.0, 6.0, 12.0, 10.0, 14.0, 21.0, 31.0, 43.0, 62.0, 107.0, 159.0, 247.0, 495.0, 1034.0, 2591.0, 7056.0, 23833.0, 107951.0, 626063.0, 218672.0, 41906.0, 11233.0, 3902.0, 1478.0, 641.0, 384.0, 207.0, 142.0, 77.0, 51.0, 32.0, 13.0, 15.0, 11.0, 15.0, 10.0, 10.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.75, -12.3717041015625, -11.993408203125, -11.6151123046875, -11.23681640625, -10.8585205078125, -10.480224609375, -10.1019287109375, -9.7236328125, -9.3453369140625, -8.967041015625, -8.5887451171875, -8.21044921875, -7.8321533203125, -7.453857421875, -7.0755615234375, -6.697265625, -6.3189697265625, -5.940673828125, -5.5623779296875, -5.18408203125, -4.8057861328125, -4.427490234375, -4.0491943359375, -3.6708984375, -3.2926025390625, -2.914306640625, -2.5360107421875, -2.15771484375, -1.7794189453125, -1.401123046875, -1.0228271484375, -0.64453125, -0.2662353515625, 0.112060546875, 0.4903564453125, 0.86865234375, 1.2469482421875, 1.625244140625, 2.0035400390625, 2.3818359375, 2.7601318359375, 3.138427734375, 3.5167236328125, 3.89501953125, 4.2733154296875, 4.651611328125, 5.0299072265625, 5.408203125, 5.7864990234375, 6.164794921875, 6.5430908203125, 6.92138671875, 7.2996826171875, 7.677978515625, 8.0562744140625, 8.4345703125, 8.8128662109375, 9.191162109375, 9.5694580078125, 9.94775390625, 10.3260498046875, 10.704345703125, 11.0826416015625, 11.4609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 8.0, 2.0, 5.0, 7.0, 9.0, 7.0, 12.0, 16.0, 14.0, 22.0, 41.0, 38.0, 58.0, 49.0, 59.0, 69.0, 66.0, 55.0, 61.0, 65.0, 48.0, 59.0, 46.0, 29.0, 36.0, 23.0, 19.0, 21.0, 22.0, 10.0, 5.0, 7.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-25.734375, -25.0634765625, -24.392578125, -23.7216796875, -23.05078125, -22.3798828125, -21.708984375, -21.0380859375, -20.3671875, -19.6962890625, -19.025390625, -18.3544921875, -17.68359375, -17.0126953125, -16.341796875, -15.6708984375, -15.0, -14.3291015625, -13.658203125, -12.9873046875, -12.31640625, -11.6455078125, -10.974609375, -10.3037109375, -9.6328125, -8.9619140625, -8.291015625, -7.6201171875, -6.94921875, -6.2783203125, -5.607421875, -4.9365234375, -4.265625, -3.5947265625, -2.923828125, -2.2529296875, -1.58203125, -0.9111328125, -0.240234375, 0.4306640625, 1.1015625, 1.7724609375, 2.443359375, 3.1142578125, 3.78515625, 4.4560546875, 5.126953125, 5.7978515625, 6.46875, 7.1396484375, 7.810546875, 8.4814453125, 9.15234375, 9.8232421875, 10.494140625, 11.1650390625, 11.8359375, 12.5068359375, 13.177734375, 13.8486328125, 14.51953125, 15.1904296875, 15.861328125, 16.5322265625, 17.203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 5.0, 10.0, 16.0, 21.0, 36.0, 36.0, 65.0, 122.0, 251.0, 555.0, 1319.0, 4339.0, 20084.0, 146091.0, 737438.0, 115207.0, 16885.0, 3825.0, 1190.0, 501.0, 236.0, 112.0, 64.0, 45.0, 25.0, 22.0, 20.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.759765625, -3.643890380859375, -3.52801513671875, -3.412139892578125, -3.2962646484375, -3.180389404296875, -3.06451416015625, -2.948638916015625, -2.832763671875, -2.716888427734375, -2.60101318359375, -2.485137939453125, -2.3692626953125, -2.253387451171875, -2.13751220703125, -2.021636962890625, -1.90576171875, -1.789886474609375, -1.67401123046875, -1.558135986328125, -1.4422607421875, -1.326385498046875, -1.21051025390625, -1.094635009765625, -0.978759765625, -0.862884521484375, -0.74700927734375, -0.631134033203125, -0.5152587890625, -0.399383544921875, -0.28350830078125, -0.167633056640625, -0.0517578125, 0.064117431640625, 0.17999267578125, 0.295867919921875, 0.4117431640625, 0.527618408203125, 0.64349365234375, 0.759368896484375, 0.875244140625, 0.991119384765625, 1.10699462890625, 1.222869873046875, 1.3387451171875, 1.454620361328125, 1.57049560546875, 1.686370849609375, 1.80224609375, 1.918121337890625, 2.03399658203125, 2.149871826171875, 2.2657470703125, 2.381622314453125, 2.49749755859375, 2.613372802734375, 2.729248046875, 2.845123291015625, 2.96099853515625, 3.076873779296875, 3.1927490234375, 3.308624267578125, 3.42449951171875, 3.540374755859375, 3.65625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 15.0, 7.0, 10.0, 29.0, 44.0, 76.0, 125.0, 120.0, 155.0, 129.0, 90.0, 57.0, 48.0, 28.0, 21.0, 13.0, 8.0, 2.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000820159912109375, -0.0007879436016082764, -0.0007557272911071777, -0.0007235109806060791, -0.0006912946701049805, -0.0006590783596038818, -0.0006268620491027832, -0.0005946457386016846, -0.0005624294281005859, -0.0005302131175994873, -0.0004979968070983887, -0.00046578049659729004, -0.0004335641860961914, -0.0004013478755950928, -0.00036913156509399414, -0.0003369152545928955, -0.0003046989440917969, -0.00027248263359069824, -0.0002402663230895996, -0.00020805001258850098, -0.00017583370208740234, -0.0001436173915863037, -0.00011140108108520508, -7.918477058410645e-05, -4.696846008300781e-05, -1.475214958190918e-05, 1.7464160919189453e-05, 4.9680471420288086e-05, 8.189678192138672e-05, 0.00011411309242248535, 0.00014632940292358398, 0.00017854571342468262, 0.00021076202392578125, 0.00024297833442687988, 0.0002751946449279785, 0.00030741095542907715, 0.0003396272659301758, 0.0003718435764312744, 0.00040405988693237305, 0.0004362761974334717, 0.0004684925079345703, 0.0005007088184356689, 0.0005329251289367676, 0.0005651414394378662, 0.0005973577499389648, 0.0006295740604400635, 0.0006617903709411621, 0.0006940066814422607, 0.0007262229919433594, 0.000758439302444458, 0.0007906556129455566, 0.0008228719234466553, 0.0008550882339477539, 0.0008873045444488525, 0.0009195208549499512, 0.0009517371654510498, 0.0009839534759521484, 0.001016169786453247, 0.0010483860969543457, 0.0010806024074554443, 0.001112818717956543, 0.0011450350284576416, 0.0011772513389587402, 0.0012094676494598389, 0.0012416839599609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 9.0, 15.0, 18.0, 38.0, 49.0, 92.0, 140.0, 293.0, 850.0, 2711.0, 11483.0, 84445.0, 754784.0, 168783.0, 18984.0, 3900.0, 1159.0, 394.0, 175.0, 74.0, 66.0, 26.0, 22.0, 16.0, 11.0, 6.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.11712646484375, -1.9725341796875, -1.82794189453125, -1.683349609375, -1.53875732421875, -1.3941650390625, -1.24957275390625, -1.10498046875, -0.96038818359375, -0.8157958984375, -0.67120361328125, -0.526611328125, -0.38201904296875, -0.2374267578125, -0.09283447265625, 0.0517578125, 0.19635009765625, 0.3409423828125, 0.48553466796875, 0.630126953125, 0.77471923828125, 0.9193115234375, 1.06390380859375, 1.20849609375, 1.35308837890625, 1.4976806640625, 1.64227294921875, 1.786865234375, 1.93145751953125, 2.0760498046875, 2.22064208984375, 2.365234375, 2.50982666015625, 2.6544189453125, 2.79901123046875, 2.943603515625, 3.08819580078125, 3.2327880859375, 3.37738037109375, 3.52197265625, 3.66656494140625, 3.8111572265625, 3.95574951171875, 4.100341796875, 4.24493408203125, 4.3895263671875, 4.53411865234375, 4.6787109375, 4.82330322265625, 4.9678955078125, 5.11248779296875, 5.257080078125, 5.40167236328125, 5.5462646484375, 5.69085693359375, 5.83544921875, 5.98004150390625, 6.1246337890625, 6.26922607421875, 6.413818359375, 6.55841064453125, 6.7030029296875, 6.84759521484375, 6.9921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 8.0, 13.0, 25.0, 25.0, 34.0, 32.0, 48.0, 51.0, 62.0, 81.0, 71.0, 92.0, 87.0, 70.0, 68.0, 38.0, 30.0, 34.0, 30.0, 11.0, 26.0, 16.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.193359375, -3.09478759765625, -2.9962158203125, -2.89764404296875, -2.799072265625, -2.70050048828125, -2.6019287109375, -2.50335693359375, -2.40478515625, -2.30621337890625, -2.2076416015625, -2.10906982421875, -2.010498046875, -1.91192626953125, -1.8133544921875, -1.71478271484375, -1.6162109375, -1.51763916015625, -1.4190673828125, -1.32049560546875, -1.221923828125, -1.12335205078125, -1.0247802734375, -0.92620849609375, -0.82763671875, -0.72906494140625, -0.6304931640625, -0.53192138671875, -0.433349609375, -0.33477783203125, -0.2362060546875, -0.13763427734375, -0.0390625, 0.05950927734375, 0.1580810546875, 0.25665283203125, 0.355224609375, 0.45379638671875, 0.5523681640625, 0.65093994140625, 0.74951171875, 0.84808349609375, 0.9466552734375, 1.04522705078125, 1.143798828125, 1.24237060546875, 1.3409423828125, 1.43951416015625, 1.5380859375, 1.63665771484375, 1.7352294921875, 1.83380126953125, 1.932373046875, 2.03094482421875, 2.1295166015625, 2.22808837890625, 2.32666015625, 2.42523193359375, 2.5238037109375, 2.62237548828125, 2.720947265625, 2.81951904296875, 2.9180908203125, 3.01666259765625, 3.115234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 5.0, 8.0, 12.0, 21.0, 36.0, 69.0, 98.0, 185.0, 215.0, 130.0, 99.0, 40.0, 28.0, 18.0, 15.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.0500259399414, -80.3927993774414, -77.73558044433594, -75.07835388183594, -72.42112731933594, -69.76390075683594, -67.10667419433594, -64.44945526123047, -61.79222869873047, -59.13500213623047, -56.477779388427734, -53.820556640625, -51.163330078125, -48.506103515625, -45.848880767822266, -43.19165802001953, -40.53443145751953, -37.87720489501953, -35.2199821472168, -32.56275939941406, -29.905532836914062, -27.248308181762695, -24.591083526611328, -21.93385887145996, -19.276634216308594, -16.619409561157227, -13.96218490600586, -11.304960250854492, -8.647735595703125, -5.990510940551758, -3.3332862854003906, -0.6760616302490234, 1.981170654296875, 4.638395309448242, 7.295619964599609, 9.952844619750977, 12.610069274902344, 15.267293930053711, 17.924518585205078, 20.581743240356445, 23.238967895507812, 25.89619255065918, 28.553417205810547, 31.210641860961914, 33.86786651611328, 36.52509307861328, 39.182315826416016, 41.83953857421875, 44.49676513671875, 47.15399169921875, 49.811214447021484, 52.46843719482422, 55.12566375732422, 57.78289031982422, 60.44011306762695, 63.09733581542969, 65.75456237792969, 68.41178894042969, 71.06901550292969, 73.72623443603516, 76.38346099853516, 79.04068756103516, 81.69790649414062, 84.35513305664062, 87.01235961914062]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 9.0, 11.0, 10.0, 6.0, 14.0, 16.0, 23.0, 19.0, 22.0, 18.0, 30.0, 33.0, 30.0, 29.0, 45.0, 59.0, 66.0, 93.0, 74.0, 66.0, 33.0, 28.0, 23.0, 38.0, 41.0, 20.0, 18.0, 24.0, 19.0, 21.0, 8.0, 9.0, 5.0, 9.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-74.3485336303711, -72.12584686279297, -69.90316009521484, -67.68047332763672, -65.45779418945312, -63.235103607177734, -61.012420654296875, -58.78973388671875, -56.567047119140625, -54.3443603515625, -52.121673583984375, -49.898990631103516, -47.67630386352539, -45.453617095947266, -43.230934143066406, -41.00824737548828, -38.785560607910156, -36.56287384033203, -34.340187072753906, -32.11750411987305, -29.894817352294922, -27.672130584716797, -25.449445724487305, -23.226760864257812, -21.004074096679688, -18.781387329101562, -16.55870246887207, -14.336016654968262, -12.113330841064453, -9.890645027160645, -7.667959213256836, -5.445273399353027, -3.2225875854492188, -0.9999017715454102, 1.2227840423583984, 3.445469856262207, 5.668155670166016, 7.890841484069824, 10.113527297973633, 12.336213111877441, 14.55889892578125, 16.781585693359375, 19.004270553588867, 21.22695541381836, 23.449642181396484, 25.67232894897461, 27.8950138092041, 30.117698669433594, 32.34038543701172, 34.563072204589844, 36.78575897216797, 39.00844192504883, 41.23112869262695, 43.45381546020508, 45.67649841308594, 47.89918518066406, 50.12187194824219, 52.34455871582031, 54.56724548339844, 56.7899284362793, 59.01261520385742, 61.23530197143555, 63.457984924316406, 65.68067169189453, 67.90335845947266]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 10.0, 3.0, 11.0, 19.0, 14.0, 26.0, 57.0, 84.0, 105.0, 189.0, 289.0, 565.0, 1071.0, 2236.0, 5206.0, 15274.0, 63189.0, 478343.0, 2664506.0, 830484.0, 99318.0, 20962.0, 6883.0, 2721.0, 1283.0, 620.0, 322.0, 168.0, 126.0, 57.0, 49.0, 32.0, 13.0, 18.0, 8.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8359375, -4.6395263671875, -4.443115234375, -4.2467041015625, -4.05029296875, -3.8538818359375, -3.657470703125, -3.4610595703125, -3.2646484375, -3.0682373046875, -2.871826171875, -2.6754150390625, -2.47900390625, -2.2825927734375, -2.086181640625, -1.8897705078125, -1.693359375, -1.4969482421875, -1.300537109375, -1.1041259765625, -0.90771484375, -0.7113037109375, -0.514892578125, -0.3184814453125, -0.1220703125, 0.0743408203125, 0.270751953125, 0.4671630859375, 0.66357421875, 0.8599853515625, 1.056396484375, 1.2528076171875, 1.44921875, 1.6456298828125, 1.842041015625, 2.0384521484375, 2.23486328125, 2.4312744140625, 2.627685546875, 2.8240966796875, 3.0205078125, 3.2169189453125, 3.413330078125, 3.6097412109375, 3.80615234375, 4.0025634765625, 4.198974609375, 4.3953857421875, 4.591796875, 4.7882080078125, 4.984619140625, 5.1810302734375, 5.37744140625, 5.5738525390625, 5.770263671875, 5.9666748046875, 6.1630859375, 6.3594970703125, 6.555908203125, 6.7523193359375, 6.94873046875, 7.1451416015625, 7.341552734375, 7.5379638671875, 7.734375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 5.0, 9.0, 13.0, 10.0, 21.0, 21.0, 30.0, 33.0, 28.0, 33.0, 39.0, 34.0, 46.0, 55.0, 66.0, 46.0, 52.0, 66.0, 49.0, 44.0, 43.0, 41.0, 36.0, 25.0, 36.0, 19.0, 30.0, 14.0, 16.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.79296875, -5.6356201171875, -5.478271484375, -5.3209228515625, -5.16357421875, -5.0062255859375, -4.848876953125, -4.6915283203125, -4.5341796875, -4.3768310546875, -4.219482421875, -4.0621337890625, -3.90478515625, -3.7474365234375, -3.590087890625, -3.4327392578125, -3.275390625, -3.1180419921875, -2.960693359375, -2.8033447265625, -2.64599609375, -2.4886474609375, -2.331298828125, -2.1739501953125, -2.0166015625, -1.8592529296875, -1.701904296875, -1.5445556640625, -1.38720703125, -1.2298583984375, -1.072509765625, -0.9151611328125, -0.7578125, -0.6004638671875, -0.443115234375, -0.2857666015625, -0.12841796875, 0.0289306640625, 0.186279296875, 0.3436279296875, 0.5009765625, 0.6583251953125, 0.815673828125, 0.9730224609375, 1.13037109375, 1.2877197265625, 1.445068359375, 1.6024169921875, 1.759765625, 1.9171142578125, 2.074462890625, 2.2318115234375, 2.38916015625, 2.5465087890625, 2.703857421875, 2.8612060546875, 3.0185546875, 3.1759033203125, 3.333251953125, 3.4906005859375, 3.64794921875, 3.8052978515625, 3.962646484375, 4.1199951171875, 4.27734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 11.0, 10.0, 23.0, 28.0, 41.0, 111.0, 227.0, 588.0, 1756.0, 8276.0, 141726.0, 3934873.0, 97183.0, 6912.0, 1597.0, 512.0, 199.0, 84.0, 40.0, 26.0, 15.0, 11.0, 5.0, 8.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.078125, -15.5322265625, -14.986328125, -14.4404296875, -13.89453125, -13.3486328125, -12.802734375, -12.2568359375, -11.7109375, -11.1650390625, -10.619140625, -10.0732421875, -9.52734375, -8.9814453125, -8.435546875, -7.8896484375, -7.34375, -6.7978515625, -6.251953125, -5.7060546875, -5.16015625, -4.6142578125, -4.068359375, -3.5224609375, -2.9765625, -2.4306640625, -1.884765625, -1.3388671875, -0.79296875, -0.2470703125, 0.298828125, 0.8447265625, 1.390625, 1.9365234375, 2.482421875, 3.0283203125, 3.57421875, 4.1201171875, 4.666015625, 5.2119140625, 5.7578125, 6.3037109375, 6.849609375, 7.3955078125, 7.94140625, 8.4873046875, 9.033203125, 9.5791015625, 10.125, 10.6708984375, 11.216796875, 11.7626953125, 12.30859375, 12.8544921875, 13.400390625, 13.9462890625, 14.4921875, 15.0380859375, 15.583984375, 16.1298828125, 16.67578125, 17.2216796875, 17.767578125, 18.3134765625, 18.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 14.0, 17.0, 25.0, 29.0, 33.0, 69.0, 111.0, 174.0, 335.0, 564.0, 779.0, 726.0, 472.0, 276.0, 147.0, 94.0, 65.0, 30.0, 31.0, 22.0, 15.0, 4.0, 3.0, 4.0, 7.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-11.1484375, -10.8463134765625, -10.544189453125, -10.2420654296875, -9.93994140625, -9.6378173828125, -9.335693359375, -9.0335693359375, -8.7314453125, -8.4293212890625, -8.127197265625, -7.8250732421875, -7.52294921875, -7.2208251953125, -6.918701171875, -6.6165771484375, -6.314453125, -6.0123291015625, -5.710205078125, -5.4080810546875, -5.10595703125, -4.8038330078125, -4.501708984375, -4.1995849609375, -3.8974609375, -3.5953369140625, -3.293212890625, -2.9910888671875, -2.68896484375, -2.3868408203125, -2.084716796875, -1.7825927734375, -1.48046875, -1.1783447265625, -0.876220703125, -0.5740966796875, -0.27197265625, 0.0301513671875, 0.332275390625, 0.6343994140625, 0.9365234375, 1.2386474609375, 1.540771484375, 1.8428955078125, 2.14501953125, 2.4471435546875, 2.749267578125, 3.0513916015625, 3.353515625, 3.6556396484375, 3.957763671875, 4.2598876953125, 4.56201171875, 4.8641357421875, 5.166259765625, 5.4683837890625, 5.7705078125, 6.0726318359375, 6.374755859375, 6.6768798828125, 6.97900390625, 7.2811279296875, 7.583251953125, 7.8853759765625, 8.1875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 19.0, 32.0, 45.0, 103.0, 179.0, 184.0, 181.0, 119.0, 58.0, 25.0, 21.0, 12.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-113.70182800292969, -110.84175872802734, -107.98169708251953, -105.12162780761719, -102.26155853271484, -99.40149688720703, -96.54142761230469, -93.68136596679688, -90.82129669189453, -87.96122741699219, -85.10116577148438, -82.24109649658203, -79.38102722167969, -76.52096557617188, -73.66089630126953, -70.80082702636719, -67.94076538085938, -65.08069610595703, -62.22063064575195, -59.360565185546875, -56.5004997253418, -53.64043426513672, -50.780364990234375, -47.9202995300293, -45.06022644042969, -42.20016098022461, -39.340091705322266, -36.48002624511719, -33.61996078491211, -30.7598934173584, -27.899826049804688, -25.03976058959961, -22.17969512939453, -19.31962776184082, -16.459562301635742, -13.599494934082031, -10.739428520202637, -7.879362106323242, -5.019294738769531, -2.159229278564453, 0.7008380889892578, 3.5609047412872314, 6.420971393585205, 9.281038284301758, 12.141104698181152, 15.001171112060547, 17.861238479614258, 20.721303939819336, 23.581371307373047, 26.441438674926758, 29.301504135131836, 32.16157150268555, 35.021636962890625, 37.88170623779297, 40.74177169799805, 43.601837158203125, 46.46190643310547, 49.32197189331055, 52.18204116821289, 55.04210662841797, 57.90217208862305, 60.762237548828125, 63.62230682373047, 66.48237609863281, 69.34243774414062]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 8.0, 7.0, 11.0, 11.0, 12.0, 16.0, 27.0, 23.0, 29.0, 32.0, 32.0, 36.0, 45.0, 35.0, 31.0, 36.0, 49.0, 41.0, 38.0, 42.0, 41.0, 32.0, 43.0, 31.0, 33.0, 46.0, 29.0, 23.0, 29.0, 16.0, 17.0, 17.0, 9.0, 17.0, 6.0, 8.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-35.21644592285156, -34.16857147216797, -33.120697021484375, -32.07282257080078, -31.024946212768555, -29.97707176208496, -28.929195404052734, -27.88132095336914, -26.833446502685547, -25.785572052001953, -24.73769760131836, -23.689821243286133, -22.64194679260254, -21.594072341918945, -20.54619598388672, -19.498321533203125, -18.45044708251953, -17.402572631835938, -16.354698181152344, -15.306821823120117, -14.258947372436523, -13.21107292175293, -12.16319751739502, -11.11532211303711, -10.067447662353516, -9.019573211669922, -7.971697807312012, -6.92382287979126, -5.875947952270508, -4.828073024749756, -3.780198097229004, -2.732323169708252, -1.6844444274902344, -0.6365694999694824, 0.41130542755126953, 1.4591803550720215, 2.5070552825927734, 3.5549302101135254, 4.602805137634277, 5.650680065155029, 6.698554992675781, 7.746429920196533, 8.794304847717285, 9.842180252075195, 10.890054702758789, 11.937929153442383, 12.985804557800293, 14.033679962158203, 15.081554412841797, 16.12942886352539, 17.177303314208984, 18.22517967224121, 19.273054122924805, 20.3209285736084, 21.368804931640625, 22.41667938232422, 23.464553833007812, 24.512428283691406, 25.560302734375, 26.608179092407227, 27.65605354309082, 28.703927993774414, 29.75180435180664, 30.799678802490234, 31.847553253173828]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 13.0, 6.0, 14.0, 30.0, 31.0, 56.0, 73.0, 167.0, 302.0, 601.0, 1255.0, 2663.0, 6619.0, 17715.0, 55840.0, 208773.0, 486259.0, 188785.0, 51532.0, 16513.0, 6302.0, 2591.0, 1160.0, 591.0, 283.0, 145.0, 81.0, 47.0, 40.0, 22.0, 21.0, 7.0, 7.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.5125732421875, -9.251708984375, -8.9908447265625, -8.72998046875, -8.4691162109375, -8.208251953125, -7.9473876953125, -7.6865234375, -7.4256591796875, -7.164794921875, -6.9039306640625, -6.64306640625, -6.3822021484375, -6.121337890625, -5.8604736328125, -5.599609375, -5.3387451171875, -5.077880859375, -4.8170166015625, -4.55615234375, -4.2952880859375, -4.034423828125, -3.7735595703125, -3.5126953125, -3.2518310546875, -2.990966796875, -2.7301025390625, -2.46923828125, -2.2083740234375, -1.947509765625, -1.6866455078125, -1.42578125, -1.1649169921875, -0.904052734375, -0.6431884765625, -0.38232421875, -0.1214599609375, 0.139404296875, 0.4002685546875, 0.6611328125, 0.9219970703125, 1.182861328125, 1.4437255859375, 1.70458984375, 1.9654541015625, 2.226318359375, 2.4871826171875, 2.748046875, 3.0089111328125, 3.269775390625, 3.5306396484375, 3.79150390625, 4.0523681640625, 4.313232421875, 4.5740966796875, 4.8349609375, 5.0958251953125, 5.356689453125, 5.6175537109375, 5.87841796875, 6.1392822265625, 6.400146484375, 6.6610107421875, 6.921875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 6.0, 1.0, 7.0, 10.0, 15.0, 17.0, 18.0, 27.0, 29.0, 29.0, 24.0, 39.0, 65.0, 46.0, 46.0, 63.0, 58.0, 69.0, 56.0, 52.0, 46.0, 41.0, 43.0, 35.0, 30.0, 15.0, 25.0, 21.0, 15.0, 19.0, 10.0, 6.0, 2.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.90234375, -5.737548828125, -5.57275390625, -5.407958984375, -5.2431640625, -5.078369140625, -4.91357421875, -4.748779296875, -4.583984375, -4.419189453125, -4.25439453125, -4.089599609375, -3.9248046875, -3.760009765625, -3.59521484375, -3.430419921875, -3.265625, -3.100830078125, -2.93603515625, -2.771240234375, -2.6064453125, -2.441650390625, -2.27685546875, -2.112060546875, -1.947265625, -1.782470703125, -1.61767578125, -1.452880859375, -1.2880859375, -1.123291015625, -0.95849609375, -0.793701171875, -0.62890625, -0.464111328125, -0.29931640625, -0.134521484375, 0.0302734375, 0.195068359375, 0.35986328125, 0.524658203125, 0.689453125, 0.854248046875, 1.01904296875, 1.183837890625, 1.3486328125, 1.513427734375, 1.67822265625, 1.843017578125, 2.0078125, 2.172607421875, 2.33740234375, 2.502197265625, 2.6669921875, 2.831787109375, 2.99658203125, 3.161376953125, 3.326171875, 3.490966796875, 3.65576171875, 3.820556640625, 3.9853515625, 4.150146484375, 4.31494140625, 4.479736328125, 4.64453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 9.0, 8.0, 10.0, 7.0, 13.0, 16.0, 27.0, 21.0, 45.0, 49.0, 53.0, 84.0, 129.0, 174.0, 308.0, 464.0, 892.0, 1719.0, 4755.0, 19405.0, 142751.0, 763619.0, 92334.0, 14306.0, 3825.0, 1453.0, 770.0, 426.0, 290.0, 180.0, 129.0, 78.0, 56.0, 40.0, 29.0, 29.0, 11.0, 12.0, 9.0, 6.0, 7.0, 4.0, 6.0, 1.0, 1.0, 3.0], "bins": [-16.546875, -16.126953125, -15.70703125, -15.287109375, -14.8671875, -14.447265625, -14.02734375, -13.607421875, -13.1875, -12.767578125, -12.34765625, -11.927734375, -11.5078125, -11.087890625, -10.66796875, -10.248046875, -9.828125, -9.408203125, -8.98828125, -8.568359375, -8.1484375, -7.728515625, -7.30859375, -6.888671875, -6.46875, -6.048828125, -5.62890625, -5.208984375, -4.7890625, -4.369140625, -3.94921875, -3.529296875, -3.109375, -2.689453125, -2.26953125, -1.849609375, -1.4296875, -1.009765625, -0.58984375, -0.169921875, 0.25, 0.669921875, 1.08984375, 1.509765625, 1.9296875, 2.349609375, 2.76953125, 3.189453125, 3.609375, 4.029296875, 4.44921875, 4.869140625, 5.2890625, 5.708984375, 6.12890625, 6.548828125, 6.96875, 7.388671875, 7.80859375, 8.228515625, 8.6484375, 9.068359375, 9.48828125, 9.908203125, 10.328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 7.0, 12.0, 12.0, 19.0, 18.0, 34.0, 41.0, 39.0, 56.0, 56.0, 54.0, 64.0, 55.0, 59.0, 61.0, 59.0, 59.0, 63.0, 38.0, 32.0, 22.0, 29.0, 21.0, 15.0, 9.0, 11.0, 10.0, 8.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.484375, -20.9072265625, -20.330078125, -19.7529296875, -19.17578125, -18.5986328125, -18.021484375, -17.4443359375, -16.8671875, -16.2900390625, -15.712890625, -15.1357421875, -14.55859375, -13.9814453125, -13.404296875, -12.8271484375, -12.25, -11.6728515625, -11.095703125, -10.5185546875, -9.94140625, -9.3642578125, -8.787109375, -8.2099609375, -7.6328125, -7.0556640625, -6.478515625, -5.9013671875, -5.32421875, -4.7470703125, -4.169921875, -3.5927734375, -3.015625, -2.4384765625, -1.861328125, -1.2841796875, -0.70703125, -0.1298828125, 0.447265625, 1.0244140625, 1.6015625, 2.1787109375, 2.755859375, 3.3330078125, 3.91015625, 4.4873046875, 5.064453125, 5.6416015625, 6.21875, 6.7958984375, 7.373046875, 7.9501953125, 8.52734375, 9.1044921875, 9.681640625, 10.2587890625, 10.8359375, 11.4130859375, 11.990234375, 12.5673828125, 13.14453125, 13.7216796875, 14.298828125, 14.8759765625, 15.453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 11.0, 6.0, 4.0, 10.0, 16.0, 15.0, 29.0, 49.0, 69.0, 96.0, 155.0, 265.0, 516.0, 1020.0, 2470.0, 6352.0, 19964.0, 93900.0, 750917.0, 134075.0, 25604.0, 7541.0, 2830.0, 1240.0, 546.0, 301.0, 183.0, 119.0, 68.0, 52.0, 35.0, 14.0, 18.0, 13.0, 11.0, 3.0, 4.0, 10.0, 0.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4453125, -3.342742919921875, -3.24017333984375, -3.137603759765625, -3.0350341796875, -2.932464599609375, -2.82989501953125, -2.727325439453125, -2.624755859375, -2.522186279296875, -2.41961669921875, -2.317047119140625, -2.2144775390625, -2.111907958984375, -2.00933837890625, -1.906768798828125, -1.80419921875, -1.701629638671875, -1.59906005859375, -1.496490478515625, -1.3939208984375, -1.291351318359375, -1.18878173828125, -1.086212158203125, -0.983642578125, -0.881072998046875, -0.77850341796875, -0.675933837890625, -0.5733642578125, -0.470794677734375, -0.36822509765625, -0.265655517578125, -0.1630859375, -0.060516357421875, 0.04205322265625, 0.144622802734375, 0.2471923828125, 0.349761962890625, 0.45233154296875, 0.554901123046875, 0.657470703125, 0.760040283203125, 0.86260986328125, 0.965179443359375, 1.0677490234375, 1.170318603515625, 1.27288818359375, 1.375457763671875, 1.47802734375, 1.580596923828125, 1.68316650390625, 1.785736083984375, 1.8883056640625, 1.990875244140625, 2.09344482421875, 2.196014404296875, 2.298583984375, 2.401153564453125, 2.50372314453125, 2.606292724609375, 2.7088623046875, 2.811431884765625, 2.91400146484375, 3.016571044921875, 3.119140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 2.0, 5.0, 11.0, 7.0, 9.0, 14.0, 14.0, 26.0, 36.0, 42.0, 63.0, 93.0, 114.0, 159.0, 100.0, 95.0, 53.0, 43.0, 28.0, 20.0, 13.0, 7.0, 5.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0006971359252929688, -0.0006725043058395386, -0.0006478726863861084, -0.0006232410669326782, -0.000598609447479248, -0.0005739778280258179, -0.0005493462085723877, -0.0005247145891189575, -0.0005000829696655273, -0.00047545135021209717, -0.000450819730758667, -0.0004261881113052368, -0.00040155649185180664, -0.00037692487239837646, -0.0003522932529449463, -0.0003276616334915161, -0.00030303001403808594, -0.00027839839458465576, -0.0002537667751312256, -0.0002291351556777954, -0.00020450353622436523, -0.00017987191677093506, -0.00015524029731750488, -0.0001306086778640747, -0.00010597705841064453, -8.134543895721436e-05, -5.671381950378418e-05, -3.2082200050354004e-05, -7.450580596923828e-06, 1.7181038856506348e-05, 4.1812658309936523e-05, 6.64442777633667e-05, 9.107589721679688e-05, 0.00011570751667022705, 0.00014033913612365723, 0.0001649707555770874, 0.00018960237503051758, 0.00021423399448394775, 0.00023886561393737793, 0.0002634972333908081, 0.0002881288528442383, 0.00031276047229766846, 0.00033739209175109863, 0.0003620237112045288, 0.000386655330657959, 0.00041128695011138916, 0.00043591856956481934, 0.0004605501890182495, 0.0004851818084716797, 0.0005098134279251099, 0.00053444504737854, 0.0005590766668319702, 0.0005837082862854004, 0.0006083399057388306, 0.0006329715251922607, 0.0006576031446456909, 0.0006822347640991211, 0.0007068663835525513, 0.0007314980030059814, 0.0007561296224594116, 0.0007807612419128418, 0.000805392861366272, 0.0008300244808197021, 0.0008546561002731323, 0.0008792877197265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 11.0, 16.0, 12.0, 23.0, 37.0, 45.0, 66.0, 104.0, 169.0, 291.0, 494.0, 982.0, 2256.0, 6351.0, 22782.0, 126814.0, 756813.0, 101585.0, 19813.0, 5569.0, 2121.0, 962.0, 483.0, 248.0, 152.0, 95.0, 72.0, 45.0, 30.0, 24.0, 17.0, 10.0, 10.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.552734375, -3.4432373046875, -3.333740234375, -3.2242431640625, -3.11474609375, -3.0052490234375, -2.895751953125, -2.7862548828125, -2.6767578125, -2.5672607421875, -2.457763671875, -2.3482666015625, -2.23876953125, -2.1292724609375, -2.019775390625, -1.9102783203125, -1.80078125, -1.6912841796875, -1.581787109375, -1.4722900390625, -1.36279296875, -1.2532958984375, -1.143798828125, -1.0343017578125, -0.9248046875, -0.8153076171875, -0.705810546875, -0.5963134765625, -0.48681640625, -0.3773193359375, -0.267822265625, -0.1583251953125, -0.048828125, 0.0606689453125, 0.170166015625, 0.2796630859375, 0.38916015625, 0.4986572265625, 0.608154296875, 0.7176513671875, 0.8271484375, 0.9366455078125, 1.046142578125, 1.1556396484375, 1.26513671875, 1.3746337890625, 1.484130859375, 1.5936279296875, 1.703125, 1.8126220703125, 1.922119140625, 2.0316162109375, 2.14111328125, 2.2506103515625, 2.360107421875, 2.4696044921875, 2.5791015625, 2.6885986328125, 2.798095703125, 2.9075927734375, 3.01708984375, 3.1265869140625, 3.236083984375, 3.3455810546875, 3.455078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 3.0, 4.0, 6.0, 11.0, 18.0, 18.0, 15.0, 34.0, 56.0, 58.0, 78.0, 116.0, 118.0, 105.0, 104.0, 64.0, 45.0, 28.0, 31.0, 21.0, 9.0, 11.0, 6.0, 5.0, 5.0, 1.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.6328125, -3.52740478515625, -3.4219970703125, -3.31658935546875, -3.211181640625, -3.10577392578125, -3.0003662109375, -2.89495849609375, -2.78955078125, -2.68414306640625, -2.5787353515625, -2.47332763671875, -2.367919921875, -2.26251220703125, -2.1571044921875, -2.05169677734375, -1.9462890625, -1.84088134765625, -1.7354736328125, -1.63006591796875, -1.524658203125, -1.41925048828125, -1.3138427734375, -1.20843505859375, -1.10302734375, -0.99761962890625, -0.8922119140625, -0.78680419921875, -0.681396484375, -0.57598876953125, -0.4705810546875, -0.36517333984375, -0.259765625, -0.15435791015625, -0.0489501953125, 0.05645751953125, 0.161865234375, 0.26727294921875, 0.3726806640625, 0.47808837890625, 0.58349609375, 0.68890380859375, 0.7943115234375, 0.89971923828125, 1.005126953125, 1.11053466796875, 1.2159423828125, 1.32135009765625, 1.4267578125, 1.53216552734375, 1.6375732421875, 1.74298095703125, 1.848388671875, 1.95379638671875, 2.0592041015625, 2.16461181640625, 2.27001953125, 2.37542724609375, 2.4808349609375, 2.58624267578125, 2.691650390625, 2.79705810546875, 2.9024658203125, 3.00787353515625, 3.11328125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 2.0, 7.0, 13.0, 21.0, 59.0, 137.0, 294.0, 241.0, 115.0, 51.0, 27.0, 7.0, 3.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.01658630371094, -49.671199798583984, -46.32581329345703, -42.98042678833008, -39.635040283203125, -36.28965377807617, -32.94426727294922, -29.598880767822266, -26.253494262695312, -22.90810775756836, -19.562721252441406, -16.217334747314453, -12.8719482421875, -9.526561737060547, -6.181175231933594, -2.8357887268066406, 0.5095977783203125, 3.8549842834472656, 7.200370788574219, 10.545757293701172, 13.891143798828125, 17.236530303955078, 20.58191680908203, 23.927303314208984, 27.272689819335938, 30.61807632446289, 33.963462829589844, 37.3088493347168, 40.65423583984375, 43.9996223449707, 47.345008850097656, 50.69039535522461, 54.03578186035156, 57.381168365478516, 60.72655487060547, 64.07194519042969, 67.41732788085938, 70.76271057128906, 74.10810089111328, 77.4534912109375, 80.79887390136719, 84.14425659179688, 87.4896469116211, 90.83503723144531, 94.180419921875, 97.52580261230469, 100.8711929321289, 104.21658325195312, 107.56196594238281, 110.9073486328125, 114.25273895263672, 117.59812927246094, 120.94351196289062, 124.28889465332031, 127.63428497314453, 130.97967529296875, 134.32505798339844, 137.67044067382812, 141.01583862304688, 144.36122131347656, 147.70660400390625, 151.05198669433594, 154.39736938476562, 157.74276733398438, 161.08815002441406]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 12.0, 9.0, 9.0, 8.0, 10.0, 11.0, 8.0, 16.0, 14.0, 25.0, 27.0, 24.0, 32.0, 16.0, 47.0, 29.0, 47.0, 64.0, 102.0, 95.0, 62.0, 45.0, 30.0, 31.0, 27.0, 26.0, 32.0, 26.0, 20.0, 7.0, 17.0, 11.0, 8.0, 8.0, 9.0, 8.0, 4.0, 6.0, 4.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-48.36821365356445, -46.6351318359375, -44.90205001831055, -43.168968200683594, -41.43588638305664, -39.70280456542969, -37.969722747802734, -36.23664093017578, -34.50355911254883, -32.770477294921875, -31.037395477294922, -29.30431365966797, -27.571231842041016, -25.838150024414062, -24.10506820678711, -22.371986389160156, -20.638904571533203, -18.90582275390625, -17.172740936279297, -15.439659118652344, -13.70657730102539, -11.973495483398438, -10.240413665771484, -8.507331848144531, -6.774250030517578, -5.041168212890625, -3.308086395263672, -1.5750045776367188, 0.15807723999023438, 1.8911590576171875, 3.6242408752441406, 5.357322692871094, 7.090400695800781, 8.823482513427734, 10.556564331054688, 12.28964614868164, 14.022727966308594, 15.755809783935547, 17.4888916015625, 19.221973419189453, 20.955055236816406, 22.68813705444336, 24.421218872070312, 26.154300689697266, 27.88738250732422, 29.620464324951172, 31.353546142578125, 33.08662796020508, 34.81970977783203, 36.552791595458984, 38.28587341308594, 40.01895523071289, 41.752037048339844, 43.4851188659668, 45.21820068359375, 46.9512825012207, 48.684364318847656, 50.41744613647461, 52.15052795410156, 53.883609771728516, 55.61669158935547, 57.34977340698242, 59.082855224609375, 60.81593704223633, 62.54901885986328]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 13.0, 18.0, 32.0, 54.0, 108.0, 241.0, 627.0, 1807.0, 7019.0, 44251.0, 717607.0, 3096175.0, 294392.0, 24929.0, 4741.0, 1352.0, 494.0, 218.0, 73.0, 41.0, 28.0, 16.0, 13.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.034423828125, -7.74072265625, -7.447021484375, -7.1533203125, -6.859619140625, -6.56591796875, -6.272216796875, -5.978515625, -5.684814453125, -5.39111328125, -5.097412109375, -4.8037109375, -4.510009765625, -4.21630859375, -3.922607421875, -3.62890625, -3.335205078125, -3.04150390625, -2.747802734375, -2.4541015625, -2.160400390625, -1.86669921875, -1.572998046875, -1.279296875, -0.985595703125, -0.69189453125, -0.398193359375, -0.1044921875, 0.189208984375, 0.48291015625, 0.776611328125, 1.0703125, 1.364013671875, 1.65771484375, 1.951416015625, 2.2451171875, 2.538818359375, 2.83251953125, 3.126220703125, 3.419921875, 3.713623046875, 4.00732421875, 4.301025390625, 4.5947265625, 4.888427734375, 5.18212890625, 5.475830078125, 5.76953125, 6.063232421875, 6.35693359375, 6.650634765625, 6.9443359375, 7.238037109375, 7.53173828125, 7.825439453125, 8.119140625, 8.412841796875, 8.70654296875, 9.000244140625, 9.2939453125, 9.587646484375, 9.88134765625, 10.175048828125, 10.46875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 4.0, 2.0, 8.0, 14.0, 12.0, 10.0, 26.0, 19.0, 26.0, 22.0, 28.0, 26.0, 37.0, 39.0, 41.0, 62.0, 63.0, 35.0, 46.0, 46.0, 56.0, 58.0, 34.0, 32.0, 33.0, 32.0, 26.0, 30.0, 26.0, 15.0, 16.0, 14.0, 16.0, 16.0, 15.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.0859375, -4.946746826171875, -4.80755615234375, -4.668365478515625, -4.5291748046875, -4.389984130859375, -4.25079345703125, -4.111602783203125, -3.972412109375, -3.833221435546875, -3.69403076171875, -3.554840087890625, -3.4156494140625, -3.276458740234375, -3.13726806640625, -2.998077392578125, -2.85888671875, -2.719696044921875, -2.58050537109375, -2.441314697265625, -2.3021240234375, -2.162933349609375, -2.02374267578125, -1.884552001953125, -1.745361328125, -1.606170654296875, -1.46697998046875, -1.327789306640625, -1.1885986328125, -1.049407958984375, -0.91021728515625, -0.771026611328125, -0.6318359375, -0.492645263671875, -0.35345458984375, -0.214263916015625, -0.0750732421875, 0.064117431640625, 0.20330810546875, 0.342498779296875, 0.481689453125, 0.620880126953125, 0.76007080078125, 0.899261474609375, 1.0384521484375, 1.177642822265625, 1.31683349609375, 1.456024169921875, 1.59521484375, 1.734405517578125, 1.87359619140625, 2.012786865234375, 2.1519775390625, 2.291168212890625, 2.43035888671875, 2.569549560546875, 2.708740234375, 2.847930908203125, 2.98712158203125, 3.126312255859375, 3.2655029296875, 3.404693603515625, 3.54388427734375, 3.683074951171875, 3.822265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 11.0, 22.0, 27.0, 47.0, 76.0, 156.0, 337.0, 862.0, 4744.0, 88151.0, 3985438.0, 107423.0, 5325.0, 926.0, 360.0, 168.0, 100.0, 43.0, 26.0, 8.0, 7.0, 7.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8671875, -15.2906494140625, -14.714111328125, -14.1375732421875, -13.56103515625, -12.9844970703125, -12.407958984375, -11.8314208984375, -11.2548828125, -10.6783447265625, -10.101806640625, -9.5252685546875, -8.94873046875, -8.3721923828125, -7.795654296875, -7.2191162109375, -6.642578125, -6.0660400390625, -5.489501953125, -4.9129638671875, -4.33642578125, -3.7598876953125, -3.183349609375, -2.6068115234375, -2.0302734375, -1.4537353515625, -0.877197265625, -0.3006591796875, 0.27587890625, 0.8524169921875, 1.428955078125, 2.0054931640625, 2.58203125, 3.1585693359375, 3.735107421875, 4.3116455078125, 4.88818359375, 5.4647216796875, 6.041259765625, 6.6177978515625, 7.1943359375, 7.7708740234375, 8.347412109375, 8.9239501953125, 9.50048828125, 10.0770263671875, 10.653564453125, 11.2301025390625, 11.806640625, 12.3831787109375, 12.959716796875, 13.5362548828125, 14.11279296875, 14.6893310546875, 15.265869140625, 15.8424072265625, 16.4189453125, 16.9954833984375, 17.572021484375, 18.1485595703125, 18.72509765625, 19.3016357421875, 19.878173828125, 20.4547119140625, 21.03125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 12.0, 19.0, 18.0, 58.0, 107.0, 189.0, 447.0, 826.0, 1045.0, 660.0, 326.0, 131.0, 99.0, 53.0, 32.0, 11.0, 13.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.73828125, -7.29193115234375, -6.8455810546875, -6.39923095703125, -5.952880859375, -5.50653076171875, -5.0601806640625, -4.61383056640625, -4.16748046875, -3.72113037109375, -3.2747802734375, -2.82843017578125, -2.382080078125, -1.93572998046875, -1.4893798828125, -1.04302978515625, -0.5966796875, -0.15032958984375, 0.2960205078125, 0.74237060546875, 1.188720703125, 1.63507080078125, 2.0814208984375, 2.52777099609375, 2.97412109375, 3.42047119140625, 3.8668212890625, 4.31317138671875, 4.759521484375, 5.20587158203125, 5.6522216796875, 6.09857177734375, 6.544921875, 6.99127197265625, 7.4376220703125, 7.88397216796875, 8.330322265625, 8.77667236328125, 9.2230224609375, 9.66937255859375, 10.11572265625, 10.56207275390625, 11.0084228515625, 11.45477294921875, 11.901123046875, 12.34747314453125, 12.7938232421875, 13.24017333984375, 13.6865234375, 14.13287353515625, 14.5792236328125, 15.02557373046875, 15.471923828125, 15.91827392578125, 16.3646240234375, 16.81097412109375, 17.25732421875, 17.70367431640625, 18.1500244140625, 18.59637451171875, 19.042724609375, 19.48907470703125, 19.9354248046875, 20.38177490234375, 20.828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 11.0, 6.0, 18.0, 30.0, 46.0, 109.0, 215.0, 216.0, 171.0, 76.0, 45.0, 23.0, 13.0, 5.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.12738037109375, -125.0787353515625, -122.03008270263672, -118.98143005371094, -115.93278503417969, -112.88414001464844, -109.83548736572266, -106.78683471679688, -103.73818969726562, -100.68954467773438, -97.6408920288086, -94.59223937988281, -91.54359436035156, -88.49494934082031, -85.44629669189453, -82.39764404296875, -79.3489990234375, -76.30035400390625, -73.25170135498047, -70.20304870605469, -67.15440368652344, -64.10575866699219, -61.057106018066406, -58.00845718383789, -54.959808349609375, -51.91115951538086, -48.862510681152344, -45.81386184692383, -42.76521301269531, -39.7165641784668, -36.66791534423828, -33.619266510009766, -30.57061767578125, -27.521968841552734, -24.47332000732422, -21.424671173095703, -18.376022338867188, -15.327373504638672, -12.278724670410156, -9.23007583618164, -6.181427001953125, -3.1327781677246094, -0.08412933349609375, 2.964519500732422, 6.0131683349609375, 9.061817169189453, 12.110466003417969, 15.159114837646484, 18.207763671875, 21.256412506103516, 24.30506134033203, 27.353710174560547, 30.402359008789062, 33.45100784301758, 36.499656677246094, 39.54830551147461, 42.596954345703125, 45.64560317993164, 48.694252014160156, 51.74290084838867, 54.79154968261719, 57.8401985168457, 60.88884735107422, 63.937496185302734, 66.98614501953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 8.0, 9.0, 8.0, 10.0, 19.0, 15.0, 20.0, 19.0, 31.0, 28.0, 35.0, 37.0, 32.0, 42.0, 44.0, 48.0, 64.0, 69.0, 57.0, 52.0, 49.0, 41.0, 42.0, 37.0, 26.0, 21.0, 28.0, 18.0, 20.0, 12.0, 14.0, 9.0, 7.0, 4.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.152992248535156, -33.865177154541016, -32.577362060546875, -31.289546966552734, -30.001731872558594, -28.713916778564453, -27.42609977722168, -26.13828468322754, -24.8504695892334, -23.562654495239258, -22.274839401245117, -20.987024307250977, -19.699207305908203, -18.411392211914062, -17.123577117919922, -15.835762023925781, -14.54794692993164, -13.2601318359375, -11.97231674194336, -10.684500694274902, -9.396685600280762, -8.108870506286621, -6.821054935455322, -5.533239364624023, -4.245424270629883, -2.957608938217163, -1.6697936058044434, -0.38197827339172363, 0.9058370590209961, 2.1936521530151367, 3.4814677238464355, 4.769283294677734, 6.057098388671875, 7.344913482666016, 8.632728576660156, 9.920544624328613, 11.208359718322754, 12.496174812316895, 13.783990859985352, 15.071805953979492, 16.359621047973633, 17.647436141967773, 18.935251235961914, 20.223066329956055, 21.510883331298828, 22.79869842529297, 24.08651351928711, 25.37432861328125, 26.66214370727539, 27.94995880126953, 29.237773895263672, 30.525588989257812, 31.813404083251953, 33.101219177246094, 34.389034271240234, 35.676849365234375, 36.96466827392578, 38.25248336791992, 39.54029846191406, 40.8281135559082, 42.115928649902344, 43.403743743896484, 44.691558837890625, 45.97937774658203, 47.267189025878906]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 9.0, 9.0, 22.0, 30.0, 26.0, 37.0, 59.0, 116.0, 165.0, 237.0, 385.0, 692.0, 1121.0, 2125.0, 4206.0, 9012.0, 20932.0, 53353.0, 158713.0, 416834.0, 247278.0, 79607.0, 29255.0, 12242.0, 5587.0, 2738.0, 1502.0, 846.0, 495.0, 352.0, 188.0, 121.0, 83.0, 45.0, 43.0, 15.0, 12.0, 14.0, 9.0, 4.0, 8.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.4296875, -6.213134765625, -5.99658203125, -5.780029296875, -5.5634765625, -5.346923828125, -5.13037109375, -4.913818359375, -4.697265625, -4.480712890625, -4.26416015625, -4.047607421875, -3.8310546875, -3.614501953125, -3.39794921875, -3.181396484375, -2.96484375, -2.748291015625, -2.53173828125, -2.315185546875, -2.0986328125, -1.882080078125, -1.66552734375, -1.448974609375, -1.232421875, -1.015869140625, -0.79931640625, -0.582763671875, -0.3662109375, -0.149658203125, 0.06689453125, 0.283447265625, 0.5, 0.716552734375, 0.93310546875, 1.149658203125, 1.3662109375, 1.582763671875, 1.79931640625, 2.015869140625, 2.232421875, 2.448974609375, 2.66552734375, 2.882080078125, 3.0986328125, 3.315185546875, 3.53173828125, 3.748291015625, 3.96484375, 4.181396484375, 4.39794921875, 4.614501953125, 4.8310546875, 5.047607421875, 5.26416015625, 5.480712890625, 5.697265625, 5.913818359375, 6.13037109375, 6.346923828125, 6.5634765625, 6.780029296875, 6.99658203125, 7.213134765625, 7.4296875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 3.0, 6.0, 8.0, 8.0, 7.0, 21.0, 12.0, 29.0, 26.0, 31.0, 34.0, 45.0, 46.0, 38.0, 48.0, 61.0, 42.0, 53.0, 45.0, 55.0, 55.0, 39.0, 36.0, 38.0, 28.0, 24.0, 32.0, 24.0, 17.0, 18.0, 14.0, 10.0, 7.0, 5.0, 12.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.9156494140625, -4.764892578125, -4.6141357421875, -4.46337890625, -4.3126220703125, -4.161865234375, -4.0111083984375, -3.8603515625, -3.7095947265625, -3.558837890625, -3.4080810546875, -3.25732421875, -3.1065673828125, -2.955810546875, -2.8050537109375, -2.654296875, -2.5035400390625, -2.352783203125, -2.2020263671875, -2.05126953125, -1.9005126953125, -1.749755859375, -1.5989990234375, -1.4482421875, -1.2974853515625, -1.146728515625, -0.9959716796875, -0.84521484375, -0.6944580078125, -0.543701171875, -0.3929443359375, -0.2421875, -0.0914306640625, 0.059326171875, 0.2100830078125, 0.36083984375, 0.5115966796875, 0.662353515625, 0.8131103515625, 0.9638671875, 1.1146240234375, 1.265380859375, 1.4161376953125, 1.56689453125, 1.7176513671875, 1.868408203125, 2.0191650390625, 2.169921875, 2.3206787109375, 2.471435546875, 2.6221923828125, 2.77294921875, 2.9237060546875, 3.074462890625, 3.2252197265625, 3.3759765625, 3.5267333984375, 3.677490234375, 3.8282470703125, 3.97900390625, 4.1297607421875, 4.280517578125, 4.4312744140625, 4.58203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 5.0, 9.0, 6.0, 7.0, 13.0, 16.0, 21.0, 30.0, 34.0, 47.0, 68.0, 116.0, 148.0, 211.0, 317.0, 516.0, 954.0, 1755.0, 5239.0, 27264.0, 706987.0, 276532.0, 19899.0, 4419.0, 1691.0, 790.0, 497.0, 301.0, 199.0, 128.0, 81.0, 67.0, 47.0, 33.0, 22.0, 23.0, 18.0, 17.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.9921875, -15.4749755859375, -14.957763671875, -14.4405517578125, -13.92333984375, -13.4061279296875, -12.888916015625, -12.3717041015625, -11.8544921875, -11.3372802734375, -10.820068359375, -10.3028564453125, -9.78564453125, -9.2684326171875, -8.751220703125, -8.2340087890625, -7.716796875, -7.1995849609375, -6.682373046875, -6.1651611328125, -5.64794921875, -5.1307373046875, -4.613525390625, -4.0963134765625, -3.5791015625, -3.0618896484375, -2.544677734375, -2.0274658203125, -1.51025390625, -0.9930419921875, -0.475830078125, 0.0413818359375, 0.55859375, 1.0758056640625, 1.593017578125, 2.1102294921875, 2.62744140625, 3.1446533203125, 3.661865234375, 4.1790771484375, 4.6962890625, 5.2135009765625, 5.730712890625, 6.2479248046875, 6.76513671875, 7.2823486328125, 7.799560546875, 8.3167724609375, 8.833984375, 9.3511962890625, 9.868408203125, 10.3856201171875, 10.90283203125, 11.4200439453125, 11.937255859375, 12.4544677734375, 12.9716796875, 13.4888916015625, 14.006103515625, 14.5233154296875, 15.04052734375, 15.5577392578125, 16.074951171875, 16.5921630859375, 17.109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 12.0, 12.0, 13.0, 14.0, 19.0, 15.0, 16.0, 32.0, 40.0, 47.0, 48.0, 50.0, 52.0, 71.0, 63.0, 51.0, 70.0, 64.0, 57.0, 45.0, 29.0, 34.0, 25.0, 22.0, 19.0, 9.0, 4.0, 13.0, 6.0, 7.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.734375, -19.169677734375, -18.60498046875, -18.040283203125, -17.4755859375, -16.910888671875, -16.34619140625, -15.781494140625, -15.216796875, -14.652099609375, -14.08740234375, -13.522705078125, -12.9580078125, -12.393310546875, -11.82861328125, -11.263916015625, -10.69921875, -10.134521484375, -9.56982421875, -9.005126953125, -8.4404296875, -7.875732421875, -7.31103515625, -6.746337890625, -6.181640625, -5.616943359375, -5.05224609375, -4.487548828125, -3.9228515625, -3.358154296875, -2.79345703125, -2.228759765625, -1.6640625, -1.099365234375, -0.53466796875, 0.030029296875, 0.5947265625, 1.159423828125, 1.72412109375, 2.288818359375, 2.853515625, 3.418212890625, 3.98291015625, 4.547607421875, 5.1123046875, 5.677001953125, 6.24169921875, 6.806396484375, 7.37109375, 7.935791015625, 8.50048828125, 9.065185546875, 9.6298828125, 10.194580078125, 10.75927734375, 11.323974609375, 11.888671875, 12.453369140625, 13.01806640625, 13.582763671875, 14.1474609375, 14.712158203125, 15.27685546875, 15.841552734375, 16.40625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 11.0, 10.0, 10.0, 10.0, 19.0, 25.0, 33.0, 35.0, 47.0, 66.0, 98.0, 137.0, 293.0, 584.0, 1482.0, 4899.0, 36125.0, 956583.0, 39679.0, 5371.0, 1537.0, 645.0, 305.0, 166.0, 105.0, 67.0, 43.0, 44.0, 35.0, 13.0, 12.0, 14.0, 9.0, 9.0, 7.0, 3.0, 8.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6171875, -5.43310546875, -5.2490234375, -5.06494140625, -4.880859375, -4.69677734375, -4.5126953125, -4.32861328125, -4.14453125, -3.96044921875, -3.7763671875, -3.59228515625, -3.408203125, -3.22412109375, -3.0400390625, -2.85595703125, -2.671875, -2.48779296875, -2.3037109375, -2.11962890625, -1.935546875, -1.75146484375, -1.5673828125, -1.38330078125, -1.19921875, -1.01513671875, -0.8310546875, -0.64697265625, -0.462890625, -0.27880859375, -0.0947265625, 0.08935546875, 0.2734375, 0.45751953125, 0.6416015625, 0.82568359375, 1.009765625, 1.19384765625, 1.3779296875, 1.56201171875, 1.74609375, 1.93017578125, 2.1142578125, 2.29833984375, 2.482421875, 2.66650390625, 2.8505859375, 3.03466796875, 3.21875, 3.40283203125, 3.5869140625, 3.77099609375, 3.955078125, 4.13916015625, 4.3232421875, 4.50732421875, 4.69140625, 4.87548828125, 5.0595703125, 5.24365234375, 5.427734375, 5.61181640625, 5.7958984375, 5.97998046875, 6.1640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 16.0, 28.0, 48.0, 113.0, 242.0, 273.0, 126.0, 41.0, 26.0, 14.0, 10.0, 7.0, 4.0, 4.0, 2.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001537322998046875, -0.0014957785606384277, -0.0014542341232299805, -0.0014126896858215332, -0.001371145248413086, -0.0013296008110046387, -0.0012880563735961914, -0.0012465119361877441, -0.0012049674987792969, -0.0011634230613708496, -0.0011218786239624023, -0.001080334186553955, -0.0010387897491455078, -0.0009972453117370605, -0.0009557008743286133, -0.000914156436920166, -0.0008726119995117188, -0.0008310675621032715, -0.0007895231246948242, -0.000747978687286377, -0.0007064342498779297, -0.0006648898124694824, -0.0006233453750610352, -0.0005818009376525879, -0.0005402565002441406, -0.0004987120628356934, -0.0004571676254272461, -0.00041562318801879883, -0.00037407875061035156, -0.0003325343132019043, -0.00029098987579345703, -0.00024944543838500977, -0.0002079010009765625, -0.00016635656356811523, -0.00012481212615966797, -8.32676887512207e-05, -4.172325134277344e-05, -1.7881393432617188e-07, 4.1365623474121094e-05, 8.291006088256836e-05, 0.00012445449829101562, 0.0001659989356994629, 0.00020754337310791016, 0.0002490878105163574, 0.0002906322479248047, 0.00033217668533325195, 0.0003737211227416992, 0.0004152655601501465, 0.00045680999755859375, 0.000498354434967041, 0.0005398988723754883, 0.0005814433097839355, 0.0006229877471923828, 0.0006645321846008301, 0.0007060766220092773, 0.0007476210594177246, 0.0007891654968261719, 0.0008307099342346191, 0.0008722543716430664, 0.0009137988090515137, 0.0009553432464599609, 0.0009968876838684082, 0.0010384321212768555, 0.0010799765586853027, 0.00112152099609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 11.0, 8.0, 12.0, 21.0, 24.0, 37.0, 40.0, 84.0, 110.0, 154.0, 282.0, 584.0, 1372.0, 3978.0, 15555.0, 212289.0, 777803.0, 27010.0, 5671.0, 1882.0, 728.0, 335.0, 187.0, 122.0, 80.0, 56.0, 41.0, 29.0, 24.0, 3.0, 7.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.691680908203125, -3.56500244140625, -3.438323974609375, -3.3116455078125, -3.184967041015625, -3.05828857421875, -2.931610107421875, -2.804931640625, -2.678253173828125, -2.55157470703125, -2.424896240234375, -2.2982177734375, -2.171539306640625, -2.04486083984375, -1.918182373046875, -1.79150390625, -1.664825439453125, -1.53814697265625, -1.411468505859375, -1.2847900390625, -1.158111572265625, -1.03143310546875, -0.904754638671875, -0.778076171875, -0.651397705078125, -0.52471923828125, -0.398040771484375, -0.2713623046875, -0.144683837890625, -0.01800537109375, 0.108673095703125, 0.2353515625, 0.362030029296875, 0.48870849609375, 0.615386962890625, 0.7420654296875, 0.868743896484375, 0.99542236328125, 1.122100830078125, 1.248779296875, 1.375457763671875, 1.50213623046875, 1.628814697265625, 1.7554931640625, 1.882171630859375, 2.00885009765625, 2.135528564453125, 2.26220703125, 2.388885498046875, 2.51556396484375, 2.642242431640625, 2.7689208984375, 2.895599365234375, 3.02227783203125, 3.148956298828125, 3.275634765625, 3.402313232421875, 3.52899169921875, 3.655670166015625, 3.7823486328125, 3.909027099609375, 4.03570556640625, 4.162384033203125, 4.2890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 21.0, 17.0, 38.0, 37.0, 51.0, 86.0, 126.0, 143.0, 129.0, 88.0, 70.0, 45.0, 30.0, 27.0, 15.0, 9.0, 10.0, 5.0, 12.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.7421875, -4.62554931640625, -4.5089111328125, -4.39227294921875, -4.275634765625, -4.15899658203125, -4.0423583984375, -3.92572021484375, -3.80908203125, -3.69244384765625, -3.5758056640625, -3.45916748046875, -3.342529296875, -3.22589111328125, -3.1092529296875, -2.99261474609375, -2.8759765625, -2.75933837890625, -2.6427001953125, -2.52606201171875, -2.409423828125, -2.29278564453125, -2.1761474609375, -2.05950927734375, -1.94287109375, -1.82623291015625, -1.7095947265625, -1.59295654296875, -1.476318359375, -1.35968017578125, -1.2430419921875, -1.12640380859375, -1.009765625, -0.89312744140625, -0.7764892578125, -0.65985107421875, -0.543212890625, -0.42657470703125, -0.3099365234375, -0.19329833984375, -0.07666015625, 0.03997802734375, 0.1566162109375, 0.27325439453125, 0.389892578125, 0.50653076171875, 0.6231689453125, 0.73980712890625, 0.8564453125, 0.97308349609375, 1.0897216796875, 1.20635986328125, 1.322998046875, 1.43963623046875, 1.5562744140625, 1.67291259765625, 1.78955078125, 1.90618896484375, 2.0228271484375, 2.13946533203125, 2.256103515625, 2.37274169921875, 2.4893798828125, 2.60601806640625, 2.72265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 14.0, 32.0, 131.0, 550.0, 187.0, 56.0, 11.0, 12.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-253.48745727539062, -247.91746520996094, -242.34747314453125, -236.77748107910156, -231.20748901367188, -225.63751220703125, -220.06752014160156, -214.49752807617188, -208.9275360107422, -203.3575439453125, -197.7875518798828, -192.21755981445312, -186.6475830078125, -181.0775909423828, -175.50759887695312, -169.93760681152344, -164.36761474609375, -158.79762268066406, -153.22763061523438, -147.6576385498047, -142.087646484375, -136.51766967773438, -130.9476776123047, -125.377685546875, -119.80769348144531, -114.23770141601562, -108.66770935058594, -103.09772491455078, -97.5277328491211, -91.9577407836914, -86.38775634765625, -80.81776428222656, -75.24778747558594, -69.67779541015625, -64.10780334472656, -58.537818908691406, -52.96782684326172, -47.39783477783203, -41.82784652709961, -36.25785827636719, -30.6878662109375, -25.117876052856445, -19.54788589477539, -13.977895736694336, -8.407905578613281, -2.8379154205322266, 2.732074737548828, 8.30206298828125, 13.872055053710938, 19.442045211791992, 25.012035369873047, 30.5820255279541, 36.152015686035156, 41.722007751464844, 47.291996002197266, 52.86198425292969, 58.431976318359375, 64.00196838378906, 69.57196044921875, 75.1419448852539, 80.7119369506836, 86.28192901611328, 91.85191345214844, 97.42190551757812, 102.99189758300781]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 5.0, 8.0, 15.0, 8.0, 11.0, 15.0, 18.0, 22.0, 31.0, 36.0, 37.0, 47.0, 56.0, 95.0, 181.0, 98.0, 49.0, 48.0, 34.0, 27.0, 20.0, 15.0, 20.0, 23.0, 18.0, 10.0, 6.0, 8.0, 7.0, 2.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-90.15495300292969, -87.87124633789062, -85.5875473022461, -83.30384063720703, -81.0201416015625, -78.73643493652344, -76.45272827148438, -74.16902923583984, -71.88532257080078, -69.60161590576172, -67.31791687011719, -65.03421020507812, -62.75050735473633, -60.46680450439453, -58.183101654052734, -55.89939880371094, -53.61569595336914, -51.331993103027344, -49.04829025268555, -46.76458740234375, -44.48088073730469, -42.19717788696289, -39.913475036621094, -37.6297721862793, -35.3460693359375, -33.0623664855957, -30.778661727905273, -28.494958877563477, -26.211254119873047, -23.92755126953125, -21.643848419189453, -19.360145568847656, -17.076438903808594, -14.79273509979248, -12.509031295776367, -10.22532844543457, -7.941624641418457, -5.657920837402344, -3.374217987060547, -1.0905141830444336, 1.1931896209716797, 3.476893186569214, 5.760596752166748, 8.044300079345703, 10.328003883361816, 12.61170768737793, 14.895410537719727, 17.179115295410156, 19.462818145751953, 21.74652099609375, 24.03022575378418, 26.313928604125977, 28.597633361816406, 30.881336212158203, 33.1650390625, 35.4487419128418, 37.732444763183594, 40.01614761352539, 42.29985046386719, 44.58355712890625, 46.86725997924805, 49.150962829589844, 51.43466567993164, 53.71836853027344, 56.0020751953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 9.0, 22.0, 27.0, 52.0, 101.0, 252.0, 640.0, 1952.0, 10601.0, 290738.0, 3636886.0, 239648.0, 10336.0, 1997.0, 573.0, 226.0, 107.0, 44.0, 26.0, 10.0, 11.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.5697021484375, -9.022216796875, -8.4747314453125, -7.92724609375, -7.3797607421875, -6.832275390625, -6.2847900390625, -5.7373046875, -5.1898193359375, -4.642333984375, -4.0948486328125, -3.54736328125, -2.9998779296875, -2.452392578125, -1.9049072265625, -1.357421875, -0.8099365234375, -0.262451171875, 0.2850341796875, 0.83251953125, 1.3800048828125, 1.927490234375, 2.4749755859375, 3.0224609375, 3.5699462890625, 4.117431640625, 4.6649169921875, 5.21240234375, 5.7598876953125, 6.307373046875, 6.8548583984375, 7.40234375, 7.9498291015625, 8.497314453125, 9.0447998046875, 9.59228515625, 10.1397705078125, 10.687255859375, 11.2347412109375, 11.7822265625, 12.3297119140625, 12.877197265625, 13.4246826171875, 13.97216796875, 14.5196533203125, 15.067138671875, 15.6146240234375, 16.162109375, 16.7095947265625, 17.257080078125, 17.8045654296875, 18.35205078125, 18.8995361328125, 19.447021484375, 19.9945068359375, 20.5419921875, 21.0894775390625, 21.636962890625, 22.1844482421875, 22.73193359375, 23.2794189453125, 23.826904296875, 24.3743896484375, 24.921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 0.0, 3.0, 7.0, 9.0, 5.0, 11.0, 9.0, 23.0, 16.0, 17.0, 27.0, 27.0, 28.0, 44.0, 40.0, 39.0, 54.0, 36.0, 45.0, 57.0, 48.0, 43.0, 41.0, 55.0, 33.0, 44.0, 35.0, 36.0, 23.0, 22.0, 25.0, 20.0, 18.0, 11.0, 8.0, 9.0, 7.0, 4.0, 6.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.56640625, -4.4364013671875, -4.306396484375, -4.1763916015625, -4.04638671875, -3.9163818359375, -3.786376953125, -3.6563720703125, -3.5263671875, -3.3963623046875, -3.266357421875, -3.1363525390625, -3.00634765625, -2.8763427734375, -2.746337890625, -2.6163330078125, -2.486328125, -2.3563232421875, -2.226318359375, -2.0963134765625, -1.96630859375, -1.8363037109375, -1.706298828125, -1.5762939453125, -1.4462890625, -1.3162841796875, -1.186279296875, -1.0562744140625, -0.92626953125, -0.7962646484375, -0.666259765625, -0.5362548828125, -0.40625, -0.2762451171875, -0.146240234375, -0.0162353515625, 0.11376953125, 0.2437744140625, 0.373779296875, 0.5037841796875, 0.6337890625, 0.7637939453125, 0.893798828125, 1.0238037109375, 1.15380859375, 1.2838134765625, 1.413818359375, 1.5438232421875, 1.673828125, 1.8038330078125, 1.933837890625, 2.0638427734375, 2.19384765625, 2.3238525390625, 2.453857421875, 2.5838623046875, 2.7138671875, 2.8438720703125, 2.973876953125, 3.1038818359375, 3.23388671875, 3.3638916015625, 3.493896484375, 3.6239013671875, 3.75390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 12.0, 11.0, 25.0, 46.0, 86.0, 155.0, 290.0, 625.0, 1755.0, 8118.0, 363294.0, 3797494.0, 17859.0, 2802.0, 904.0, 388.0, 171.0, 97.0, 46.0, 44.0, 18.0, 9.0, 9.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.765625, -20.826416015625, -19.88720703125, -18.947998046875, -18.0087890625, -17.069580078125, -16.13037109375, -15.191162109375, -14.251953125, -13.312744140625, -12.37353515625, -11.434326171875, -10.4951171875, -9.555908203125, -8.61669921875, -7.677490234375, -6.73828125, -5.799072265625, -4.85986328125, -3.920654296875, -2.9814453125, -2.042236328125, -1.10302734375, -0.163818359375, 0.775390625, 1.714599609375, 2.65380859375, 3.593017578125, 4.5322265625, 5.471435546875, 6.41064453125, 7.349853515625, 8.2890625, 9.228271484375, 10.16748046875, 11.106689453125, 12.0458984375, 12.985107421875, 13.92431640625, 14.863525390625, 15.802734375, 16.741943359375, 17.68115234375, 18.620361328125, 19.5595703125, 20.498779296875, 21.43798828125, 22.377197265625, 23.31640625, 24.255615234375, 25.19482421875, 26.134033203125, 27.0732421875, 28.012451171875, 28.95166015625, 29.890869140625, 30.830078125, 31.769287109375, 32.70849609375, 33.647705078125, 34.5869140625, 35.526123046875, 36.46533203125, 37.404541015625, 38.34375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 12.0, 12.0, 18.0, 17.0, 27.0, 27.0, 56.0, 68.0, 107.0, 149.0, 221.0, 360.0, 474.0, 600.0, 593.0, 426.0, 271.0, 183.0, 124.0, 97.0, 60.0, 44.0, 34.0, 27.0, 19.0, 11.0, 7.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.15625, -12.7275390625, -12.298828125, -11.8701171875, -11.44140625, -11.0126953125, -10.583984375, -10.1552734375, -9.7265625, -9.2978515625, -8.869140625, -8.4404296875, -8.01171875, -7.5830078125, -7.154296875, -6.7255859375, -6.296875, -5.8681640625, -5.439453125, -5.0107421875, -4.58203125, -4.1533203125, -3.724609375, -3.2958984375, -2.8671875, -2.4384765625, -2.009765625, -1.5810546875, -1.15234375, -0.7236328125, -0.294921875, 0.1337890625, 0.5625, 0.9912109375, 1.419921875, 1.8486328125, 2.27734375, 2.7060546875, 3.134765625, 3.5634765625, 3.9921875, 4.4208984375, 4.849609375, 5.2783203125, 5.70703125, 6.1357421875, 6.564453125, 6.9931640625, 7.421875, 7.8505859375, 8.279296875, 8.7080078125, 9.13671875, 9.5654296875, 9.994140625, 10.4228515625, 10.8515625, 11.2802734375, 11.708984375, 12.1376953125, 12.56640625, 12.9951171875, 13.423828125, 13.8525390625, 14.28125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 1.0, 11.0, 27.0, 42.0, 89.0, 209.0, 297.0, 189.0, 68.0, 26.0, 12.0, 3.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.8411865234375, -165.30868530273438, -158.7761688232422, -152.24366760253906, -145.71116638183594, -139.17864990234375, -132.64614868164062, -126.1136474609375, -119.58113861083984, -113.04862976074219, -106.51612854003906, -99.9836196899414, -93.45111083984375, -86.91860961914062, -80.38610076904297, -73.85359191894531, -67.32109069824219, -60.7885856628418, -54.256080627441406, -47.72357177734375, -41.19106674194336, -34.65856170654297, -28.126052856445312, -21.593547821044922, -15.061042785644531, -8.528536796569824, -1.9960308074951172, 4.536476135253906, 11.068981170654297, 17.601486206054688, 24.133995056152344, 30.666500091552734, 37.199005126953125, 43.731510162353516, 50.264015197753906, 56.79652404785156, 63.32902908325195, 69.86153411865234, 76.39404296875, 82.92654418945312, 89.45905303955078, 95.99156188964844, 102.52406311035156, 109.05657196044922, 115.58908081054688, 122.12158203125, 128.65408325195312, 135.1865997314453, 141.71910095214844, 148.25160217285156, 154.78411865234375, 161.31661987304688, 167.84912109375, 174.38162231445312, 180.9141387939453, 187.44664001464844, 193.97915649414062, 200.51165771484375, 207.04417419433594, 213.57667541503906, 220.1091766357422, 226.64169311523438, 233.1741943359375, 239.70669555664062, 246.23919677734375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 12.0, 11.0, 14.0, 21.0, 26.0, 24.0, 33.0, 45.0, 31.0, 39.0, 42.0, 51.0, 61.0, 73.0, 60.0, 66.0, 60.0, 48.0, 43.0, 36.0, 34.0, 37.0, 18.0, 22.0, 22.0, 16.0, 17.0, 9.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.58037567138672, -88.0301284790039, -85.47987365722656, -82.92962646484375, -80.37937927246094, -77.8291244506836, -75.27887725830078, -72.72862243652344, -70.17837524414062, -67.62812805175781, -65.07787322998047, -62.527626037597656, -59.97737503051758, -57.4271240234375, -54.87687683105469, -52.32662582397461, -49.77637481689453, -47.22612380981445, -44.675872802734375, -42.12562561035156, -39.575374603271484, -37.025123596191406, -34.474876403808594, -31.924625396728516, -29.374374389648438, -26.82412338256836, -24.273874282836914, -21.72362518310547, -19.17337417602539, -16.623123168945312, -14.072874069213867, -11.522624969482422, -8.972381591796875, -6.422131538391113, -3.8718814849853516, -1.3216314315795898, 1.2286186218261719, 3.7788686752319336, 6.329118728637695, 8.87936782836914, 11.429618835449219, 13.97986888885498, 16.530118942260742, 19.080368041992188, 21.630619049072266, 24.180870056152344, 26.73111915588379, 29.281368255615234, 31.831619262695312, 34.38187026977539, 36.93212127685547, 39.48236846923828, 42.03261947631836, 44.58287048339844, 47.13311767578125, 49.68336868286133, 52.233619689941406, 54.783870697021484, 57.33412170410156, 59.884368896484375, 62.43461990356445, 64.98487091064453, 67.53511810302734, 70.08537292480469, 72.6356201171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 9.0, 9.0, 9.0, 18.0, 27.0, 34.0, 52.0, 90.0, 119.0, 172.0, 287.0, 486.0, 887.0, 1620.0, 3289.0, 7025.0, 17477.0, 52082.0, 234092.0, 562176.0, 114951.0, 31506.0, 11708.0, 5039.0, 2346.0, 1253.0, 668.0, 410.0, 248.0, 166.0, 85.0, 54.0, 41.0, 32.0, 18.0, 13.0, 10.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.734375, -7.5087890625, -7.283203125, -7.0576171875, -6.83203125, -6.6064453125, -6.380859375, -6.1552734375, -5.9296875, -5.7041015625, -5.478515625, -5.2529296875, -5.02734375, -4.8017578125, -4.576171875, -4.3505859375, -4.125, -3.8994140625, -3.673828125, -3.4482421875, -3.22265625, -2.9970703125, -2.771484375, -2.5458984375, -2.3203125, -2.0947265625, -1.869140625, -1.6435546875, -1.41796875, -1.1923828125, -0.966796875, -0.7412109375, -0.515625, -0.2900390625, -0.064453125, 0.1611328125, 0.38671875, 0.6123046875, 0.837890625, 1.0634765625, 1.2890625, 1.5146484375, 1.740234375, 1.9658203125, 2.19140625, 2.4169921875, 2.642578125, 2.8681640625, 3.09375, 3.3193359375, 3.544921875, 3.7705078125, 3.99609375, 4.2216796875, 4.447265625, 4.6728515625, 4.8984375, 5.1240234375, 5.349609375, 5.5751953125, 5.80078125, 6.0263671875, 6.251953125, 6.4775390625, 6.703125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 3.0, 7.0, 10.0, 5.0, 11.0, 13.0, 12.0, 28.0, 20.0, 13.0, 25.0, 34.0, 36.0, 27.0, 35.0, 30.0, 41.0, 48.0, 48.0, 52.0, 40.0, 46.0, 46.0, 39.0, 43.0, 43.0, 29.0, 27.0, 26.0, 21.0, 28.0, 28.0, 10.0, 11.0, 12.0, 6.0, 8.0, 4.0, 4.0, 8.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.6796875, -4.543701171875, -4.40771484375, -4.271728515625, -4.1357421875, -3.999755859375, -3.86376953125, -3.727783203125, -3.591796875, -3.455810546875, -3.31982421875, -3.183837890625, -3.0478515625, -2.911865234375, -2.77587890625, -2.639892578125, -2.50390625, -2.367919921875, -2.23193359375, -2.095947265625, -1.9599609375, -1.823974609375, -1.68798828125, -1.552001953125, -1.416015625, -1.280029296875, -1.14404296875, -1.008056640625, -0.8720703125, -0.736083984375, -0.60009765625, -0.464111328125, -0.328125, -0.192138671875, -0.05615234375, 0.079833984375, 0.2158203125, 0.351806640625, 0.48779296875, 0.623779296875, 0.759765625, 0.895751953125, 1.03173828125, 1.167724609375, 1.3037109375, 1.439697265625, 1.57568359375, 1.711669921875, 1.84765625, 1.983642578125, 2.11962890625, 2.255615234375, 2.3916015625, 2.527587890625, 2.66357421875, 2.799560546875, 2.935546875, 3.071533203125, 3.20751953125, 3.343505859375, 3.4794921875, 3.615478515625, 3.75146484375, 3.887451171875, 4.0234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 5.0, 11.0, 18.0, 17.0, 33.0, 53.0, 52.0, 76.0, 96.0, 127.0, 224.0, 362.0, 625.0, 1361.0, 4221.0, 20947.0, 549607.0, 444054.0, 19743.0, 3852.0, 1372.0, 645.0, 353.0, 197.0, 144.0, 88.0, 72.0, 45.0, 41.0, 25.0, 26.0, 13.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5546875, -9.246337890625, -8.93798828125, -8.629638671875, -8.3212890625, -8.012939453125, -7.70458984375, -7.396240234375, -7.087890625, -6.779541015625, -6.47119140625, -6.162841796875, -5.8544921875, -5.546142578125, -5.23779296875, -4.929443359375, -4.62109375, -4.312744140625, -4.00439453125, -3.696044921875, -3.3876953125, -3.079345703125, -2.77099609375, -2.462646484375, -2.154296875, -1.845947265625, -1.53759765625, -1.229248046875, -0.9208984375, -0.612548828125, -0.30419921875, 0.004150390625, 0.3125, 0.620849609375, 0.92919921875, 1.237548828125, 1.5458984375, 1.854248046875, 2.16259765625, 2.470947265625, 2.779296875, 3.087646484375, 3.39599609375, 3.704345703125, 4.0126953125, 4.321044921875, 4.62939453125, 4.937744140625, 5.24609375, 5.554443359375, 5.86279296875, 6.171142578125, 6.4794921875, 6.787841796875, 7.09619140625, 7.404541015625, 7.712890625, 8.021240234375, 8.32958984375, 8.637939453125, 8.9462890625, 9.254638671875, 9.56298828125, 9.871337890625, 10.1796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 6.0, 7.0, 10.0, 10.0, 18.0, 19.0, 26.0, 23.0, 23.0, 26.0, 52.0, 54.0, 54.0, 85.0, 90.0, 99.0, 79.0, 43.0, 58.0, 47.0, 45.0, 28.0, 19.0, 14.0, 15.0, 6.0, 10.0, 7.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.870361328125, -20.19384765625, -19.517333984375, -18.8408203125, -18.164306640625, -17.48779296875, -16.811279296875, -16.134765625, -15.458251953125, -14.78173828125, -14.105224609375, -13.4287109375, -12.752197265625, -12.07568359375, -11.399169921875, -10.72265625, -10.046142578125, -9.36962890625, -8.693115234375, -8.0166015625, -7.340087890625, -6.66357421875, -5.987060546875, -5.310546875, -4.634033203125, -3.95751953125, -3.281005859375, -2.6044921875, -1.927978515625, -1.25146484375, -0.574951171875, 0.1015625, 0.778076171875, 1.45458984375, 2.131103515625, 2.8076171875, 3.484130859375, 4.16064453125, 4.837158203125, 5.513671875, 6.190185546875, 6.86669921875, 7.543212890625, 8.2197265625, 8.896240234375, 9.57275390625, 10.249267578125, 10.92578125, 11.602294921875, 12.27880859375, 12.955322265625, 13.6318359375, 14.308349609375, 14.98486328125, 15.661376953125, 16.337890625, 17.014404296875, 17.69091796875, 18.367431640625, 19.0439453125, 19.720458984375, 20.39697265625, 21.073486328125, 21.75]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 9.0, 9.0, 9.0, 9.0, 17.0, 21.0, 30.0, 39.0, 66.0, 117.0, 170.0, 282.0, 620.0, 1581.0, 4933.0, 25544.0, 876339.0, 121413.0, 12117.0, 3020.0, 1091.0, 458.0, 229.0, 115.0, 82.0, 46.0, 46.0, 26.0, 15.0, 17.0, 17.0, 24.0, 7.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.37109375, -2.3066558837890625, -2.242218017578125, -2.1777801513671875, -2.11334228515625, -2.0489044189453125, -1.984466552734375, -1.9200286865234375, -1.8555908203125, -1.7911529541015625, -1.726715087890625, -1.6622772216796875, -1.59783935546875, -1.5334014892578125, -1.468963623046875, -1.4045257568359375, -1.340087890625, -1.2756500244140625, -1.211212158203125, -1.1467742919921875, -1.08233642578125, -1.0178985595703125, -0.953460693359375, -0.8890228271484375, -0.8245849609375, -0.7601470947265625, -0.695709228515625, -0.6312713623046875, -0.56683349609375, -0.5023956298828125, -0.437957763671875, -0.3735198974609375, -0.30908203125, -0.2446441650390625, -0.180206298828125, -0.1157684326171875, -0.05133056640625, 0.0131072998046875, 0.077545166015625, 0.1419830322265625, 0.2064208984375, 0.2708587646484375, 0.335296630859375, 0.3997344970703125, 0.46417236328125, 0.5286102294921875, 0.593048095703125, 0.6574859619140625, 0.721923828125, 0.7863616943359375, 0.850799560546875, 0.9152374267578125, 0.97967529296875, 1.0441131591796875, 1.108551025390625, 1.1729888916015625, 1.2374267578125, 1.3018646240234375, 1.366302490234375, 1.4307403564453125, 1.49517822265625, 1.5596160888671875, 1.624053955078125, 1.6884918212890625, 1.7529296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 3.0, 5.0, 11.0, 7.0, 15.0, 9.0, 13.0, 28.0, 34.0, 63.0, 74.0, 122.0, 141.0, 140.0, 107.0, 70.0, 34.0, 31.0, 20.0, 20.0, 12.0, 9.0, 8.0, 8.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004165172576904297, -0.0004042200744152069, -0.00039192289113998413, -0.00037962570786476135, -0.0003673285245895386, -0.0003550313413143158, -0.000342734158039093, -0.00033043697476387024, -0.00031813979148864746, -0.0003058426082134247, -0.0002935454249382019, -0.0002812482416629791, -0.00026895105838775635, -0.00025665387511253357, -0.0002443566918373108, -0.000232059508562088, -0.00021976232528686523, -0.00020746514201164246, -0.00019516795873641968, -0.0001828707754611969, -0.00017057359218597412, -0.00015827640891075134, -0.00014597922563552856, -0.00013368204236030579, -0.00012138485908508301, -0.00010908767580986023, -9.679049253463745e-05, -8.449330925941467e-05, -7.21961259841919e-05, -5.9898942708969116e-05, -4.760175943374634e-05, -3.530457615852356e-05, -2.300739288330078e-05, -1.0710209608078003e-05, 1.5869736671447754e-06, 1.3884156942367554e-05, 2.6181340217590332e-05, 3.847852349281311e-05, 5.077570676803589e-05, 6.307289004325867e-05, 7.537007331848145e-05, 8.766725659370422e-05, 9.9964439868927e-05, 0.00011226162314414978, 0.00012455880641937256, 0.00013685598969459534, 0.00014915317296981812, 0.0001614503562450409, 0.00017374753952026367, 0.00018604472279548645, 0.00019834190607070923, 0.000210639089345932, 0.00022293627262115479, 0.00023523345589637756, 0.00024753063917160034, 0.0002598278224468231, 0.0002721250057220459, 0.0002844221889972687, 0.00029671937227249146, 0.00030901655554771423, 0.000321313738822937, 0.0003336109220981598, 0.00034590810537338257, 0.00035820528864860535, 0.0003705024719238281]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 9.0, 6.0, 11.0, 25.0, 23.0, 35.0, 67.0, 88.0, 186.0, 305.0, 591.0, 1262.0, 3050.0, 9690.0, 49680.0, 859488.0, 101108.0, 15364.0, 4207.0, 1688.0, 729.0, 385.0, 186.0, 123.0, 92.0, 47.0, 36.0, 22.0, 14.0, 10.0, 8.0, 5.0, 5.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.41278076171875, -1.3616943359375, -1.31060791015625, -1.259521484375, -1.20843505859375, -1.1573486328125, -1.10626220703125, -1.05517578125, -1.00408935546875, -0.9530029296875, -0.90191650390625, -0.850830078125, -0.79974365234375, -0.7486572265625, -0.69757080078125, -0.646484375, -0.59539794921875, -0.5443115234375, -0.49322509765625, -0.442138671875, -0.39105224609375, -0.3399658203125, -0.28887939453125, -0.23779296875, -0.18670654296875, -0.1356201171875, -0.08453369140625, -0.033447265625, 0.01763916015625, 0.0687255859375, 0.11981201171875, 0.1708984375, 0.22198486328125, 0.2730712890625, 0.32415771484375, 0.375244140625, 0.42633056640625, 0.4774169921875, 0.52850341796875, 0.57958984375, 0.63067626953125, 0.6817626953125, 0.73284912109375, 0.783935546875, 0.83502197265625, 0.8861083984375, 0.93719482421875, 0.98828125, 1.03936767578125, 1.0904541015625, 1.14154052734375, 1.192626953125, 1.24371337890625, 1.2947998046875, 1.34588623046875, 1.39697265625, 1.44805908203125, 1.4991455078125, 1.55023193359375, 1.601318359375, 1.65240478515625, 1.7034912109375, 1.75457763671875, 1.8056640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 13.0, 7.0, 22.0, 15.0, 43.0, 91.0, 210.0, 259.0, 154.0, 92.0, 26.0, 17.0, 15.0, 9.0, 12.0, 7.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.779449462890625, -3.65069580078125, -3.521942138671875, -3.3931884765625, -3.264434814453125, -3.13568115234375, -3.006927490234375, -2.878173828125, -2.749420166015625, -2.62066650390625, -2.491912841796875, -2.3631591796875, -2.234405517578125, -2.10565185546875, -1.976898193359375, -1.84814453125, -1.719390869140625, -1.59063720703125, -1.461883544921875, -1.3331298828125, -1.204376220703125, -1.07562255859375, -0.946868896484375, -0.818115234375, -0.689361572265625, -0.56060791015625, -0.431854248046875, -0.3031005859375, -0.174346923828125, -0.04559326171875, 0.083160400390625, 0.2119140625, 0.340667724609375, 0.46942138671875, 0.598175048828125, 0.7269287109375, 0.855682373046875, 0.98443603515625, 1.113189697265625, 1.241943359375, 1.370697021484375, 1.49945068359375, 1.628204345703125, 1.7569580078125, 1.885711669921875, 2.01446533203125, 2.143218994140625, 2.27197265625, 2.400726318359375, 2.52947998046875, 2.658233642578125, 2.7869873046875, 2.915740966796875, 3.04449462890625, 3.173248291015625, 3.302001953125, 3.430755615234375, 3.55950927734375, 3.688262939453125, 3.8170166015625, 3.945770263671875, 4.07452392578125, 4.203277587890625, 4.33203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 10.0, 15.0, 41.0, 68.0, 490.0, 210.0, 75.0, 42.0, 15.0, 10.0, 5.0, 6.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.13438415527344, -81.0976333618164, -78.06088256835938, -75.02412414550781, -71.98737335205078, -68.95062255859375, -65.91387176513672, -62.87711715698242, -59.840362548828125, -56.803611755371094, -53.7668571472168, -50.730106353759766, -47.69335174560547, -44.65660095214844, -41.619850158691406, -38.58309555053711, -35.54634475708008, -32.50959396362305, -29.47283935546875, -26.43608856201172, -23.399333953857422, -20.36258316040039, -17.325830459594727, -14.289077758789062, -11.252325057983398, -8.215572357177734, -5.1788201332092285, -2.1420679092407227, 0.8946847915649414, 3.9314374923706055, 6.968189239501953, 10.004941940307617, 13.041694641113281, 16.078447341918945, 19.11520004272461, 22.15195083618164, 25.188705444335938, 28.22545623779297, 31.262208938598633, 34.2989616394043, 37.335716247558594, 40.372467041015625, 43.40922164916992, 46.44597244262695, 49.48272705078125, 52.51947784423828, 55.55622863769531, 58.59298324584961, 61.62973403930664, 64.66648864746094, 67.70323944091797, 70.739990234375, 73.77674102783203, 76.8134994506836, 79.85025024414062, 82.88700103759766, 85.92375183105469, 88.96050262451172, 91.99725341796875, 95.03401184082031, 98.07076263427734, 101.10751342773438, 104.1442642211914, 107.18101501464844, 110.2177734375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 4.0, 9.0, 8.0, 7.0, 4.0, 10.0, 11.0, 16.0, 8.0, 22.0, 24.0, 23.0, 24.0, 24.0, 24.0, 84.0, 128.0, 153.0, 146.0, 60.0, 28.0, 21.0, 22.0, 19.0, 18.0, 15.0, 13.0, 5.0, 8.0, 10.0, 4.0, 8.0, 9.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.177345275878906, -53.66476821899414, -52.152191162109375, -50.63961410522461, -49.127037048339844, -47.61445999145508, -46.10188293457031, -44.58930969238281, -43.07672882080078, -41.564151763916016, -40.05157470703125, -38.538997650146484, -37.02642059326172, -35.51384353637695, -34.00126647949219, -32.48869323730469, -30.976116180419922, -29.463539123535156, -27.95096206665039, -26.438385009765625, -24.92580795288086, -23.413230895996094, -21.90065574645996, -20.388078689575195, -18.87550163269043, -17.362924575805664, -15.850347518920898, -14.33777141571045, -12.825194358825684, -11.312617301940918, -9.800041198730469, -8.287464141845703, -6.7748870849609375, -5.262310028076172, -3.7497334480285645, -2.237156867980957, -0.7245798110961914, 0.7879972457885742, 2.3005733489990234, 3.813150405883789, 5.325727462768555, 6.83830451965332, 8.350881576538086, 9.863457679748535, 11.3760347366333, 12.888611793518066, 14.401187896728516, 15.913764953613281, 17.426342010498047, 18.938919067382812, 20.451496124267578, 21.964073181152344, 23.47665023803711, 24.989227294921875, 26.501802444458008, 28.014379501342773, 29.52695655822754, 31.039533615112305, 32.55210876464844, 34.0646858215332, 35.57726287841797, 37.089839935302734, 38.6024169921875, 40.114994049072266, 41.62757110595703]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 16.0, 13.0, 19.0, 31.0, 31.0, 31.0, 36.0, 53.0, 135.0, 294.0, 69.0, 51.0, 34.0, 34.0, 33.0, 22.0, 31.0, 15.0, 7.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.7686767578125, -5.564697265625, -5.3607177734375, -5.15673828125, -4.9527587890625, -4.748779296875, -4.5447998046875, -4.3408203125, -4.1368408203125, -3.932861328125, -3.7288818359375, -3.52490234375, -3.3209228515625, -3.116943359375, -2.9129638671875, -2.708984375, -2.5050048828125, -2.301025390625, -2.0970458984375, -1.89306640625, -1.6890869140625, -1.485107421875, -1.2811279296875, -1.0771484375, -0.8731689453125, -0.669189453125, -0.4652099609375, -0.26123046875, -0.0572509765625, 0.146728515625, 0.3507080078125, 0.5546875, 0.7586669921875, 0.962646484375, 1.1666259765625, 1.37060546875, 1.5745849609375, 1.778564453125, 1.9825439453125, 2.1865234375, 2.3905029296875, 2.594482421875, 2.7984619140625, 3.00244140625, 3.2064208984375, 3.410400390625, 3.6143798828125, 3.818359375, 4.0223388671875, 4.226318359375, 4.4302978515625, 4.63427734375, 4.8382568359375, 5.042236328125, 5.2462158203125, 5.4501953125, 5.6541748046875, 5.858154296875, 6.0621337890625, 6.26611328125, 6.4700927734375, 6.674072265625, 6.8780517578125, 7.08203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 5.0, 5.0, 7.0, 12.0, 25.0, 22.0, 28.0, 32.0, 57.0, 145.0, 279.0, 687.0, 2706.0, 23437.0, 8349392.0, 9078.0, 1635.0, 463.0, 225.0, 100.0, 56.0, 43.0, 30.0, 24.0, 20.0, 16.0, 7.0, 4.0, 0.0, 2.0, 1.0, 7.0, 6.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-59.76436996459961, -57.79380416870117, -55.8232421875, -53.85267639160156, -51.882110595703125, -49.91154479980469, -47.940982818603516, -45.97041702270508, -43.999855041503906, -42.02928924560547, -40.0587272644043, -38.08816146850586, -36.11759567260742, -34.14703369140625, -32.17646789550781, -30.205902099609375, -28.235336303710938, -26.264772415161133, -24.294206619262695, -22.32364273071289, -20.353076934814453, -18.38251304626465, -16.411949157714844, -14.441384315490723, -12.470819473266602, -10.50025463104248, -8.52968978881836, -6.559125900268555, -4.588561058044434, -2.6179962158203125, -0.6474323272705078, 1.3231325149536133, 3.293701171875, 5.264266014099121, 7.234830379486084, 9.205394744873047, 11.175959587097168, 13.146524429321289, 15.117088317871094, 17.08765411376953, 19.058218002319336, 21.02878189086914, 22.999347686767578, 24.969911575317383, 26.940475463867188, 28.911041259765625, 30.88160514831543, 32.852169036865234, 34.82273483276367, 36.79330062866211, 38.76386260986328, 40.73442840576172, 42.704994201660156, 44.675559997558594, 46.646121978759766, 48.6166877746582, 50.587249755859375, 52.55781555175781, 54.528377532958984, 56.49894332885742, 58.46950912475586, 60.44007110595703, 62.41063690185547, 64.3812026977539, 66.35176849365234]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 1.0, 6.0, 4.0, 8.0, 3.0, 7.0, 2.0, 3.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-79.71174621582031, -75.95531463623047, -72.19888305664062, -68.44245910644531, -64.68602752685547, -60.929595947265625, -57.17316818237305, -53.41674041748047, -49.660308837890625, -45.90387725830078, -42.1474494934082, -38.391021728515625, -34.63459014892578, -30.87816047668457, -27.12173080444336, -23.36530113220215, -19.608871459960938, -15.852441787719727, -12.096012115478516, -8.339582443237305, -4.583152770996094, -0.8267230987548828, 2.929706573486328, 6.686136245727539, 10.44256591796875, 14.198995590209961, 17.955425262451172, 21.711854934692383, 25.468284606933594, 29.224714279174805, 32.981143951416016, 36.737571716308594, 40.49400329589844, 44.25043487548828, 48.00686264038086, 51.76329040527344, 55.51972198486328, 59.276153564453125, 63.0325813293457, 66.78900909423828, 70.54544067382812, 74.30187225341797, 78.05830383300781, 81.81472778320312, 85.57115936279297, 89.32759094238281, 93.08401489257812, 96.84044647216797, 100.59687805175781, 104.35330963134766, 108.1097412109375, 111.86616516113281, 115.62259674072266, 119.3790283203125, 123.13545227050781, 126.89188385009766, 130.6483154296875, 134.4047393798828, 138.1611785888672, 141.9176025390625, 145.67404174804688, 149.4304656982422, 153.1868896484375, 156.94332885742188, 160.6997528076172]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 4.0, 14.0, 23.0, 18.0, 29.0, 32.0, 51.0, 70.0, 100.0, 174.0, 253.0, 524.0, 1097.0, 2521.0, 6317.0, 17124.0, 46398.0, 126789.0, 187832.0, 85072.0, 30599.0, 11294.0, 4369.0, 1688.0, 781.0, 392.0, 244.0, 130.0, 98.0, 69.0, 47.0, 25.0, 25.0, 11.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.171875, -27.058349609375, -25.94482421875, -24.831298828125, -23.7177734375, -22.604248046875, -21.49072265625, -20.377197265625, -19.263671875, -18.150146484375, -17.03662109375, -15.923095703125, -14.8095703125, -13.696044921875, -12.58251953125, -11.468994140625, -10.35546875, -9.241943359375, -8.12841796875, -7.014892578125, -5.9013671875, -4.787841796875, -3.67431640625, -2.560791015625, -1.447265625, -0.333740234375, 0.77978515625, 1.893310546875, 3.0068359375, 4.120361328125, 5.23388671875, 6.347412109375, 7.4609375, 8.574462890625, 9.68798828125, 10.801513671875, 11.9150390625, 13.028564453125, 14.14208984375, 15.255615234375, 16.369140625, 17.482666015625, 18.59619140625, 19.709716796875, 20.8232421875, 21.936767578125, 23.05029296875, 24.163818359375, 25.27734375, 26.390869140625, 27.50439453125, 28.617919921875, 29.7314453125, 30.844970703125, 31.95849609375, 33.072021484375, 34.185546875, 35.299072265625, 36.41259765625, 37.526123046875, 38.6396484375, 39.753173828125, 40.86669921875, 41.980224609375, 43.09375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 4.0, 7.0, 9.0, 10.0, 15.0, 9.0, 11.0, 12.0, 19.0, 26.0, 34.0, 45.0, 42.0, 49.0, 53.0, 59.0, 46.0, 51.0, 58.0, 63.0, 44.0, 42.0, 46.0, 39.0, 40.0, 37.0, 26.0, 19.0, 10.0, 18.0, 10.0, 7.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.3709716796875, -4.218505859375, -4.0660400390625, -3.91357421875, -3.7611083984375, -3.608642578125, -3.4561767578125, -3.3037109375, -3.1512451171875, -2.998779296875, -2.8463134765625, -2.69384765625, -2.5413818359375, -2.388916015625, -2.2364501953125, -2.083984375, -1.9315185546875, -1.779052734375, -1.6265869140625, -1.47412109375, -1.3216552734375, -1.169189453125, -1.0167236328125, -0.8642578125, -0.7117919921875, -0.559326171875, -0.4068603515625, -0.25439453125, -0.1019287109375, 0.050537109375, 0.2030029296875, 0.35546875, 0.5079345703125, 0.660400390625, 0.8128662109375, 0.96533203125, 1.1177978515625, 1.270263671875, 1.4227294921875, 1.5751953125, 1.7276611328125, 1.880126953125, 2.0325927734375, 2.18505859375, 2.3375244140625, 2.489990234375, 2.6424560546875, 2.794921875, 2.9473876953125, 3.099853515625, 3.2523193359375, 3.40478515625, 3.5572509765625, 3.709716796875, 3.8621826171875, 4.0146484375, 4.1671142578125, 4.319580078125, 4.4720458984375, 4.62451171875, 4.7769775390625, 4.929443359375, 5.0819091796875, 5.234375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 7.0, 18.0, 27.0, 40.0, 77.0, 65.0, 83.0, 57.0, 33.0, 16.0, 15.0, 9.0, 8.0, 9.0, 11.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.49615478515625, -42.117000579833984, -40.73784637451172, -39.35869216918945, -37.97953796386719, -36.60038375854492, -35.221229553222656, -33.842071533203125, -32.462921142578125, -31.08376693725586, -29.704612731933594, -28.325458526611328, -26.946304321289062, -25.567150115966797, -24.1879940032959, -22.808839797973633, -21.429683685302734, -20.05052947998047, -18.671375274658203, -17.292221069335938, -15.913065910339355, -14.53391170501709, -13.154756546020508, -11.775602340698242, -10.396448135375977, -9.017293930053711, -7.638139247894287, -6.258984565734863, -4.879830360412598, -3.500676155090332, -2.12152099609375, -0.7423667907714844, 0.6367874145507812, 2.015941858291626, 3.3950963020324707, 4.7742509841918945, 6.15340518951416, 7.532559394836426, 8.911714553833008, 10.290868759155273, 11.670022964477539, 13.049177169799805, 14.42833137512207, 15.807486534118652, 17.186641693115234, 18.5657958984375, 19.944950103759766, 21.32410430908203, 22.703258514404297, 24.082412719726562, 25.461566925048828, 26.840721130371094, 28.21987533569336, 29.599029541015625, 30.978185653686523, 32.357337951660156, 33.73649597167969, 35.11565017700195, 36.49480438232422, 37.873958587646484, 39.25311279296875, 40.632266998291016, 42.01142120361328, 43.39057922363281, 44.76972961425781]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 6.0, 10.0, 12.0, 40.0, 57.0, 61.0, 63.0, 59.0, 47.0, 18.0, 23.0, 15.0, 10.0, 6.0, 5.0, 6.0, 2.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.523101806640625, -16.629711151123047, -15.736321449279785, -14.842931747436523, -13.949541091918945, -13.056151390075684, -12.162761688232422, -11.269371032714844, -10.375980377197266, -9.482590675354004, -8.589200019836426, -7.695810317993164, -6.802419662475586, -5.909029960632324, -5.015639781951904, -4.122249603271484, -3.2288599014282227, -2.3354697227478027, -1.4420796632766724, -0.548689603805542, 0.34470057487487793, 1.2380905151367188, 2.1314806938171387, 3.0248708724975586, 3.9182610511779785, 4.811651229858398, 5.705041408538818, 6.598431587219238, 7.4918212890625, 8.385211944580078, 9.27860164642334, 10.171991348266602, 11.06538200378418, 11.958771705627441, 12.85216236114502, 13.745552062988281, 14.63894271850586, 15.532332420349121, 16.425722122192383, 17.31911277770996, 18.21250343322754, 19.105894088745117, 19.999282836914062, 20.89267349243164, 21.78606414794922, 22.679454803466797, 23.572843551635742, 24.46623420715332, 25.359622955322266, 26.253013610839844, 27.14640235900879, 28.039793014526367, 28.933183670043945, 29.82657241821289, 30.71996307373047, 31.613353729248047, 32.506744384765625, 33.4001350402832, 34.29352569580078, 35.18691635131836, 36.08030319213867, 36.97369384765625, 37.86708450317383, 38.760475158691406, 39.653865814208984]}, "eval/loss": 3.785594940185547, "eval/wer": 0.6683334325455881, "eval/runtime": 893.3132, "eval/samples_per_second": 2.958, "eval/steps_per_second": 0.371} \ No newline at end of file +{"train/loss": 1.7532, "train/learning_rate": 2.109619952494062e-05, "train/epoch": 6.73, "train/global_step": 6000, "_runtime": 38937, "_timestamp": 1646700176, "_step": 6003, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 27.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 29384.0, 1023.0, 35.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-283.75, -277.6923828125, -271.634765625, -265.5771484375, -259.51953125, -253.4619140625, -247.404296875, -241.3466796875, -235.2890625, -229.2314453125, -223.173828125, -217.1162109375, -211.05859375, -205.0009765625, -198.943359375, -192.8857421875, -186.828125, -180.7705078125, -174.712890625, -168.6552734375, -162.59765625, -156.5400390625, -150.482421875, -144.4248046875, -138.3671875, -132.3095703125, -126.251953125, -120.1943359375, -114.13671875, -108.0791015625, -102.021484375, -95.9638671875, -89.90625, -83.8486328125, -77.791015625, -71.7333984375, -65.67578125, -59.6181640625, -53.560546875, -47.5029296875, -41.4453125, -35.3876953125, -29.330078125, -23.2724609375, -17.21484375, -11.1572265625, -5.099609375, 0.9580078125, 7.015625, 13.0732421875, 19.130859375, 25.1884765625, 31.24609375, 37.3037109375, 43.361328125, 49.4189453125, 55.4765625, 61.5341796875, 67.591796875, 73.6494140625, 79.70703125, 85.7646484375, 91.822265625, 97.8798828125, 103.9375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 4.0, 5.0, 10.0, 7.0, 15.0, 15.0, 14.0, 20.0, 14.0, 22.0, 27.0, 28.0, 30.0, 38.0, 37.0, 57.0, 39.0, 56.0, 56.0, 43.0, 44.0, 57.0, 42.0, 36.0, 33.0, 41.0, 34.0, 33.0, 32.0, 22.0, 18.0, 16.0, 20.0, 9.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 4.0], "bins": [-99.3861312866211, -97.02130889892578, -94.65648651123047, -92.29166412353516, -89.92684173583984, -87.56201171875, -85.19718933105469, -82.83236694335938, -80.46754455566406, -78.10272216796875, -75.73789978027344, -73.37307739257812, -71.00825500488281, -68.6434326171875, -66.27861022949219, -63.913780212402344, -61.5489616394043, -59.184139251708984, -56.81931686401367, -54.454490661621094, -52.08966827392578, -49.72484588623047, -47.360023498535156, -44.995201110839844, -42.63037872314453, -40.26555633544922, -37.900733947753906, -35.535911560058594, -33.171085357666016, -30.806262969970703, -28.44144058227539, -26.076616287231445, -23.7117919921875, -21.346969604492188, -18.982145309448242, -16.61732292175293, -14.2524995803833, -11.887676239013672, -9.52285385131836, -7.158029556274414, -4.793207168579102, -2.4283840656280518, -0.06356096267700195, 2.3012619018554688, 4.666085243225098, 7.030908584594727, 9.395730972290039, 11.760555267333984, 14.125377655029297, 16.49020004272461, 18.855024337768555, 21.219846725463867, 23.584671020507812, 25.949493408203125, 28.314315795898438, 30.679140090942383, 33.04396057128906, 35.408782958984375, 37.77360534667969, 40.138427734375, 42.50325393676758, 44.86807632446289, 47.2328987121582, 49.59772491455078, 51.962547302246094]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 13.0, 15.0, 6.0, 11.0, 19.0, 28.0, 22.0, 26.0, 29.0, 26.0, 38.0, 39.0, 33.0, 29.0, 38.0, 42.0, 37.0, 29.0, 43.0, 35.0, 46.0, 31.0, 34.0, 38.0, 36.0, 24.0, 27.0, 26.0, 21.0, 25.0, 15.0, 16.0, 12.0, 18.0, 13.0, 6.0, 6.0, 8.0, 9.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.51362228393555, -47.64765930175781, -45.781700134277344, -43.91573715209961, -42.049774169921875, -40.183815002441406, -38.31785202026367, -36.45188903808594, -34.58592987060547, -32.719966888427734, -30.854007720947266, -28.98804473876953, -27.12208366394043, -25.256122589111328, -23.390159606933594, -21.524198532104492, -19.65823745727539, -17.79227638244629, -15.926314353942871, -14.060352325439453, -12.194391250610352, -10.32843017578125, -8.462468147277832, -6.596506118774414, -4.7305450439453125, -2.8645834922790527, -0.998621940612793, 0.8673396110534668, 2.7333011627197266, 4.599262237548828, 6.465224266052246, 8.331186294555664, 10.1971435546875, 12.063104629516602, 13.92906665802002, 15.795028686523438, 17.66098976135254, 19.52695083618164, 21.392913818359375, 23.258874893188477, 25.124835968017578, 26.99079704284668, 28.85675811767578, 30.722721099853516, 32.58868408203125, 34.45464324951172, 36.32060623168945, 38.18656921386719, 40.052528381347656, 41.91849136352539, 43.78445053100586, 45.650413513183594, 47.51637268066406, 49.3823356628418, 51.24829864501953, 53.1142578125, 54.980220794677734, 56.84618377685547, 58.71214294433594, 60.57810592651367, 62.444068908691406, 64.31002807617188, 66.17598724365234, 68.04195404052734, 69.90791320800781]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 8.0, 18.0, 34.0, 37.0, 66.0, 123.0, 171.0, 322.0, 458.0, 759.0, 1244.0, 1875.0, 3155.0, 4690.0, 7238.0, 10788.0, 15990.0, 23160.0, 32884.0, 44462.0, 58545.0, 74099.0, 89667.0, 107658.0, 129804.0, 100719.0, 85855.0, 69099.0, 53624.0, 40702.0, 29076.0, 20645.0, 14196.0, 9677.0, 6168.0, 4132.0, 2774.0, 1705.0, 1064.0, 714.0, 446.0, 272.0, 155.0, 104.0, 60.0, 60.0, 24.0, 14.0, 8.0, 5.0, 2.0, 3.0, 1.0], "bins": [-200.125, -194.462890625, -188.80078125, -183.138671875, -177.4765625, -171.814453125, -166.15234375, -160.490234375, -154.828125, -149.166015625, -143.50390625, -137.841796875, -132.1796875, -126.517578125, -120.85546875, -115.193359375, -109.53125, -103.869140625, -98.20703125, -92.544921875, -86.8828125, -81.220703125, -75.55859375, -69.896484375, -64.234375, -58.572265625, -52.91015625, -47.248046875, -41.5859375, -35.923828125, -30.26171875, -24.599609375, -18.9375, -13.275390625, -7.61328125, -1.951171875, 3.7109375, 9.373046875, 15.03515625, 20.697265625, 26.359375, 32.021484375, 37.68359375, 43.345703125, 49.0078125, 54.669921875, 60.33203125, 65.994140625, 71.65625, 77.318359375, 82.98046875, 88.642578125, 94.3046875, 99.966796875, 105.62890625, 111.291015625, 116.953125, 122.615234375, 128.27734375, 133.939453125, 139.6015625, 145.263671875, 150.92578125, 156.587890625, 162.25]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 8.0, 13.0, 7.0, 11.0, 13.0, 19.0, 23.0, 19.0, 17.0, 33.0, 31.0, 40.0, 48.0, 35.0, 33.0, 33.0, 58.0, 49.0, 58.0, 48.0, 39.0, 42.0, 35.0, 30.0, 36.0, 31.0, 29.0, 18.0, 15.0, 20.0, 16.0, 9.0, 14.0, 10.0, 11.0, 8.0, 4.0, 6.0, 2.0, 6.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-78.375, -75.9140625, -73.453125, -70.9921875, -68.53125, -66.0703125, -63.609375, -61.1484375, -58.6875, -56.2265625, -53.765625, -51.3046875, -48.84375, -46.3828125, -43.921875, -41.4609375, -39.0, -36.5390625, -34.078125, -31.6171875, -29.15625, -26.6953125, -24.234375, -21.7734375, -19.3125, -16.8515625, -14.390625, -11.9296875, -9.46875, -7.0078125, -4.546875, -2.0859375, 0.375, 2.8359375, 5.296875, 7.7578125, 10.21875, 12.6796875, 15.140625, 17.6015625, 20.0625, 22.5234375, 24.984375, 27.4453125, 29.90625, 32.3671875, 34.828125, 37.2890625, 39.75, 42.2109375, 44.671875, 47.1328125, 49.59375, 52.0546875, 54.515625, 56.9765625, 59.4375, 61.8984375, 64.359375, 66.8203125, 69.28125, 71.7421875, 74.203125, 76.6640625, 79.125]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 11.0, 8.0, 12.0, 23.0, 7.0, 27.0, 23.0, 29.0, 31.0, 29.0, 36.0, 35.0, 45.0, 63.0, 40.0, 53.0, 65.0, 51.0, 62.0, 46.0, 45.0, 42.0, 34.0, 24.0, 29.0, 24.0, 12.0, 21.0, 8.0, 9.0, 14.0, 14.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.182701110839844, -55.2156982421875, -53.248695373535156, -51.28169250488281, -49.3146858215332, -47.34768295288086, -45.380680084228516, -43.41367721557617, -41.44667053222656, -39.47966766357422, -37.512664794921875, -35.54566192626953, -33.57865524291992, -31.611652374267578, -29.644649505615234, -27.67764663696289, -25.710643768310547, -23.743640899658203, -21.776636123657227, -19.809633255004883, -17.842628479003906, -15.875625610351562, -13.908622741699219, -11.941618919372559, -9.974615097045898, -8.007611274719238, -6.040607929229736, -4.073604583740234, -2.106600761413574, -0.13959693908691406, 1.8274059295654297, 3.79440975189209, 5.76141357421875, 7.72841739654541, 9.69542121887207, 11.662424087524414, 13.629427909851074, 15.596431732177734, 17.563434600830078, 19.530437469482422, 21.4974422454834, 23.464445114135742, 25.43144989013672, 27.398452758789062, 29.365455627441406, 31.332460403442383, 33.299461364746094, 35.2664680480957, 37.23347091674805, 39.20047378540039, 41.167476654052734, 43.134483337402344, 45.10148620605469, 47.06848907470703, 49.035491943359375, 51.00249481201172, 52.96949768066406, 54.936500549316406, 56.90350341796875, 58.870506286621094, 60.8375129699707, 62.80451583862305, 64.77151489257812, 66.738525390625, 68.70552825927734]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 8.0, 9.0, 10.0, 12.0, 10.0, 8.0, 20.0, 22.0, 31.0, 30.0, 42.0, 34.0, 34.0, 44.0, 48.0, 53.0, 47.0, 52.0, 49.0, 53.0, 47.0, 49.0, 32.0, 49.0, 39.0, 27.0, 29.0, 17.0, 14.0, 20.0, 13.0, 14.0, 4.0, 6.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.51104736328125, -48.61479568481445, -46.71854019165039, -44.822288513183594, -42.92603302001953, -41.029781341552734, -39.13352584838867, -37.237274169921875, -35.34101867675781, -33.444766998291016, -31.548511505126953, -29.652257919311523, -27.756004333496094, -25.859752655029297, -23.963497161865234, -22.067245483398438, -20.170991897583008, -18.274738311767578, -16.37848472595215, -14.482231140136719, -12.585977554321289, -10.689724922180176, -8.793471336364746, -6.897217750549316, -5.000964164733887, -3.104710578918457, -1.2084572315216064, 0.6877961158752441, 2.584049701690674, 4.480302810668945, 6.376556396484375, 8.272809982299805, 10.169063568115234, 12.065317153930664, 13.961570739746094, 15.857824325561523, 17.754077911376953, 19.65032958984375, 21.546585083007812, 23.44283676147461, 25.339092254638672, 27.2353458404541, 29.13159942626953, 31.02785301208496, 32.92410659790039, 34.82035827636719, 36.71661376953125, 38.61286544799805, 40.509117126464844, 42.40536880493164, 44.3016242980957, 46.1978759765625, 48.09413146972656, 49.99038314819336, 51.88663864135742, 53.78289031982422, 55.67914581298828, 57.57539749145508, 59.47165298461914, 61.36790466308594, 63.26416015625, 65.16041564941406, 67.0566635131836, 68.95291900634766, 70.84917449951172]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 16.0, 21.0, 31.0, 55.0, 96.0, 151.0, 266.0, 434.0, 823.0, 1445.0, 2507.0, 4580.0, 8153.0, 14302.0, 25838.0, 46285.0, 82545.0, 147778.0, 259956.0, 440787.0, 686096.0, 819643.0, 663261.0, 421897.0, 246521.0, 140552.0, 78823.0, 43523.0, 24716.0, 13808.0, 7964.0, 4551.0, 2730.0, 1641.0, 944.0, 598.0, 339.0, 190.0, 141.0, 99.0, 61.0, 37.0, 27.0, 14.0, 10.0, 10.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-63.53125, -61.21728515625, -58.9033203125, -56.58935546875, -54.275390625, -51.96142578125, -49.6474609375, -47.33349609375, -45.01953125, -42.70556640625, -40.3916015625, -38.07763671875, -35.763671875, -33.44970703125, -31.1357421875, -28.82177734375, -26.5078125, -24.19384765625, -21.8798828125, -19.56591796875, -17.251953125, -14.93798828125, -12.6240234375, -10.31005859375, -7.99609375, -5.68212890625, -3.3681640625, -1.05419921875, 1.259765625, 3.57373046875, 5.8876953125, 8.20166015625, 10.515625, 12.82958984375, 15.1435546875, 17.45751953125, 19.771484375, 22.08544921875, 24.3994140625, 26.71337890625, 29.02734375, 31.34130859375, 33.6552734375, 35.96923828125, 38.283203125, 40.59716796875, 42.9111328125, 45.22509765625, 47.5390625, 49.85302734375, 52.1669921875, 54.48095703125, 56.794921875, 59.10888671875, 61.4228515625, 63.73681640625, 66.05078125, 68.36474609375, 70.6787109375, 72.99267578125, 75.306640625, 77.62060546875, 79.9345703125, 82.24853515625, 84.5625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 11.0, 14.0, 14.0, 16.0, 20.0, 23.0, 34.0, 29.0, 35.0, 35.0, 46.0, 47.0, 56.0, 45.0, 55.0, 54.0, 52.0, 45.0, 39.0, 52.0, 41.0, 37.0, 46.0, 31.0, 26.0, 14.0, 13.0, 4.0, 5.0, 9.0, 9.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.25, -41.75048828125, -40.2509765625, -38.75146484375, -37.251953125, -35.75244140625, -34.2529296875, -32.75341796875, -31.25390625, -29.75439453125, -28.2548828125, -26.75537109375, -25.255859375, -23.75634765625, -22.2568359375, -20.75732421875, -19.2578125, -17.75830078125, -16.2587890625, -14.75927734375, -13.259765625, -11.76025390625, -10.2607421875, -8.76123046875, -7.26171875, -5.76220703125, -4.2626953125, -2.76318359375, -1.263671875, 0.23583984375, 1.7353515625, 3.23486328125, 4.734375, 6.23388671875, 7.7333984375, 9.23291015625, 10.732421875, 12.23193359375, 13.7314453125, 15.23095703125, 16.73046875, 18.22998046875, 19.7294921875, 21.22900390625, 22.728515625, 24.22802734375, 25.7275390625, 27.22705078125, 28.7265625, 30.22607421875, 31.7255859375, 33.22509765625, 34.724609375, 36.22412109375, 37.7236328125, 39.22314453125, 40.72265625, 42.22216796875, 43.7216796875, 45.22119140625, 46.720703125, 48.22021484375, 49.7197265625, 51.21923828125, 52.71875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 10.0, 15.0, 20.0, 16.0, 38.0, 55.0, 98.0, 122.0, 230.0, 373.0, 528.0, 886.0, 1478.0, 2510.0, 4159.0, 6782.0, 11465.0, 18907.0, 31431.0, 51690.0, 84854.0, 135485.0, 212119.0, 318071.0, 444425.0, 561446.0, 601319.0, 530337.0, 404728.0, 282335.0, 185266.0, 117450.0, 73399.0, 44503.0, 26715.0, 16139.0, 9848.0, 5877.0, 3509.0, 2110.0, 1307.0, 825.0, 513.0, 318.0, 205.0, 136.0, 79.0, 63.0, 35.0, 21.0, 12.0, 9.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-45.875, -44.36328125, -42.8515625, -41.33984375, -39.828125, -38.31640625, -36.8046875, -35.29296875, -33.78125, -32.26953125, -30.7578125, -29.24609375, -27.734375, -26.22265625, -24.7109375, -23.19921875, -21.6875, -20.17578125, -18.6640625, -17.15234375, -15.640625, -14.12890625, -12.6171875, -11.10546875, -9.59375, -8.08203125, -6.5703125, -5.05859375, -3.546875, -2.03515625, -0.5234375, 0.98828125, 2.5, 4.01171875, 5.5234375, 7.03515625, 8.546875, 10.05859375, 11.5703125, 13.08203125, 14.59375, 16.10546875, 17.6171875, 19.12890625, 20.640625, 22.15234375, 23.6640625, 25.17578125, 26.6875, 28.19921875, 29.7109375, 31.22265625, 32.734375, 34.24609375, 35.7578125, 37.26953125, 38.78125, 40.29296875, 41.8046875, 43.31640625, 44.828125, 46.33984375, 47.8515625, 49.36328125, 50.875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 1.0, 7.0, 8.0, 9.0, 17.0, 29.0, 28.0, 28.0, 32.0, 62.0, 51.0, 68.0, 92.0, 97.0, 147.0, 152.0, 175.0, 192.0, 214.0, 227.0, 226.0, 231.0, 215.0, 240.0, 202.0, 176.0, 186.0, 153.0, 154.0, 128.0, 104.0, 76.0, 68.0, 68.0, 35.0, 43.0, 30.0, 32.0, 12.0, 15.0, 10.0, 11.0, 7.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.140625, -21.50048828125, -20.8603515625, -20.22021484375, -19.580078125, -18.93994140625, -18.2998046875, -17.65966796875, -17.01953125, -16.37939453125, -15.7392578125, -15.09912109375, -14.458984375, -13.81884765625, -13.1787109375, -12.53857421875, -11.8984375, -11.25830078125, -10.6181640625, -9.97802734375, -9.337890625, -8.69775390625, -8.0576171875, -7.41748046875, -6.77734375, -6.13720703125, -5.4970703125, -4.85693359375, -4.216796875, -3.57666015625, -2.9365234375, -2.29638671875, -1.65625, -1.01611328125, -0.3759765625, 0.26416015625, 0.904296875, 1.54443359375, 2.1845703125, 2.82470703125, 3.46484375, 4.10498046875, 4.7451171875, 5.38525390625, 6.025390625, 6.66552734375, 7.3056640625, 7.94580078125, 8.5859375, 9.22607421875, 9.8662109375, 10.50634765625, 11.146484375, 11.78662109375, 12.4267578125, 13.06689453125, 13.70703125, 14.34716796875, 14.9873046875, 15.62744140625, 16.267578125, 16.90771484375, 17.5478515625, 18.18798828125, 18.828125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 7.0, 8.0, 11.0, 13.0, 18.0, 13.0, 23.0, 33.0, 36.0, 39.0, 45.0, 39.0, 46.0, 61.0, 63.0, 49.0, 67.0, 58.0, 59.0, 53.0, 31.0, 36.0, 35.0, 27.0, 27.0, 29.0, 15.0, 8.0, 15.0, 11.0, 3.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.269248962402344, -43.37336730957031, -41.47748947143555, -39.58161163330078, -37.68572998046875, -35.78984832763672, -33.89397048950195, -31.998090744018555, -30.102210998535156, -28.206331253051758, -26.31045150756836, -24.41457176208496, -22.518692016601562, -20.622812271118164, -18.726932525634766, -16.831052780151367, -14.935173034667969, -13.03929328918457, -11.143413543701172, -9.247533798217773, -7.351654052734375, -5.455774307250977, -3.559894561767578, -1.6640148162841797, 0.23186492919921875, 2.127744674682617, 4.023624420166016, 5.919504165649414, 7.8153839111328125, 9.711263656616211, 11.60714340209961, 13.503023147583008, 15.398902893066406, 17.294782638549805, 19.190662384033203, 21.0865421295166, 22.982421875, 24.8783016204834, 26.774181365966797, 28.670061111450195, 30.565940856933594, 32.461822509765625, 34.35770034790039, 36.253578186035156, 38.14945983886719, 40.04534149169922, 41.941219329833984, 43.83709716796875, 45.73297882080078, 47.62886047363281, 49.52473831176758, 51.420616149902344, 53.316497802734375, 55.212379455566406, 57.10825729370117, 59.00413513183594, 60.90001678466797, 62.7958984375, 64.6917724609375, 66.58765411376953, 68.48353576660156, 70.3794174194336, 72.27529907226562, 74.17117309570312, 76.06705474853516]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 11.0, 4.0, 6.0, 7.0, 10.0, 7.0, 28.0, 20.0, 22.0, 36.0, 29.0, 30.0, 29.0, 28.0, 45.0, 29.0, 45.0, 48.0, 42.0, 52.0, 45.0, 48.0, 31.0, 44.0, 36.0, 29.0, 33.0, 32.0, 32.0, 19.0, 11.0, 14.0, 25.0, 13.0, 14.0, 5.0, 6.0, 6.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-48.849143981933594, -47.37669372558594, -45.90424346923828, -44.431793212890625, -42.95934295654297, -41.48689651489258, -40.01444625854492, -38.541996002197266, -37.06954574584961, -35.59709548950195, -34.1246452331543, -32.65219497680664, -31.179746627807617, -29.70729637145996, -28.234848022460938, -26.76239776611328, -25.289947509765625, -23.81749725341797, -22.345046997070312, -20.87259864807129, -19.400148391723633, -17.927698135375977, -16.455249786376953, -14.982799530029297, -13.51034927368164, -12.037899017333984, -10.565449714660645, -9.093000411987305, -7.620550155639648, -6.14810037612915, -4.675650596618652, -3.2032012939453125, -1.7307472229003906, -0.2582974433898926, 1.2141523361206055, 2.6866021156311035, 4.159051895141602, 5.6315016746521, 7.103951454162598, 8.576400756835938, 10.048851013183594, 11.52130126953125, 12.99375057220459, 14.46619987487793, 15.938650131225586, 17.411100387573242, 18.883548736572266, 20.355998992919922, 21.828449249267578, 23.300899505615234, 24.77334976196289, 26.245798110961914, 27.71824836730957, 29.190698623657227, 30.66314697265625, 32.135597229003906, 33.60804748535156, 35.08049774169922, 36.552947998046875, 38.02539825439453, 39.49784851074219, 40.97029495239258, 42.442745208740234, 43.91519546508789, 45.38764572143555]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 13.0, 11.0, 12.0, 26.0, 43.0, 65.0, 94.0, 135.0, 195.0, 284.0, 488.0, 747.0, 1136.0, 1742.0, 2637.0, 4138.0, 6570.0, 10245.0, 16094.0, 25837.0, 41213.0, 67497.0, 108350.0, 160409.0, 184000.0, 151532.0, 99920.0, 61648.0, 38228.0, 23792.0, 15055.0, 9291.0, 6188.0, 3783.0, 2534.0, 1592.0, 988.0, 697.0, 435.0, 301.0, 179.0, 122.0, 86.0, 66.0, 37.0, 25.0, 21.0, 20.0, 11.0, 4.0, 8.0, 2.0, 2.0, 5.0, 1.0, 3.0], "bins": [-73.5625, -71.29296875, -69.0234375, -66.75390625, -64.484375, -62.21484375, -59.9453125, -57.67578125, -55.40625, -53.13671875, -50.8671875, -48.59765625, -46.328125, -44.05859375, -41.7890625, -39.51953125, -37.25, -34.98046875, -32.7109375, -30.44140625, -28.171875, -25.90234375, -23.6328125, -21.36328125, -19.09375, -16.82421875, -14.5546875, -12.28515625, -10.015625, -7.74609375, -5.4765625, -3.20703125, -0.9375, 1.33203125, 3.6015625, 5.87109375, 8.140625, 10.41015625, 12.6796875, 14.94921875, 17.21875, 19.48828125, 21.7578125, 24.02734375, 26.296875, 28.56640625, 30.8359375, 33.10546875, 35.375, 37.64453125, 39.9140625, 42.18359375, 44.453125, 46.72265625, 48.9921875, 51.26171875, 53.53125, 55.80078125, 58.0703125, 60.33984375, 62.609375, 64.87890625, 67.1484375, 69.41796875, 71.6875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 10.0, 7.0, 11.0, 10.0, 18.0, 17.0, 13.0, 24.0, 22.0, 24.0, 21.0, 31.0, 32.0, 48.0, 39.0, 41.0, 40.0, 48.0, 39.0, 48.0, 41.0, 59.0, 49.0, 45.0, 35.0, 19.0, 36.0, 21.0, 13.0, 30.0, 15.0, 21.0, 12.0, 14.0, 10.0, 11.0, 2.0, 5.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-45.03125, -43.7021484375, -42.373046875, -41.0439453125, -39.71484375, -38.3857421875, -37.056640625, -35.7275390625, -34.3984375, -33.0693359375, -31.740234375, -30.4111328125, -29.08203125, -27.7529296875, -26.423828125, -25.0947265625, -23.765625, -22.4365234375, -21.107421875, -19.7783203125, -18.44921875, -17.1201171875, -15.791015625, -14.4619140625, -13.1328125, -11.8037109375, -10.474609375, -9.1455078125, -7.81640625, -6.4873046875, -5.158203125, -3.8291015625, -2.5, -1.1708984375, 0.158203125, 1.4873046875, 2.81640625, 4.1455078125, 5.474609375, 6.8037109375, 8.1328125, 9.4619140625, 10.791015625, 12.1201171875, 13.44921875, 14.7783203125, 16.107421875, 17.4365234375, 18.765625, 20.0947265625, 21.423828125, 22.7529296875, 24.08203125, 25.4111328125, 26.740234375, 28.0693359375, 29.3984375, 30.7275390625, 32.056640625, 33.3857421875, 34.71484375, 36.0439453125, 37.373046875, 38.7021484375, 40.03125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 16.0, 27.0, 54.0, 104.0, 137.0, 228.0, 388.0, 591.0, 935.0, 1518.0, 2479.0, 4358.0, 7617.0, 13965.0, 26556.0, 55552.0, 126103.0, 271043.0, 280845.0, 134387.0, 59072.0, 28550.0, 14535.0, 8128.0, 4466.0, 2630.0, 1658.0, 1002.0, 622.0, 351.0, 255.0, 125.0, 75.0, 56.0, 30.0, 22.0, 15.0, 13.0, 6.0, 3.0, 3.0, 6.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-108.125, -104.75, -101.375, -98.0, -94.625, -91.25, -87.875, -84.5, -81.125, -77.75, -74.375, -71.0, -67.625, -64.25, -60.875, -57.5, -54.125, -50.75, -47.375, -44.0, -40.625, -37.25, -33.875, -30.5, -27.125, -23.75, -20.375, -17.0, -13.625, -10.25, -6.875, -3.5, -0.125, 3.25, 6.625, 10.0, 13.375, 16.75, 20.125, 23.5, 26.875, 30.25, 33.625, 37.0, 40.375, 43.75, 47.125, 50.5, 53.875, 57.25, 60.625, 64.0, 67.375, 70.75, 74.125, 77.5, 80.875, 84.25, 87.625, 91.0, 94.375, 97.75, 101.125, 104.5, 107.875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 7.0, 5.0, 6.0, 9.0, 10.0, 11.0, 21.0, 20.0, 23.0, 18.0, 13.0, 18.0, 19.0, 17.0, 21.0, 37.0, 29.0, 25.0, 29.0, 27.0, 26.0, 29.0, 33.0, 36.0, 33.0, 42.0, 34.0, 29.0, 26.0, 37.0, 31.0, 31.0, 27.0, 20.0, 30.0, 19.0, 19.0, 17.0, 21.0, 8.0, 14.0, 11.0, 17.0, 8.0, 6.0, 7.0, 5.0, 2.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-23.34375, -22.622802734375, -21.90185546875, -21.180908203125, -20.4599609375, -19.739013671875, -19.01806640625, -18.297119140625, -17.576171875, -16.855224609375, -16.13427734375, -15.413330078125, -14.6923828125, -13.971435546875, -13.25048828125, -12.529541015625, -11.80859375, -11.087646484375, -10.36669921875, -9.645751953125, -8.9248046875, -8.203857421875, -7.48291015625, -6.761962890625, -6.041015625, -5.320068359375, -4.59912109375, -3.878173828125, -3.1572265625, -2.436279296875, -1.71533203125, -0.994384765625, -0.2734375, 0.447509765625, 1.16845703125, 1.889404296875, 2.6103515625, 3.331298828125, 4.05224609375, 4.773193359375, 5.494140625, 6.215087890625, 6.93603515625, 7.656982421875, 8.3779296875, 9.098876953125, 9.81982421875, 10.540771484375, 11.26171875, 11.982666015625, 12.70361328125, 13.424560546875, 14.1455078125, 14.866455078125, 15.58740234375, 16.308349609375, 17.029296875, 17.750244140625, 18.47119140625, 19.192138671875, 19.9130859375, 20.634033203125, 21.35498046875, 22.075927734375, 22.796875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 22.0, 21.0, 33.0, 52.0, 66.0, 97.0, 181.0, 277.0, 482.0, 684.0, 1171.0, 2097.0, 3694.0, 6525.0, 12418.0, 24696.0, 53254.0, 125378.0, 290463.0, 292903.0, 127251.0, 53853.0, 24975.0, 12446.0, 6581.0, 3646.0, 2060.0, 1225.0, 766.0, 436.0, 294.0, 182.0, 106.0, 78.0, 56.0, 28.0, 19.0, 13.0, 10.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.34375, -42.91357421875, -41.4833984375, -40.05322265625, -38.623046875, -37.19287109375, -35.7626953125, -34.33251953125, -32.90234375, -31.47216796875, -30.0419921875, -28.61181640625, -27.181640625, -25.75146484375, -24.3212890625, -22.89111328125, -21.4609375, -20.03076171875, -18.6005859375, -17.17041015625, -15.740234375, -14.31005859375, -12.8798828125, -11.44970703125, -10.01953125, -8.58935546875, -7.1591796875, -5.72900390625, -4.298828125, -2.86865234375, -1.4384765625, -0.00830078125, 1.421875, 2.85205078125, 4.2822265625, 5.71240234375, 7.142578125, 8.57275390625, 10.0029296875, 11.43310546875, 12.86328125, 14.29345703125, 15.7236328125, 17.15380859375, 18.583984375, 20.01416015625, 21.4443359375, 22.87451171875, 24.3046875, 25.73486328125, 27.1650390625, 28.59521484375, 30.025390625, 31.45556640625, 32.8857421875, 34.31591796875, 35.74609375, 37.17626953125, 38.6064453125, 40.03662109375, 41.466796875, 42.89697265625, 44.3271484375, 45.75732421875, 47.1875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 7.0, 14.0, 15.0, 26.0, 44.0, 46.0, 82.0, 99.0, 142.0, 142.0, 107.0, 83.0, 64.0, 38.0, 26.0, 12.0, 10.0, 5.0, 4.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004093170166015625, -0.0038986802101135254, -0.0037041902542114258, -0.003509700298309326, -0.0033152103424072266, -0.003120720386505127, -0.0029262304306030273, -0.0027317404747009277, -0.002537250518798828, -0.0023427605628967285, -0.002148270606994629, -0.0019537806510925293, -0.0017592906951904297, -0.00156480073928833, -0.0013703107833862305, -0.0011758208274841309, -0.0009813308715820312, -0.0007868409156799316, -0.000592350959777832, -0.0003978610038757324, -0.0002033710479736328, -8.881092071533203e-06, 0.0001856088638305664, 0.000380098819732666, 0.0005745887756347656, 0.0007690787315368652, 0.0009635686874389648, 0.0011580586433410645, 0.001352548599243164, 0.0015470385551452637, 0.0017415285110473633, 0.0019360184669494629, 0.0021305084228515625, 0.002324998378753662, 0.0025194883346557617, 0.0027139782905578613, 0.002908468246459961, 0.0031029582023620605, 0.00329744815826416, 0.0034919381141662598, 0.0036864280700683594, 0.003880918025970459, 0.004075407981872559, 0.004269897937774658, 0.004464387893676758, 0.004658877849578857, 0.004853367805480957, 0.005047857761383057, 0.005242347717285156, 0.005436837673187256, 0.0056313276290893555, 0.005825817584991455, 0.006020307540893555, 0.006214797496795654, 0.006409287452697754, 0.0066037774085998535, 0.006798267364501953, 0.006992757320404053, 0.007187247276306152, 0.007381737232208252, 0.0075762271881103516, 0.007770717144012451, 0.00796520709991455, 0.00815969705581665, 0.00835418701171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 17.0, 15.0, 35.0, 48.0, 69.0, 118.0, 151.0, 251.0, 434.0, 666.0, 1071.0, 1743.0, 3012.0, 5466.0, 9968.0, 18609.0, 36455.0, 74564.0, 147109.0, 238121.0, 230525.0, 138255.0, 68785.0, 33875.0, 17439.0, 9256.0, 5013.0, 2956.0, 1734.0, 1019.0, 610.0, 408.0, 248.0, 170.0, 107.0, 72.0, 41.0, 44.0, 16.0, 12.0, 7.0, 10.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.84375, -46.34619140625, -44.8486328125, -43.35107421875, -41.853515625, -40.35595703125, -38.8583984375, -37.36083984375, -35.86328125, -34.36572265625, -32.8681640625, -31.37060546875, -29.873046875, -28.37548828125, -26.8779296875, -25.38037109375, -23.8828125, -22.38525390625, -20.8876953125, -19.39013671875, -17.892578125, -16.39501953125, -14.8974609375, -13.39990234375, -11.90234375, -10.40478515625, -8.9072265625, -7.40966796875, -5.912109375, -4.41455078125, -2.9169921875, -1.41943359375, 0.078125, 1.57568359375, 3.0732421875, 4.57080078125, 6.068359375, 7.56591796875, 9.0634765625, 10.56103515625, 12.05859375, 13.55615234375, 15.0537109375, 16.55126953125, 18.048828125, 19.54638671875, 21.0439453125, 22.54150390625, 24.0390625, 25.53662109375, 27.0341796875, 28.53173828125, 30.029296875, 31.52685546875, 33.0244140625, 34.52197265625, 36.01953125, 37.51708984375, 39.0146484375, 40.51220703125, 42.009765625, 43.50732421875, 45.0048828125, 46.50244140625, 48.0]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 1.0, 2.0, 7.0, 6.0, 9.0, 17.0, 11.0, 23.0, 21.0, 30.0, 29.0, 52.0, 37.0, 53.0, 71.0, 62.0, 61.0, 53.0, 73.0, 57.0, 36.0, 43.0, 44.0, 31.0, 37.0, 27.0, 24.0, 19.0, 9.0, 5.0, 12.0, 6.0, 6.0, 2.0, 0.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.890625, -10.50146484375, -10.1123046875, -9.72314453125, -9.333984375, -8.94482421875, -8.5556640625, -8.16650390625, -7.77734375, -7.38818359375, -6.9990234375, -6.60986328125, -6.220703125, -5.83154296875, -5.4423828125, -5.05322265625, -4.6640625, -4.27490234375, -3.8857421875, -3.49658203125, -3.107421875, -2.71826171875, -2.3291015625, -1.93994140625, -1.55078125, -1.16162109375, -0.7724609375, -0.38330078125, 0.005859375, 0.39501953125, 0.7841796875, 1.17333984375, 1.5625, 1.95166015625, 2.3408203125, 2.72998046875, 3.119140625, 3.50830078125, 3.8974609375, 4.28662109375, 4.67578125, 5.06494140625, 5.4541015625, 5.84326171875, 6.232421875, 6.62158203125, 7.0107421875, 7.39990234375, 7.7890625, 8.17822265625, 8.5673828125, 8.95654296875, 9.345703125, 9.73486328125, 10.1240234375, 10.51318359375, 10.90234375, 11.29150390625, 11.6806640625, 12.06982421875, 12.458984375, 12.84814453125, 13.2373046875, 13.62646484375, 14.015625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 11.0, 7.0, 15.0, 17.0, 22.0, 34.0, 35.0, 38.0, 50.0, 58.0, 56.0, 58.0, 63.0, 71.0, 64.0, 57.0, 45.0, 47.0, 36.0, 29.0, 36.0, 32.0, 24.0, 22.0, 17.0, 16.0, 5.0, 10.0, 6.0, 8.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.69770431518555, -36.896141052246094, -35.09457778930664, -33.29301452636719, -31.4914493560791, -29.68988609313965, -27.888320922851562, -26.08675765991211, -24.285194396972656, -22.483631134033203, -20.68206787109375, -18.880502700805664, -17.07893943786621, -15.277376174926758, -13.475811958312988, -11.674247741699219, -9.872684478759766, -8.071121215820312, -6.269556999206543, -4.467993259429932, -2.6664295196533203, -0.8648662567138672, 0.9366979598999023, 2.738262176513672, 4.539825439453125, 6.341389179229736, 8.142952919006348, 9.944517135620117, 11.74608039855957, 13.547643661499023, 15.349207878112793, 17.150772094726562, 18.95233917236328, 20.753902435302734, 22.555465698242188, 24.357030868530273, 26.158594131469727, 27.96015739440918, 29.761722564697266, 31.56328582763672, 33.36484909057617, 35.166412353515625, 36.96797561645508, 38.76953887939453, 40.57110595703125, 42.37266540527344, 44.174232482910156, 45.97579574584961, 47.77735900878906, 49.578922271728516, 51.38048553466797, 53.18204879760742, 54.983612060546875, 56.785179138183594, 58.58674240112305, 60.3883056640625, 62.18986892700195, 63.991432189941406, 65.79299926757812, 67.59455871582031, 69.39612579345703, 71.19768524169922, 72.99925231933594, 74.80081176757812, 76.60237884521484]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 8.0, 9.0, 7.0, 8.0, 23.0, 17.0, 24.0, 31.0, 37.0, 19.0, 33.0, 28.0, 30.0, 38.0, 41.0, 37.0, 49.0, 30.0, 51.0, 38.0, 44.0, 39.0, 48.0, 33.0, 31.0, 26.0, 23.0, 26.0, 26.0, 22.0, 19.0, 16.0, 14.0, 11.0, 12.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-40.85141372680664, -39.61397171020508, -38.37652587890625, -37.13908386230469, -35.90163803100586, -34.6641960144043, -33.42675018310547, -32.189308166503906, -30.95186424255371, -29.714420318603516, -28.47697639465332, -27.239532470703125, -26.002090454101562, -24.764644622802734, -23.527202606201172, -22.289758682250977, -21.05231475830078, -19.814870834350586, -18.57742691040039, -17.339982986450195, -16.1025390625, -14.865096092224121, -13.627653121948242, -12.390209197998047, -11.152765274047852, -9.915321350097656, -8.677877426147461, -7.440434455871582, -6.202990531921387, -4.965546607971191, -3.7281031608581543, -2.490659713745117, -1.2532196044921875, -0.01577591896057129, 1.221667766571045, 2.459111452102661, 3.6965551376342773, 4.933999061584473, 6.17144250869751, 7.408885955810547, 8.646329879760742, 9.883773803710938, 11.121217727661133, 12.358660697937012, 13.596104621887207, 14.833548545837402, 16.07099151611328, 17.308435440063477, 18.545879364013672, 19.783323287963867, 21.020767211914062, 22.258211135864258, 23.495655059814453, 24.733097076416016, 25.97054100036621, 27.207984924316406, 28.4454288482666, 29.682872772216797, 30.920316696166992, 32.15776062011719, 33.39520263671875, 34.63264846801758, 35.87009048461914, 37.10753631591797, 38.34497833251953]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 11.0, 10.0, 26.0, 32.0, 63.0, 110.0, 153.0, 254.0, 421.0, 703.0, 1027.0, 1736.0, 2770.0, 4502.0, 7022.0, 11031.0, 17251.0, 25875.0, 38091.0, 53853.0, 72079.0, 92027.0, 107990.0, 116802.0, 113589.0, 100501.0, 82478.0, 62547.0, 45448.0, 31491.0, 21086.0, 13741.0, 8895.0, 5672.0, 3508.0, 2174.0, 1408.0, 799.0, 509.0, 362.0, 201.0, 124.0, 75.0, 46.0, 29.0, 13.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.71875, -42.2490234375, -40.779296875, -39.3095703125, -37.83984375, -36.3701171875, -34.900390625, -33.4306640625, -31.9609375, -30.4912109375, -29.021484375, -27.5517578125, -26.08203125, -24.6123046875, -23.142578125, -21.6728515625, -20.203125, -18.7333984375, -17.263671875, -15.7939453125, -14.32421875, -12.8544921875, -11.384765625, -9.9150390625, -8.4453125, -6.9755859375, -5.505859375, -4.0361328125, -2.56640625, -1.0966796875, 0.373046875, 1.8427734375, 3.3125, 4.7822265625, 6.251953125, 7.7216796875, 9.19140625, 10.6611328125, 12.130859375, 13.6005859375, 15.0703125, 16.5400390625, 18.009765625, 19.4794921875, 20.94921875, 22.4189453125, 23.888671875, 25.3583984375, 26.828125, 28.2978515625, 29.767578125, 31.2373046875, 32.70703125, 34.1767578125, 35.646484375, 37.1162109375, 38.5859375, 40.0556640625, 41.525390625, 42.9951171875, 44.46484375, 45.9345703125, 47.404296875, 48.8740234375, 50.34375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 6.0, 9.0, 16.0, 11.0, 15.0, 16.0, 25.0, 22.0, 23.0, 38.0, 27.0, 35.0, 27.0, 51.0, 45.0, 37.0, 37.0, 37.0, 48.0, 38.0, 50.0, 39.0, 28.0, 38.0, 39.0, 26.0, 25.0, 27.0, 22.0, 24.0, 16.0, 11.0, 22.0, 16.0, 7.0, 9.0, 4.0, 3.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-39.28125, -38.08642578125, -36.8916015625, -35.69677734375, -34.501953125, -33.30712890625, -32.1123046875, -30.91748046875, -29.72265625, -28.52783203125, -27.3330078125, -26.13818359375, -24.943359375, -23.74853515625, -22.5537109375, -21.35888671875, -20.1640625, -18.96923828125, -17.7744140625, -16.57958984375, -15.384765625, -14.18994140625, -12.9951171875, -11.80029296875, -10.60546875, -9.41064453125, -8.2158203125, -7.02099609375, -5.826171875, -4.63134765625, -3.4365234375, -2.24169921875, -1.046875, 0.14794921875, 1.3427734375, 2.53759765625, 3.732421875, 4.92724609375, 6.1220703125, 7.31689453125, 8.51171875, 9.70654296875, 10.9013671875, 12.09619140625, 13.291015625, 14.48583984375, 15.6806640625, 16.87548828125, 18.0703125, 19.26513671875, 20.4599609375, 21.65478515625, 22.849609375, 24.04443359375, 25.2392578125, 26.43408203125, 27.62890625, 28.82373046875, 30.0185546875, 31.21337890625, 32.408203125, 33.60302734375, 34.7978515625, 35.99267578125, 37.1875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 4.0, 13.0, 11.0, 33.0, 39.0, 70.0, 112.0, 151.0, 276.0, 439.0, 667.0, 1081.0, 1836.0, 2959.0, 4610.0, 7555.0, 12106.0, 19502.0, 30831.0, 45638.0, 64786.0, 86369.0, 107231.0, 120021.0, 122455.0, 112400.0, 92799.0, 70961.0, 50805.0, 33913.0, 22165.0, 13952.0, 8784.0, 5448.0, 3234.0, 2054.0, 1162.0, 785.0, 450.0, 281.0, 210.0, 129.0, 75.0, 59.0, 40.0, 27.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.03125, -52.35009765625, -50.6689453125, -48.98779296875, -47.306640625, -45.62548828125, -43.9443359375, -42.26318359375, -40.58203125, -38.90087890625, -37.2197265625, -35.53857421875, -33.857421875, -32.17626953125, -30.4951171875, -28.81396484375, -27.1328125, -25.45166015625, -23.7705078125, -22.08935546875, -20.408203125, -18.72705078125, -17.0458984375, -15.36474609375, -13.68359375, -12.00244140625, -10.3212890625, -8.64013671875, -6.958984375, -5.27783203125, -3.5966796875, -1.91552734375, -0.234375, 1.44677734375, 3.1279296875, 4.80908203125, 6.490234375, 8.17138671875, 9.8525390625, 11.53369140625, 13.21484375, 14.89599609375, 16.5771484375, 18.25830078125, 19.939453125, 21.62060546875, 23.3017578125, 24.98291015625, 26.6640625, 28.34521484375, 30.0263671875, 31.70751953125, 33.388671875, 35.06982421875, 36.7509765625, 38.43212890625, 40.11328125, 41.79443359375, 43.4755859375, 45.15673828125, 46.837890625, 48.51904296875, 50.2001953125, 51.88134765625, 53.5625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 8.0, 14.0, 7.0, 15.0, 9.0, 13.0, 19.0, 19.0, 20.0, 18.0, 28.0, 31.0, 31.0, 26.0, 34.0, 51.0, 36.0, 33.0, 35.0, 52.0, 46.0, 43.0, 40.0, 35.0, 33.0, 31.0, 37.0, 38.0, 25.0, 24.0, 21.0, 20.0, 19.0, 13.0, 14.0, 11.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.953125, -23.16748046875, -22.3818359375, -21.59619140625, -20.810546875, -20.02490234375, -19.2392578125, -18.45361328125, -17.66796875, -16.88232421875, -16.0966796875, -15.31103515625, -14.525390625, -13.73974609375, -12.9541015625, -12.16845703125, -11.3828125, -10.59716796875, -9.8115234375, -9.02587890625, -8.240234375, -7.45458984375, -6.6689453125, -5.88330078125, -5.09765625, -4.31201171875, -3.5263671875, -2.74072265625, -1.955078125, -1.16943359375, -0.3837890625, 0.40185546875, 1.1875, 1.97314453125, 2.7587890625, 3.54443359375, 4.330078125, 5.11572265625, 5.9013671875, 6.68701171875, 7.47265625, 8.25830078125, 9.0439453125, 9.82958984375, 10.615234375, 11.40087890625, 12.1865234375, 12.97216796875, 13.7578125, 14.54345703125, 15.3291015625, 16.11474609375, 16.900390625, 17.68603515625, 18.4716796875, 19.25732421875, 20.04296875, 20.82861328125, 21.6142578125, 22.39990234375, 23.185546875, 23.97119140625, 24.7568359375, 25.54248046875, 26.328125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 11.0, 14.0, 21.0, 31.0, 46.0, 63.0, 105.0, 138.0, 212.0, 331.0, 442.0, 771.0, 1236.0, 2005.0, 3479.0, 6055.0, 10903.0, 20275.0, 38354.0, 71274.0, 125981.0, 185665.0, 203829.0, 160687.0, 98838.0, 53955.0, 28405.0, 15353.0, 8314.0, 4698.0, 2628.0, 1634.0, 986.0, 626.0, 395.0, 253.0, 177.0, 121.0, 75.0, 54.0, 37.0, 26.0, 22.0, 11.0, 10.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.5, -21.780517578125, -21.06103515625, -20.341552734375, -19.6220703125, -18.902587890625, -18.18310546875, -17.463623046875, -16.744140625, -16.024658203125, -15.30517578125, -14.585693359375, -13.8662109375, -13.146728515625, -12.42724609375, -11.707763671875, -10.98828125, -10.268798828125, -9.54931640625, -8.829833984375, -8.1103515625, -7.390869140625, -6.67138671875, -5.951904296875, -5.232421875, -4.512939453125, -3.79345703125, -3.073974609375, -2.3544921875, -1.635009765625, -0.91552734375, -0.196044921875, 0.5234375, 1.242919921875, 1.96240234375, 2.681884765625, 3.4013671875, 4.120849609375, 4.84033203125, 5.559814453125, 6.279296875, 6.998779296875, 7.71826171875, 8.437744140625, 9.1572265625, 9.876708984375, 10.59619140625, 11.315673828125, 12.03515625, 12.754638671875, 13.47412109375, 14.193603515625, 14.9130859375, 15.632568359375, 16.35205078125, 17.071533203125, 17.791015625, 18.510498046875, 19.22998046875, 19.949462890625, 20.6689453125, 21.388427734375, 22.10791015625, 22.827392578125, 23.546875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 6.0, 4.0, 8.0, 5.0, 11.0, 8.0, 11.0, 18.0, 17.0, 15.0, 27.0, 29.0, 30.0, 38.0, 66.0, 47.0, 55.0, 64.0, 70.0, 67.0, 55.0, 43.0, 42.0, 40.0, 37.0, 34.0, 30.0, 28.0, 18.0, 13.0, 13.0, 12.0, 9.0, 8.0, 5.0, 4.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0020751953125, -0.002010852098464966, -0.0019465088844299316, -0.0018821656703948975, -0.0018178224563598633, -0.001753479242324829, -0.001689136028289795, -0.0016247928142547607, -0.0015604496002197266, -0.0014961063861846924, -0.0014317631721496582, -0.001367419958114624, -0.0013030767440795898, -0.0012387335300445557, -0.0011743903160095215, -0.0011100471019744873, -0.0010457038879394531, -0.000981360673904419, -0.0009170174598693848, -0.0008526742458343506, -0.0007883310317993164, -0.0007239878177642822, -0.000659644603729248, -0.0005953013896942139, -0.0005309581756591797, -0.0004666149616241455, -0.00040227174758911133, -0.00033792853355407715, -0.00027358531951904297, -0.0002092421054840088, -0.0001448988914489746, -8.055567741394043e-05, -1.621246337890625e-05, 4.813075065612793e-05, 0.00011247396469116211, 0.0001768171787261963, 0.00024116039276123047, 0.00030550360679626465, 0.00036984682083129883, 0.000434190034866333, 0.0004985332489013672, 0.0005628764629364014, 0.0006272196769714355, 0.0006915628910064697, 0.0007559061050415039, 0.0008202493190765381, 0.0008845925331115723, 0.0009489357471466064, 0.0010132789611816406, 0.0010776221752166748, 0.001141965389251709, 0.0012063086032867432, 0.0012706518173217773, 0.0013349950313568115, 0.0013993382453918457, 0.0014636814594268799, 0.001528024673461914, 0.0015923678874969482, 0.0016567111015319824, 0.0017210543155670166, 0.0017853975296020508, 0.001849740743637085, 0.0019140839576721191, 0.0019784271717071533, 0.0020427703857421875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 10.0, 15.0, 23.0, 28.0, 35.0, 50.0, 87.0, 112.0, 169.0, 274.0, 427.0, 722.0, 1253.0, 2121.0, 3827.0, 7307.0, 15171.0, 32942.0, 71392.0, 146080.0, 230943.0, 236857.0, 153859.0, 76115.0, 35063.0, 16371.0, 7906.0, 3912.0, 2123.0, 1273.0, 749.0, 457.0, 297.0, 196.0, 119.0, 88.0, 60.0, 36.0, 25.0, 13.0, 21.0, 7.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-27.875, -27.05615234375, -26.2373046875, -25.41845703125, -24.599609375, -23.78076171875, -22.9619140625, -22.14306640625, -21.32421875, -20.50537109375, -19.6865234375, -18.86767578125, -18.048828125, -17.22998046875, -16.4111328125, -15.59228515625, -14.7734375, -13.95458984375, -13.1357421875, -12.31689453125, -11.498046875, -10.67919921875, -9.8603515625, -9.04150390625, -8.22265625, -7.40380859375, -6.5849609375, -5.76611328125, -4.947265625, -4.12841796875, -3.3095703125, -2.49072265625, -1.671875, -0.85302734375, -0.0341796875, 0.78466796875, 1.603515625, 2.42236328125, 3.2412109375, 4.06005859375, 4.87890625, 5.69775390625, 6.5166015625, 7.33544921875, 8.154296875, 8.97314453125, 9.7919921875, 10.61083984375, 11.4296875, 12.24853515625, 13.0673828125, 13.88623046875, 14.705078125, 15.52392578125, 16.3427734375, 17.16162109375, 17.98046875, 18.79931640625, 19.6181640625, 20.43701171875, 21.255859375, 22.07470703125, 22.8935546875, 23.71240234375, 24.53125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 1.0, 7.0, 8.0, 9.0, 4.0, 8.0, 9.0, 12.0, 28.0, 8.0, 39.0, 27.0, 41.0, 41.0, 51.0, 40.0, 62.0, 53.0, 55.0, 54.0, 63.0, 40.0, 55.0, 41.0, 42.0, 42.0, 36.0, 20.0, 20.0, 20.0, 14.0, 14.0, 5.0, 5.0, 5.0, 5.0, 5.0, 5.0, 1.0, 6.0, 4.0], "bins": [-8.8203125, -8.60888671875, -8.3974609375, -8.18603515625, -7.974609375, -7.76318359375, -7.5517578125, -7.34033203125, -7.12890625, -6.91748046875, -6.7060546875, -6.49462890625, -6.283203125, -6.07177734375, -5.8603515625, -5.64892578125, -5.4375, -5.22607421875, -5.0146484375, -4.80322265625, -4.591796875, -4.38037109375, -4.1689453125, -3.95751953125, -3.74609375, -3.53466796875, -3.3232421875, -3.11181640625, -2.900390625, -2.68896484375, -2.4775390625, -2.26611328125, -2.0546875, -1.84326171875, -1.6318359375, -1.42041015625, -1.208984375, -0.99755859375, -0.7861328125, -0.57470703125, -0.36328125, -0.15185546875, 0.0595703125, 0.27099609375, 0.482421875, 0.69384765625, 0.9052734375, 1.11669921875, 1.328125, 1.53955078125, 1.7509765625, 1.96240234375, 2.173828125, 2.38525390625, 2.5966796875, 2.80810546875, 3.01953125, 3.23095703125, 3.4423828125, 3.65380859375, 3.865234375, 4.07666015625, 4.2880859375, 4.49951171875, 4.7109375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 11.0, 9.0, 15.0, 17.0, 25.0, 19.0, 28.0, 22.0, 51.0, 38.0, 45.0, 51.0, 56.0, 50.0, 63.0, 54.0, 44.0, 48.0, 55.0, 36.0, 38.0, 27.0, 31.0, 24.0, 29.0, 21.0, 13.0, 20.0, 9.0, 10.0, 4.0, 10.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.2425422668457, -38.69725799560547, -37.151973724365234, -35.606689453125, -34.061405181884766, -32.51612091064453, -30.970836639404297, -29.425552368164062, -27.880268096923828, -26.334983825683594, -24.78969955444336, -23.244415283203125, -21.69913101196289, -20.153846740722656, -18.608562469482422, -17.063278198242188, -15.517993927001953, -13.972709655761719, -12.427425384521484, -10.88214111328125, -9.336856842041016, -7.791572570800781, -6.246288299560547, -4.7010040283203125, -3.155719757080078, -1.6104354858398438, -0.06515121459960938, 1.480133056640625, 3.0254173278808594, 4.570701599121094, 6.115985870361328, 7.6612701416015625, 9.206554412841797, 10.751838684082031, 12.297122955322266, 13.8424072265625, 15.387691497802734, 16.93297576904297, 18.478260040283203, 20.023544311523438, 21.568828582763672, 23.114112854003906, 24.65939712524414, 26.204681396484375, 27.74996566772461, 29.295249938964844, 30.840534210205078, 32.38581848144531, 33.93110275268555, 35.47638702392578, 37.021671295166016, 38.56695556640625, 40.112239837646484, 41.65752410888672, 43.20280838012695, 44.74809265136719, 46.29337692260742, 47.838661193847656, 49.38394546508789, 50.929229736328125, 52.47451400756836, 54.019798278808594, 55.56508255004883, 57.11036682128906, 58.6556510925293]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 11.0, 10.0, 9.0, 23.0, 24.0, 23.0, 22.0, 16.0, 33.0, 18.0, 26.0, 29.0, 40.0, 33.0, 41.0, 30.0, 44.0, 39.0, 38.0, 35.0, 34.0, 42.0, 27.0, 40.0, 28.0, 29.0, 19.0, 31.0, 23.0, 24.0, 26.0, 19.0, 18.0, 12.0, 15.0, 7.0, 12.0, 6.0, 4.0, 5.0, 7.0, 5.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0], "bins": [-39.16324996948242, -38.02390670776367, -36.88456344604492, -35.74522018432617, -34.60587692260742, -33.46653366088867, -32.32719039916992, -31.187849044799805, -30.048505783081055, -28.909162521362305, -27.769819259643555, -26.630475997924805, -25.491134643554688, -24.351791381835938, -23.212448120117188, -22.073104858398438, -20.933761596679688, -19.794418334960938, -18.655075073242188, -17.515731811523438, -16.376388549804688, -15.237046241760254, -14.09770393371582, -12.95836067199707, -11.81901741027832, -10.67967414855957, -9.54033088684082, -8.400988578796387, -7.261645317077637, -6.122302055358887, -4.982959270477295, -3.843616485595703, -2.7042770385742188, -1.5649340152740479, -0.42559099197387695, 0.713752031326294, 1.8530950546264648, 2.992438316345215, 4.131781101226807, 5.271123886108398, 6.410467147827148, 7.549810409545898, 8.689153671264648, 9.828495979309082, 10.967839241027832, 12.107182502746582, 13.246524810791016, 14.385868072509766, 15.525211334228516, 16.664554595947266, 17.803897857666016, 18.943241119384766, 20.082584381103516, 21.221927642822266, 22.361268997192383, 23.500612258911133, 24.639955520629883, 25.779298782348633, 26.918642044067383, 28.057985305786133, 29.19732666015625, 30.336669921875, 31.47601318359375, 32.6153564453125, 33.75469970703125]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 8.0, 17.0, 18.0, 29.0, 29.0, 49.0, 95.0, 154.0, 233.0, 369.0, 522.0, 937.0, 1538.0, 2374.0, 4017.0, 6590.0, 10693.0, 18018.0, 29717.0, 49750.0, 82474.0, 138150.0, 229933.0, 376963.0, 584537.0, 743443.0, 683460.0, 476570.0, 297640.0, 179686.0, 108872.0, 65449.0, 39826.0, 24227.0, 14580.0, 8886.0, 5424.0, 3373.0, 2175.0, 1286.0, 785.0, 517.0, 337.0, 182.0, 112.0, 92.0, 54.0, 29.0, 21.0, 15.0, 11.0, 7.0, 4.0, 1.0], "bins": [-53.125, -51.6396484375, -50.154296875, -48.6689453125, -47.18359375, -45.6982421875, -44.212890625, -42.7275390625, -41.2421875, -39.7568359375, -38.271484375, -36.7861328125, -35.30078125, -33.8154296875, -32.330078125, -30.8447265625, -29.359375, -27.8740234375, -26.388671875, -24.9033203125, -23.41796875, -21.9326171875, -20.447265625, -18.9619140625, -17.4765625, -15.9912109375, -14.505859375, -13.0205078125, -11.53515625, -10.0498046875, -8.564453125, -7.0791015625, -5.59375, -4.1083984375, -2.623046875, -1.1376953125, 0.34765625, 1.8330078125, 3.318359375, 4.8037109375, 6.2890625, 7.7744140625, 9.259765625, 10.7451171875, 12.23046875, 13.7158203125, 15.201171875, 16.6865234375, 18.171875, 19.6572265625, 21.142578125, 22.6279296875, 24.11328125, 25.5986328125, 27.083984375, 28.5693359375, 30.0546875, 31.5400390625, 33.025390625, 34.5107421875, 35.99609375, 37.4814453125, 38.966796875, 40.4521484375, 41.9375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 4.0, 4.0, 4.0, 8.0, 16.0, 10.0, 8.0, 15.0, 17.0, 17.0, 33.0, 33.0, 31.0, 28.0, 34.0, 40.0, 32.0, 37.0, 29.0, 45.0, 41.0, 38.0, 35.0, 49.0, 55.0, 35.0, 31.0, 27.0, 26.0, 35.0, 24.0, 14.0, 22.0, 17.0, 20.0, 21.0, 14.0, 10.0, 8.0, 4.0, 8.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.671875, -23.80029296875, -22.9287109375, -22.05712890625, -21.185546875, -20.31396484375, -19.4423828125, -18.57080078125, -17.69921875, -16.82763671875, -15.9560546875, -15.08447265625, -14.212890625, -13.34130859375, -12.4697265625, -11.59814453125, -10.7265625, -9.85498046875, -8.9833984375, -8.11181640625, -7.240234375, -6.36865234375, -5.4970703125, -4.62548828125, -3.75390625, -2.88232421875, -2.0107421875, -1.13916015625, -0.267578125, 0.60400390625, 1.4755859375, 2.34716796875, 3.21875, 4.09033203125, 4.9619140625, 5.83349609375, 6.705078125, 7.57666015625, 8.4482421875, 9.31982421875, 10.19140625, 11.06298828125, 11.9345703125, 12.80615234375, 13.677734375, 14.54931640625, 15.4208984375, 16.29248046875, 17.1640625, 18.03564453125, 18.9072265625, 19.77880859375, 20.650390625, 21.52197265625, 22.3935546875, 23.26513671875, 24.13671875, 25.00830078125, 25.8798828125, 26.75146484375, 27.623046875, 28.49462890625, 29.3662109375, 30.23779296875, 31.109375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 8.0, 9.0, 11.0, 22.0, 31.0, 49.0, 75.0, 120.0, 191.0, 291.0, 554.0, 794.0, 1246.0, 2182.0, 3563.0, 6066.0, 10119.0, 17313.0, 29372.0, 49018.0, 81839.0, 134211.0, 215313.0, 330361.0, 471421.0, 596000.0, 625062.0, 534853.0, 393463.0, 264514.0, 168139.0, 102836.0, 63005.0, 37220.0, 22253.0, 12952.0, 7832.0, 4569.0, 2877.0, 1749.0, 1051.0, 658.0, 401.0, 233.0, 165.0, 97.0, 64.0, 33.0, 30.0, 17.0, 10.0, 12.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-38.84375, -37.638671875, -36.43359375, -35.228515625, -34.0234375, -32.818359375, -31.61328125, -30.408203125, -29.203125, -27.998046875, -26.79296875, -25.587890625, -24.3828125, -23.177734375, -21.97265625, -20.767578125, -19.5625, -18.357421875, -17.15234375, -15.947265625, -14.7421875, -13.537109375, -12.33203125, -11.126953125, -9.921875, -8.716796875, -7.51171875, -6.306640625, -5.1015625, -3.896484375, -2.69140625, -1.486328125, -0.28125, 0.923828125, 2.12890625, 3.333984375, 4.5390625, 5.744140625, 6.94921875, 8.154296875, 9.359375, 10.564453125, 11.76953125, 12.974609375, 14.1796875, 15.384765625, 16.58984375, 17.794921875, 19.0, 20.205078125, 21.41015625, 22.615234375, 23.8203125, 25.025390625, 26.23046875, 27.435546875, 28.640625, 29.845703125, 31.05078125, 32.255859375, 33.4609375, 34.666015625, 35.87109375, 37.076171875, 38.28125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 8.0, 9.0, 12.0, 25.0, 33.0, 33.0, 38.0, 46.0, 70.0, 91.0, 87.0, 98.0, 129.0, 146.0, 169.0, 198.0, 187.0, 193.0, 240.0, 220.0, 224.0, 214.0, 220.0, 181.0, 183.0, 165.0, 140.0, 132.0, 120.0, 92.0, 87.0, 62.0, 48.0, 34.0, 27.0, 21.0, 14.0, 12.0, 20.0, 10.0, 11.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.5, -15.0159912109375, -14.531982421875, -14.0479736328125, -13.56396484375, -13.0799560546875, -12.595947265625, -12.1119384765625, -11.6279296875, -11.1439208984375, -10.659912109375, -10.1759033203125, -9.69189453125, -9.2078857421875, -8.723876953125, -8.2398681640625, -7.755859375, -7.2718505859375, -6.787841796875, -6.3038330078125, -5.81982421875, -5.3358154296875, -4.851806640625, -4.3677978515625, -3.8837890625, -3.3997802734375, -2.915771484375, -2.4317626953125, -1.94775390625, -1.4637451171875, -0.979736328125, -0.4957275390625, -0.01171875, 0.4722900390625, 0.956298828125, 1.4403076171875, 1.92431640625, 2.4083251953125, 2.892333984375, 3.3763427734375, 3.8603515625, 4.3443603515625, 4.828369140625, 5.3123779296875, 5.79638671875, 6.2803955078125, 6.764404296875, 7.2484130859375, 7.732421875, 8.2164306640625, 8.700439453125, 9.1844482421875, 9.66845703125, 10.1524658203125, 10.636474609375, 11.1204833984375, 11.6044921875, 12.0885009765625, 12.572509765625, 13.0565185546875, 13.54052734375, 14.0245361328125, 14.508544921875, 14.9925537109375, 15.4765625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 6.0, 7.0, 12.0, 16.0, 15.0, 18.0, 29.0, 37.0, 28.0, 36.0, 49.0, 47.0, 62.0, 44.0, 61.0, 50.0, 45.0, 54.0, 56.0, 44.0, 36.0, 36.0, 32.0, 36.0, 31.0, 18.0, 11.0, 11.0, 14.0, 9.0, 11.0, 5.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-44.19761657714844, -42.84590148925781, -41.49419021606445, -40.14247512817383, -38.79076385498047, -37.439048767089844, -36.08733367919922, -34.735618591308594, -33.383907318115234, -32.03219223022461, -30.68048095703125, -29.328765869140625, -27.977052688598633, -26.62533950805664, -25.273624420166016, -23.921911239624023, -22.57019805908203, -21.21848487854004, -19.866771697998047, -18.515056610107422, -17.16334342956543, -15.811630249023438, -14.459916114807129, -13.10820198059082, -11.756488800048828, -10.404775619506836, -9.053061485290527, -7.701347827911377, -6.349634170532227, -4.997920513153076, -3.646206855773926, -2.294492721557617, -0.9427833557128906, 0.40893030166625977, 1.7606439590454102, 3.1123576164245605, 4.464071273803711, 5.815784931182861, 7.167498588562012, 8.51921272277832, 9.870925903320312, 11.222639083862305, 12.574353218078613, 13.926067352294922, 15.277780532836914, 16.629493713378906, 17.98120880126953, 19.332921981811523, 20.684635162353516, 22.036348342895508, 23.3880615234375, 24.739776611328125, 26.091489791870117, 27.44320297241211, 28.794918060302734, 30.146631240844727, 31.49834442138672, 32.850059509277344, 34.2017707824707, 35.55348587036133, 36.90519714355469, 38.25691223144531, 39.60862731933594, 40.96034240722656, 42.31205368041992]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 13.0, 11.0, 8.0, 6.0, 18.0, 10.0, 16.0, 20.0, 28.0, 21.0, 23.0, 22.0, 31.0, 38.0, 38.0, 42.0, 23.0, 41.0, 47.0, 40.0, 33.0, 39.0, 36.0, 38.0, 48.0, 34.0, 27.0, 33.0, 25.0, 27.0, 22.0, 25.0, 20.0, 25.0, 9.0, 11.0, 6.0, 9.0, 10.0, 10.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.25787353515625, -34.21341323852539, -33.16895294189453, -32.12449264526367, -31.080034255981445, -30.035573959350586, -28.99111557006836, -27.9466552734375, -26.90219497680664, -25.85773468017578, -24.813274383544922, -23.768815994262695, -22.724355697631836, -21.679895401000977, -20.63543701171875, -19.59097671508789, -18.54651641845703, -17.502056121826172, -16.457595825195312, -15.413137435913086, -14.368677139282227, -13.324216842651367, -12.279757499694824, -11.235298156738281, -10.190837860107422, -9.146377563476562, -8.10191822052002, -7.057458400726318, -6.012998580932617, -4.968538761138916, -3.924078941345215, -2.8796191215515137, -1.8351593017578125, -0.7906994819641113, 0.25376033782958984, 1.298220157623291, 2.342679977416992, 3.3871397972106934, 4.4315996170043945, 5.476059436798096, 6.520519256591797, 7.564979076385498, 8.6094388961792, 9.653898239135742, 10.698358535766602, 11.742818832397461, 12.787278175354004, 13.831737518310547, 14.876197814941406, 15.920658111572266, 16.965118408203125, 18.00957679748535, 19.05403709411621, 20.09849739074707, 21.142955780029297, 22.187416076660156, 23.231876373291016, 24.276336669921875, 25.320796966552734, 26.36525535583496, 27.40971565246582, 28.45417594909668, 29.498634338378906, 30.543094635009766, 31.587554931640625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 14.0, 13.0, 30.0, 52.0, 68.0, 85.0, 143.0, 238.0, 355.0, 466.0, 785.0, 1150.0, 1768.0, 2655.0, 4059.0, 6180.0, 9615.0, 14611.0, 22241.0, 33387.0, 49401.0, 70292.0, 95107.0, 118437.0, 130538.0, 125372.0, 105755.0, 80689.0, 57347.0, 39870.0, 26658.0, 17447.0, 11528.0, 7599.0, 5095.0, 3307.0, 2118.0, 1374.0, 943.0, 581.0, 393.0, 267.0, 180.0, 116.0, 71.0, 59.0, 36.0, 23.0, 15.0, 8.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-62.59375, -60.55615234375, -58.5185546875, -56.48095703125, -54.443359375, -52.40576171875, -50.3681640625, -48.33056640625, -46.29296875, -44.25537109375, -42.2177734375, -40.18017578125, -38.142578125, -36.10498046875, -34.0673828125, -32.02978515625, -29.9921875, -27.95458984375, -25.9169921875, -23.87939453125, -21.841796875, -19.80419921875, -17.7666015625, -15.72900390625, -13.69140625, -11.65380859375, -9.6162109375, -7.57861328125, -5.541015625, -3.50341796875, -1.4658203125, 0.57177734375, 2.609375, 4.64697265625, 6.6845703125, 8.72216796875, 10.759765625, 12.79736328125, 14.8349609375, 16.87255859375, 18.91015625, 20.94775390625, 22.9853515625, 25.02294921875, 27.060546875, 29.09814453125, 31.1357421875, 33.17333984375, 35.2109375, 37.24853515625, 39.2861328125, 41.32373046875, 43.361328125, 45.39892578125, 47.4365234375, 49.47412109375, 51.51171875, 53.54931640625, 55.5869140625, 57.62451171875, 59.662109375, 61.69970703125, 63.7373046875, 65.77490234375, 67.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 3.0, 1.0, 5.0, 13.0, 5.0, 5.0, 13.0, 12.0, 12.0, 22.0, 13.0, 22.0, 18.0, 17.0, 20.0, 28.0, 28.0, 28.0, 50.0, 37.0, 27.0, 36.0, 44.0, 41.0, 34.0, 36.0, 42.0, 27.0, 34.0, 43.0, 37.0, 28.0, 25.0, 27.0, 27.0, 28.0, 14.0, 14.0, 14.0, 11.0, 14.0, 9.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.015625, -23.2421875, -22.46875, -21.6953125, -20.921875, -20.1484375, -19.375, -18.6015625, -17.828125, -17.0546875, -16.28125, -15.5078125, -14.734375, -13.9609375, -13.1875, -12.4140625, -11.640625, -10.8671875, -10.09375, -9.3203125, -8.546875, -7.7734375, -7.0, -6.2265625, -5.453125, -4.6796875, -3.90625, -3.1328125, -2.359375, -1.5859375, -0.8125, -0.0390625, 0.734375, 1.5078125, 2.28125, 3.0546875, 3.828125, 4.6015625, 5.375, 6.1484375, 6.921875, 7.6953125, 8.46875, 9.2421875, 10.015625, 10.7890625, 11.5625, 12.3359375, 13.109375, 13.8828125, 14.65625, 15.4296875, 16.203125, 16.9765625, 17.75, 18.5234375, 19.296875, 20.0703125, 20.84375, 21.6171875, 22.390625, 23.1640625, 23.9375, 24.7109375, 25.484375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 9.0, 1.0, 4.0, 6.0, 15.0, 10.0, 29.0, 36.0, 51.0, 85.0, 101.0, 129.0, 197.0, 265.0, 448.0, 562.0, 856.0, 1235.0, 1790.0, 2504.0, 3836.0, 5453.0, 8406.0, 13010.0, 20724.0, 33507.0, 55878.0, 92689.0, 149256.0, 200862.0, 170976.0, 109864.0, 66409.0, 39760.0, 24399.0, 15124.0, 9876.0, 6473.0, 4339.0, 2925.0, 1989.0, 1376.0, 982.0, 640.0, 449.0, 309.0, 209.0, 155.0, 117.0, 70.0, 54.0, 34.0, 26.0, 14.0, 16.0, 9.0, 4.0, 4.0, 9.0, 1.0, 3.0], "bins": [-77.625, -75.2490234375, -72.873046875, -70.4970703125, -68.12109375, -65.7451171875, -63.369140625, -60.9931640625, -58.6171875, -56.2412109375, -53.865234375, -51.4892578125, -49.11328125, -46.7373046875, -44.361328125, -41.9853515625, -39.609375, -37.2333984375, -34.857421875, -32.4814453125, -30.10546875, -27.7294921875, -25.353515625, -22.9775390625, -20.6015625, -18.2255859375, -15.849609375, -13.4736328125, -11.09765625, -8.7216796875, -6.345703125, -3.9697265625, -1.59375, 0.7822265625, 3.158203125, 5.5341796875, 7.91015625, 10.2861328125, 12.662109375, 15.0380859375, 17.4140625, 19.7900390625, 22.166015625, 24.5419921875, 26.91796875, 29.2939453125, 31.669921875, 34.0458984375, 36.421875, 38.7978515625, 41.173828125, 43.5498046875, 45.92578125, 48.3017578125, 50.677734375, 53.0537109375, 55.4296875, 57.8056640625, 60.181640625, 62.5576171875, 64.93359375, 67.3095703125, 69.685546875, 72.0615234375, 74.4375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 5.0, 3.0, 9.0, 17.0, 12.0, 10.0, 12.0, 22.0, 21.0, 13.0, 33.0, 33.0, 36.0, 32.0, 25.0, 27.0, 34.0, 32.0, 46.0, 43.0, 34.0, 37.0, 41.0, 28.0, 31.0, 34.0, 39.0, 38.0, 26.0, 25.0, 24.0, 32.0, 24.0, 19.0, 18.0, 16.0, 12.0, 10.0, 11.0, 7.0, 3.0, 8.0, 2.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-19.015625, -18.380859375, -17.74609375, -17.111328125, -16.4765625, -15.841796875, -15.20703125, -14.572265625, -13.9375, -13.302734375, -12.66796875, -12.033203125, -11.3984375, -10.763671875, -10.12890625, -9.494140625, -8.859375, -8.224609375, -7.58984375, -6.955078125, -6.3203125, -5.685546875, -5.05078125, -4.416015625, -3.78125, -3.146484375, -2.51171875, -1.876953125, -1.2421875, -0.607421875, 0.02734375, 0.662109375, 1.296875, 1.931640625, 2.56640625, 3.201171875, 3.8359375, 4.470703125, 5.10546875, 5.740234375, 6.375, 7.009765625, 7.64453125, 8.279296875, 8.9140625, 9.548828125, 10.18359375, 10.818359375, 11.453125, 12.087890625, 12.72265625, 13.357421875, 13.9921875, 14.626953125, 15.26171875, 15.896484375, 16.53125, 17.166015625, 17.80078125, 18.435546875, 19.0703125, 19.705078125, 20.33984375, 20.974609375, 21.609375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 3.0, 10.0, 16.0, 23.0, 42.0, 49.0, 105.0, 95.0, 124.0, 217.0, 309.0, 485.0, 722.0, 1074.0, 1623.0, 2639.0, 4273.0, 7547.0, 14599.0, 30592.0, 84489.0, 416019.0, 348289.0, 75031.0, 27975.0, 13552.0, 7252.0, 4155.0, 2591.0, 1527.0, 1044.0, 657.0, 467.0, 290.0, 212.0, 153.0, 83.0, 63.0, 44.0, 40.0, 22.0, 14.0, 14.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.875, -147.12109375, -142.3671875, -137.61328125, -132.859375, -128.10546875, -123.3515625, -118.59765625, -113.84375, -109.08984375, -104.3359375, -99.58203125, -94.828125, -90.07421875, -85.3203125, -80.56640625, -75.8125, -71.05859375, -66.3046875, -61.55078125, -56.796875, -52.04296875, -47.2890625, -42.53515625, -37.78125, -33.02734375, -28.2734375, -23.51953125, -18.765625, -14.01171875, -9.2578125, -4.50390625, 0.25, 5.00390625, 9.7578125, 14.51171875, 19.265625, 24.01953125, 28.7734375, 33.52734375, 38.28125, 43.03515625, 47.7890625, 52.54296875, 57.296875, 62.05078125, 66.8046875, 71.55859375, 76.3125, 81.06640625, 85.8203125, 90.57421875, 95.328125, 100.08203125, 104.8359375, 109.58984375, 114.34375, 119.09765625, 123.8515625, 128.60546875, 133.359375, 138.11328125, 142.8671875, 147.62109375, 152.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 9.0, 9.0, 16.0, 18.0, 31.0, 60.0, 120.0, 255.0, 197.0, 99.0, 52.0, 33.0, 15.0, 17.0, 11.0, 9.0, 6.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0195770263671875, -0.018816471099853516, -0.01805591583251953, -0.017295360565185547, -0.016534805297851562, -0.015774250030517578, -0.015013694763183594, -0.01425313949584961, -0.013492584228515625, -0.01273202896118164, -0.011971473693847656, -0.011210918426513672, -0.010450363159179688, -0.009689807891845703, -0.008929252624511719, -0.008168697357177734, -0.00740814208984375, -0.006647586822509766, -0.005887031555175781, -0.005126476287841797, -0.0043659210205078125, -0.003605365753173828, -0.0028448104858398438, -0.0020842552185058594, -0.001323699951171875, -0.0005631446838378906, 0.00019741058349609375, 0.0009579658508300781, 0.0017185211181640625, 0.002479076385498047, 0.0032396316528320312, 0.004000186920166016, 0.0047607421875, 0.005521297454833984, 0.006281852722167969, 0.007042407989501953, 0.0078029632568359375, 0.008563518524169922, 0.009324073791503906, 0.01008462905883789, 0.010845184326171875, 0.01160573959350586, 0.012366294860839844, 0.013126850128173828, 0.013887405395507812, 0.014647960662841797, 0.015408515930175781, 0.016169071197509766, 0.01692962646484375, 0.017690181732177734, 0.01845073699951172, 0.019211292266845703, 0.019971847534179688, 0.020732402801513672, 0.021492958068847656, 0.02225351333618164, 0.023014068603515625, 0.02377462387084961, 0.024535179138183594, 0.025295734405517578, 0.026056289672851562, 0.026816844940185547, 0.02757740020751953, 0.028337955474853516, 0.0290985107421875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 12.0, 13.0, 19.0, 20.0, 38.0, 53.0, 74.0, 101.0, 142.0, 185.0, 315.0, 415.0, 655.0, 990.0, 1549.0, 2548.0, 4335.0, 8141.0, 16760.0, 41404.0, 148888.0, 489880.0, 231220.0, 56102.0, 21568.0, 9814.0, 5100.0, 2948.0, 1790.0, 1128.0, 734.0, 505.0, 360.0, 240.0, 141.0, 107.0, 82.0, 51.0, 30.0, 30.0, 20.0, 9.0, 6.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-123.5625, -119.8896484375, -116.216796875, -112.5439453125, -108.87109375, -105.1982421875, -101.525390625, -97.8525390625, -94.1796875, -90.5068359375, -86.833984375, -83.1611328125, -79.48828125, -75.8154296875, -72.142578125, -68.4697265625, -64.796875, -61.1240234375, -57.451171875, -53.7783203125, -50.10546875, -46.4326171875, -42.759765625, -39.0869140625, -35.4140625, -31.7412109375, -28.068359375, -24.3955078125, -20.72265625, -17.0498046875, -13.376953125, -9.7041015625, -6.03125, -2.3583984375, 1.314453125, 4.9873046875, 8.66015625, 12.3330078125, 16.005859375, 19.6787109375, 23.3515625, 27.0244140625, 30.697265625, 34.3701171875, 38.04296875, 41.7158203125, 45.388671875, 49.0615234375, 52.734375, 56.4072265625, 60.080078125, 63.7529296875, 67.42578125, 71.0986328125, 74.771484375, 78.4443359375, 82.1171875, 85.7900390625, 89.462890625, 93.1357421875, 96.80859375, 100.4814453125, 104.154296875, 107.8271484375, 111.5]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 12.0, 14.0, 14.0, 21.0, 19.0, 25.0, 55.0, 68.0, 102.0, 94.0, 116.0, 106.0, 84.0, 78.0, 44.0, 28.0, 27.0, 13.0, 10.0, 12.0, 8.0, 10.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.65625, -29.768798828125, -28.88134765625, -27.993896484375, -27.1064453125, -26.218994140625, -25.33154296875, -24.444091796875, -23.556640625, -22.669189453125, -21.78173828125, -20.894287109375, -20.0068359375, -19.119384765625, -18.23193359375, -17.344482421875, -16.45703125, -15.569580078125, -14.68212890625, -13.794677734375, -12.9072265625, -12.019775390625, -11.13232421875, -10.244873046875, -9.357421875, -8.469970703125, -7.58251953125, -6.695068359375, -5.8076171875, -4.920166015625, -4.03271484375, -3.145263671875, -2.2578125, -1.370361328125, -0.48291015625, 0.404541015625, 1.2919921875, 2.179443359375, 3.06689453125, 3.954345703125, 4.841796875, 5.729248046875, 6.61669921875, 7.504150390625, 8.3916015625, 9.279052734375, 10.16650390625, 11.053955078125, 11.94140625, 12.828857421875, 13.71630859375, 14.603759765625, 15.4912109375, 16.378662109375, 17.26611328125, 18.153564453125, 19.041015625, 19.928466796875, 20.81591796875, 21.703369140625, 22.5908203125, 23.478271484375, 24.36572265625, 25.253173828125, 26.140625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 8.0, 9.0, 9.0, 16.0, 24.0, 25.0, 24.0, 22.0, 30.0, 28.0, 41.0, 49.0, 45.0, 49.0, 52.0, 60.0, 55.0, 52.0, 46.0, 49.0, 45.0, 37.0, 30.0, 30.0, 17.0, 24.0, 18.0, 14.0, 16.0, 5.0, 11.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-39.827659606933594, -38.600399017333984, -37.37313461303711, -36.1458740234375, -34.91861343383789, -33.69135284423828, -32.464088439941406, -31.236827850341797, -30.009565353393555, -28.782302856445312, -27.555042266845703, -26.32777976989746, -25.10051727294922, -23.87325668334961, -22.645994186401367, -21.418731689453125, -20.191471099853516, -18.964208602905273, -17.736948013305664, -16.509685516357422, -15.282423973083496, -14.05516242980957, -12.827899932861328, -11.600638389587402, -10.373376846313477, -9.14611530303955, -7.918853282928467, -6.691591262817383, -5.464329719543457, -4.237068176269531, -3.0098061561584473, -1.7825441360473633, -0.5552825927734375, 0.6719791889190674, 1.8992409706115723, 3.126502752304077, 4.353764533996582, 5.581026077270508, 6.808288097381592, 8.035550117492676, 9.262811660766602, 10.490073204040527, 11.717334747314453, 12.944597244262695, 14.171858787536621, 15.399120330810547, 16.62638282775879, 17.85364532470703, 19.08090591430664, 20.308168411254883, 21.535429000854492, 22.762691497802734, 23.989952087402344, 25.217214584350586, 26.444477081298828, 27.671737670898438, 28.89900016784668, 30.126262664794922, 31.35352325439453, 32.58078384399414, 33.808048248291016, 35.035308837890625, 36.262569427490234, 37.48983383178711, 38.71709442138672]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 6.0, 3.0, 11.0, 12.0, 17.0, 15.0, 21.0, 20.0, 21.0, 24.0, 19.0, 21.0, 35.0, 41.0, 33.0, 43.0, 25.0, 29.0, 38.0, 34.0, 47.0, 46.0, 42.0, 37.0, 43.0, 34.0, 30.0, 30.0, 36.0, 27.0, 22.0, 24.0, 12.0, 22.0, 13.0, 9.0, 13.0, 5.0, 10.0, 10.0, 7.0, 0.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.89644432067871, -26.964345932006836, -26.032249450683594, -25.10015106201172, -24.168052673339844, -23.2359561920166, -22.303857803344727, -21.371761322021484, -20.43966293334961, -19.507564544677734, -18.575468063354492, -17.643369674682617, -16.711273193359375, -15.7791748046875, -14.847076416015625, -13.914978981018066, -12.982881546020508, -12.05078411102295, -11.11868667602539, -10.186588287353516, -9.254490852355957, -8.322393417358398, -7.390295505523682, -6.458197593688965, -5.526100158691406, -4.594002723693848, -3.661904811859131, -2.729807138442993, -1.7977094650268555, -0.8656120300292969, 0.06648588180541992, 0.9985837936401367, 1.9306812286376953, 2.862778902053833, 3.7948765754699707, 4.7269744873046875, 5.659071922302246, 6.591169357299805, 7.5232672691345215, 8.455365180969238, 9.387462615966797, 10.319560050964355, 11.251657485961914, 12.183755874633789, 13.115853309631348, 14.047950744628906, 14.980049133300781, 15.91214656829834, 16.8442440032959, 17.776342391967773, 18.708438873291016, 19.64053726196289, 20.572635650634766, 21.504732131958008, 22.436830520629883, 23.368927001953125, 24.301025390625, 25.233123779296875, 26.165220260620117, 27.097318649291992, 28.029415130615234, 28.96151351928711, 29.893611907958984, 30.82571029663086, 31.7578067779541]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 15.0, 23.0, 41.0, 57.0, 87.0, 148.0, 250.0, 359.0, 631.0, 970.0, 1481.0, 2499.0, 3759.0, 6172.0, 9731.0, 15526.0, 25069.0, 38944.0, 58360.0, 84413.0, 113926.0, 135581.0, 140281.0, 123280.0, 95068.0, 67366.0, 45274.0, 29106.0, 18570.0, 11722.0, 7312.0, 4631.0, 2937.0, 1854.0, 1129.0, 762.0, 462.0, 263.0, 191.0, 119.0, 72.0, 40.0, 29.0, 18.0, 9.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.75390625, -41.3828125, -40.01171875, -38.640625, -37.26953125, -35.8984375, -34.52734375, -33.15625, -31.78515625, -30.4140625, -29.04296875, -27.671875, -26.30078125, -24.9296875, -23.55859375, -22.1875, -20.81640625, -19.4453125, -18.07421875, -16.703125, -15.33203125, -13.9609375, -12.58984375, -11.21875, -9.84765625, -8.4765625, -7.10546875, -5.734375, -4.36328125, -2.9921875, -1.62109375, -0.25, 1.12109375, 2.4921875, 3.86328125, 5.234375, 6.60546875, 7.9765625, 9.34765625, 10.71875, 12.08984375, 13.4609375, 14.83203125, 16.203125, 17.57421875, 18.9453125, 20.31640625, 21.6875, 23.05859375, 24.4296875, 25.80078125, 27.171875, 28.54296875, 29.9140625, 31.28515625, 32.65625, 34.02734375, 35.3984375, 36.76953125, 38.140625, 39.51171875, 40.8828125, 42.25390625, 43.625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 3.0, 5.0, 11.0, 16.0, 12.0, 18.0, 23.0, 20.0, 17.0, 23.0, 26.0, 33.0, 30.0, 25.0, 28.0, 40.0, 32.0, 30.0, 42.0, 41.0, 36.0, 49.0, 36.0, 42.0, 34.0, 31.0, 33.0, 27.0, 40.0, 28.0, 22.0, 27.0, 16.0, 14.0, 7.0, 12.0, 13.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.296875, -23.481201171875, -22.66552734375, -21.849853515625, -21.0341796875, -20.218505859375, -19.40283203125, -18.587158203125, -17.771484375, -16.955810546875, -16.14013671875, -15.324462890625, -14.5087890625, -13.693115234375, -12.87744140625, -12.061767578125, -11.24609375, -10.430419921875, -9.61474609375, -8.799072265625, -7.9833984375, -7.167724609375, -6.35205078125, -5.536376953125, -4.720703125, -3.905029296875, -3.08935546875, -2.273681640625, -1.4580078125, -0.642333984375, 0.17333984375, 0.989013671875, 1.8046875, 2.620361328125, 3.43603515625, 4.251708984375, 5.0673828125, 5.883056640625, 6.69873046875, 7.514404296875, 8.330078125, 9.145751953125, 9.96142578125, 10.777099609375, 11.5927734375, 12.408447265625, 13.22412109375, 14.039794921875, 14.85546875, 15.671142578125, 16.48681640625, 17.302490234375, 18.1181640625, 18.933837890625, 19.74951171875, 20.565185546875, 21.380859375, 22.196533203125, 23.01220703125, 23.827880859375, 24.6435546875, 25.459228515625, 26.27490234375, 27.090576171875, 27.90625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 8.0, 17.0, 21.0, 27.0, 40.0, 62.0, 99.0, 148.0, 220.0, 355.0, 497.0, 801.0, 1180.0, 1693.0, 2550.0, 3917.0, 6234.0, 9123.0, 14076.0, 20698.0, 31184.0, 45645.0, 65069.0, 88437.0, 111231.0, 125804.0, 125228.0, 109567.0, 86687.0, 63401.0, 44619.0, 30325.0, 20136.0, 13456.0, 8742.0, 5722.0, 4017.0, 2516.0, 1645.0, 1108.0, 770.0, 498.0, 330.0, 247.0, 149.0, 87.0, 54.0, 29.0, 36.0, 27.0, 15.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.65625, -36.3994140625, -35.142578125, -33.8857421875, -32.62890625, -31.3720703125, -30.115234375, -28.8583984375, -27.6015625, -26.3447265625, -25.087890625, -23.8310546875, -22.57421875, -21.3173828125, -20.060546875, -18.8037109375, -17.546875, -16.2900390625, -15.033203125, -13.7763671875, -12.51953125, -11.2626953125, -10.005859375, -8.7490234375, -7.4921875, -6.2353515625, -4.978515625, -3.7216796875, -2.46484375, -1.2080078125, 0.048828125, 1.3056640625, 2.5625, 3.8193359375, 5.076171875, 6.3330078125, 7.58984375, 8.8466796875, 10.103515625, 11.3603515625, 12.6171875, 13.8740234375, 15.130859375, 16.3876953125, 17.64453125, 18.9013671875, 20.158203125, 21.4150390625, 22.671875, 23.9287109375, 25.185546875, 26.4423828125, 27.69921875, 28.9560546875, 30.212890625, 31.4697265625, 32.7265625, 33.9833984375, 35.240234375, 36.4970703125, 37.75390625, 39.0107421875, 40.267578125, 41.5244140625, 42.78125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 6.0, 9.0, 9.0, 6.0, 7.0, 9.0, 12.0, 9.0, 15.0, 14.0, 21.0, 23.0, 24.0, 23.0, 38.0, 42.0, 44.0, 26.0, 33.0, 33.0, 40.0, 42.0, 29.0, 41.0, 44.0, 43.0, 41.0, 38.0, 41.0, 27.0, 22.0, 20.0, 27.0, 26.0, 17.0, 17.0, 18.0, 16.0, 9.0, 8.0, 11.0, 5.0, 7.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.75, -19.142822265625, -18.53564453125, -17.928466796875, -17.3212890625, -16.714111328125, -16.10693359375, -15.499755859375, -14.892578125, -14.285400390625, -13.67822265625, -13.071044921875, -12.4638671875, -11.856689453125, -11.24951171875, -10.642333984375, -10.03515625, -9.427978515625, -8.82080078125, -8.213623046875, -7.6064453125, -6.999267578125, -6.39208984375, -5.784912109375, -5.177734375, -4.570556640625, -3.96337890625, -3.356201171875, -2.7490234375, -2.141845703125, -1.53466796875, -0.927490234375, -0.3203125, 0.286865234375, 0.89404296875, 1.501220703125, 2.1083984375, 2.715576171875, 3.32275390625, 3.929931640625, 4.537109375, 5.144287109375, 5.75146484375, 6.358642578125, 6.9658203125, 7.572998046875, 8.18017578125, 8.787353515625, 9.39453125, 10.001708984375, 10.60888671875, 11.216064453125, 11.8232421875, 12.430419921875, 13.03759765625, 13.644775390625, 14.251953125, 14.859130859375, 15.46630859375, 16.073486328125, 16.6806640625, 17.287841796875, 17.89501953125, 18.502197265625, 19.109375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 6.0, 8.0, 18.0, 20.0, 29.0, 25.0, 64.0, 100.0, 123.0, 230.0, 331.0, 473.0, 684.0, 1178.0, 1923.0, 3178.0, 5587.0, 10124.0, 18653.0, 36793.0, 73576.0, 142034.0, 222746.0, 226179.0, 146242.0, 75858.0, 38006.0, 19645.0, 10344.0, 5825.0, 3221.0, 1938.0, 1193.0, 757.0, 484.0, 333.0, 212.0, 142.0, 89.0, 57.0, 41.0, 18.0, 21.0, 16.0, 17.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.78125, -37.53125, -36.28125, -35.03125, -33.78125, -32.53125, -31.28125, -30.03125, -28.78125, -27.53125, -26.28125, -25.03125, -23.78125, -22.53125, -21.28125, -20.03125, -18.78125, -17.53125, -16.28125, -15.03125, -13.78125, -12.53125, -11.28125, -10.03125, -8.78125, -7.53125, -6.28125, -5.03125, -3.78125, -2.53125, -1.28125, -0.03125, 1.21875, 2.46875, 3.71875, 4.96875, 6.21875, 7.46875, 8.71875, 9.96875, 11.21875, 12.46875, 13.71875, 14.96875, 16.21875, 17.46875, 18.71875, 19.96875, 21.21875, 22.46875, 23.71875, 24.96875, 26.21875, 27.46875, 28.71875, 29.96875, 31.21875, 32.46875, 33.71875, 34.96875, 36.21875, 37.46875, 38.71875, 39.96875, 41.21875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 2.0, 7.0, 5.0, 3.0, 15.0, 11.0, 16.0, 19.0, 31.0, 20.0, 46.0, 51.0, 60.0, 54.0, 68.0, 83.0, 59.0, 48.0, 62.0, 59.0, 49.0, 42.0, 46.0, 26.0, 14.0, 21.0, 17.0, 15.0, 6.0, 12.0, 4.0, 11.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0036468505859375, -0.0035337507724761963, -0.0034206509590148926, -0.003307551145553589, -0.003194451332092285, -0.0030813515186309814, -0.0029682517051696777, -0.002855151891708374, -0.0027420520782470703, -0.0026289522647857666, -0.002515852451324463, -0.002402752637863159, -0.0022896528244018555, -0.0021765530109405518, -0.002063453197479248, -0.0019503533840179443, -0.0018372535705566406, -0.001724153757095337, -0.0016110539436340332, -0.0014979541301727295, -0.0013848543167114258, -0.001271754503250122, -0.0011586546897888184, -0.0010455548763275146, -0.0009324550628662109, -0.0008193552494049072, -0.0007062554359436035, -0.0005931556224822998, -0.0004800558090209961, -0.0003669559955596924, -0.00025385618209838867, -0.00014075636863708496, -2.765655517578125e-05, 8.544325828552246e-05, 0.00019854307174682617, 0.0003116428852081299, 0.0004247426986694336, 0.0005378425121307373, 0.000650942325592041, 0.0007640421390533447, 0.0008771419525146484, 0.0009902417659759521, 0.0011033415794372559, 0.0012164413928985596, 0.0013295412063598633, 0.001442641019821167, 0.0015557408332824707, 0.0016688406467437744, 0.0017819404602050781, 0.0018950402736663818, 0.0020081400871276855, 0.0021212399005889893, 0.002234339714050293, 0.0023474395275115967, 0.0024605393409729004, 0.002573639154434204, 0.002686738967895508, 0.0027998387813568115, 0.0029129385948181152, 0.003026038408279419, 0.0031391382217407227, 0.0032522380352020264, 0.00336533784866333, 0.003478437662124634, 0.0035915374755859375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 12.0, 16.0, 16.0, 24.0, 32.0, 56.0, 68.0, 104.0, 154.0, 218.0, 343.0, 480.0, 729.0, 1087.0, 1633.0, 2571.0, 3980.0, 6749.0, 11463.0, 19655.0, 35476.0, 64590.0, 114992.0, 180562.0, 208947.0, 164940.0, 100583.0, 55352.0, 30313.0, 16957.0, 10054.0, 5958.0, 3636.0, 2327.0, 1534.0, 971.0, 627.0, 428.0, 295.0, 211.0, 125.0, 93.0, 68.0, 41.0, 29.0, 24.0, 9.0, 13.0, 8.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.9375, -29.9189453125, -28.900390625, -27.8818359375, -26.86328125, -25.8447265625, -24.826171875, -23.8076171875, -22.7890625, -21.7705078125, -20.751953125, -19.7333984375, -18.71484375, -17.6962890625, -16.677734375, -15.6591796875, -14.640625, -13.6220703125, -12.603515625, -11.5849609375, -10.56640625, -9.5478515625, -8.529296875, -7.5107421875, -6.4921875, -5.4736328125, -4.455078125, -3.4365234375, -2.41796875, -1.3994140625, -0.380859375, 0.6376953125, 1.65625, 2.6748046875, 3.693359375, 4.7119140625, 5.73046875, 6.7490234375, 7.767578125, 8.7861328125, 9.8046875, 10.8232421875, 11.841796875, 12.8603515625, 13.87890625, 14.8974609375, 15.916015625, 16.9345703125, 17.953125, 18.9716796875, 19.990234375, 21.0087890625, 22.02734375, 23.0458984375, 24.064453125, 25.0830078125, 26.1015625, 27.1201171875, 28.138671875, 29.1572265625, 30.17578125, 31.1943359375, 32.212890625, 33.2314453125, 34.25]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 10.0, 9.0, 11.0, 21.0, 16.0, 28.0, 29.0, 44.0, 59.0, 69.0, 66.0, 83.0, 77.0, 80.0, 63.0, 73.0, 49.0, 42.0, 27.0, 32.0, 21.0, 15.0, 7.0, 14.0, 9.0, 6.0, 10.0, 7.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.5537109375, -10.154296875, -9.7548828125, -9.35546875, -8.9560546875, -8.556640625, -8.1572265625, -7.7578125, -7.3583984375, -6.958984375, -6.5595703125, -6.16015625, -5.7607421875, -5.361328125, -4.9619140625, -4.5625, -4.1630859375, -3.763671875, -3.3642578125, -2.96484375, -2.5654296875, -2.166015625, -1.7666015625, -1.3671875, -0.9677734375, -0.568359375, -0.1689453125, 0.23046875, 0.6298828125, 1.029296875, 1.4287109375, 1.828125, 2.2275390625, 2.626953125, 3.0263671875, 3.42578125, 3.8251953125, 4.224609375, 4.6240234375, 5.0234375, 5.4228515625, 5.822265625, 6.2216796875, 6.62109375, 7.0205078125, 7.419921875, 7.8193359375, 8.21875, 8.6181640625, 9.017578125, 9.4169921875, 9.81640625, 10.2158203125, 10.615234375, 11.0146484375, 11.4140625, 11.8134765625, 12.212890625, 12.6123046875, 13.01171875, 13.4111328125, 13.810546875, 14.2099609375, 14.609375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 9.0, 11.0, 6.0, 11.0, 9.0, 9.0, 16.0, 11.0, 17.0, 40.0, 22.0, 23.0, 34.0, 34.0, 44.0, 52.0, 53.0, 46.0, 54.0, 49.0, 47.0, 44.0, 38.0, 31.0, 35.0, 38.0, 32.0, 29.0, 34.0, 21.0, 19.0, 11.0, 15.0, 6.0, 7.0, 9.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-33.787757873535156, -32.69562530517578, -31.60348892211914, -30.511354446411133, -29.419219970703125, -28.32708740234375, -27.234952926635742, -26.142818450927734, -25.050683975219727, -23.95854949951172, -22.86641502380371, -21.774280548095703, -20.682147979736328, -19.590011596679688, -18.497879028320312, -17.405744552612305, -16.313610076904297, -15.221475601196289, -14.129341125488281, -13.03720760345459, -11.945073127746582, -10.852938652038574, -9.760805130004883, -8.668670654296875, -7.576536178588867, -6.484401702880859, -5.39226770401001, -4.30013370513916, -3.2079992294311523, -2.1158647537231445, -1.023730754852295, 0.06840324401855469, 1.1605415344238281, 2.252675771713257, 3.3448100090026855, 4.436944007873535, 5.529078483581543, 6.621212959289551, 7.7133469581604, 8.80548095703125, 9.897615432739258, 10.989749908447266, 12.081884384155273, 13.174017906188965, 14.266152381896973, 15.35828685760498, 16.450420379638672, 17.54255485534668, 18.634689331054688, 19.726823806762695, 20.818958282470703, 21.91109275817871, 23.00322723388672, 24.095359802246094, 25.1874942779541, 26.27962875366211, 27.371763229370117, 28.463897705078125, 29.556032180786133, 30.64816665649414, 31.740299224853516, 32.832435607910156, 33.92456817626953, 35.016700744628906, 36.10883712768555]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 11.0, 7.0, 11.0, 10.0, 15.0, 17.0, 13.0, 25.0, 31.0, 29.0, 34.0, 32.0, 54.0, 56.0, 46.0, 56.0, 50.0, 48.0, 45.0, 57.0, 40.0, 39.0, 41.0, 33.0, 33.0, 34.0, 24.0, 15.0, 27.0, 13.0, 17.0, 9.0, 5.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.968156814575195, -30.830211639404297, -29.6922664642334, -28.5543212890625, -27.4163761138916, -26.278430938720703, -25.140485763549805, -24.002540588378906, -22.864595413208008, -21.72665023803711, -20.58870506286621, -19.450759887695312, -18.312814712524414, -17.174869537353516, -16.036924362182617, -14.898979187011719, -13.76103401184082, -12.623088836669922, -11.485143661499023, -10.347198486328125, -9.209253311157227, -8.071308135986328, -6.93336296081543, -5.795417785644531, -4.657472610473633, -3.5195274353027344, -2.381582260131836, -1.2436370849609375, -0.10569190979003906, 1.0322532653808594, 2.170198440551758, 3.3081436157226562, 4.4460906982421875, 5.584035873413086, 6.721981048583984, 7.859926223754883, 8.997871398925781, 10.13581657409668, 11.273761749267578, 12.411706924438477, 13.549652099609375, 14.687597274780273, 15.825542449951172, 16.96348762512207, 18.10143280029297, 19.239377975463867, 20.377323150634766, 21.515268325805664, 22.653213500976562, 23.79115867614746, 24.92910385131836, 26.067049026489258, 27.204994201660156, 28.342939376831055, 29.480884552001953, 30.61882972717285, 31.75677490234375, 32.89472198486328, 34.03266525268555, 35.17060852050781, 36.308555603027344, 37.446502685546875, 38.58444595336914, 39.722389221191406, 40.86033630371094]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 12.0, 17.0, 26.0, 52.0, 77.0, 95.0, 161.0, 254.0, 395.0, 669.0, 971.0, 1638.0, 2573.0, 4082.0, 6746.0, 10943.0, 18431.0, 30587.0, 52133.0, 90454.0, 159476.0, 286359.0, 509986.0, 779319.0, 836852.0, 601227.0, 346018.0, 192161.0, 108311.0, 62337.0, 36288.0, 21576.0, 13070.0, 7890.0, 4912.0, 3022.0, 1875.0, 1204.0, 735.0, 511.0, 302.0, 209.0, 114.0, 76.0, 53.0, 24.0, 20.0, 19.0, 9.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-33.3125, -32.27685546875, -31.2412109375, -30.20556640625, -29.169921875, -28.13427734375, -27.0986328125, -26.06298828125, -25.02734375, -23.99169921875, -22.9560546875, -21.92041015625, -20.884765625, -19.84912109375, -18.8134765625, -17.77783203125, -16.7421875, -15.70654296875, -14.6708984375, -13.63525390625, -12.599609375, -11.56396484375, -10.5283203125, -9.49267578125, -8.45703125, -7.42138671875, -6.3857421875, -5.35009765625, -4.314453125, -3.27880859375, -2.2431640625, -1.20751953125, -0.171875, 0.86376953125, 1.8994140625, 2.93505859375, 3.970703125, 5.00634765625, 6.0419921875, 7.07763671875, 8.11328125, 9.14892578125, 10.1845703125, 11.22021484375, 12.255859375, 13.29150390625, 14.3271484375, 15.36279296875, 16.3984375, 17.43408203125, 18.4697265625, 19.50537109375, 20.541015625, 21.57666015625, 22.6123046875, 23.64794921875, 24.68359375, 25.71923828125, 26.7548828125, 27.79052734375, 28.826171875, 29.86181640625, 30.8974609375, 31.93310546875, 32.96875]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 4.0, 5.0, 10.0, 14.0, 13.0, 25.0, 26.0, 25.0, 29.0, 35.0, 27.0, 25.0, 48.0, 49.0, 51.0, 45.0, 55.0, 57.0, 59.0, 53.0, 46.0, 33.0, 31.0, 33.0, 29.0, 30.0, 39.0, 21.0, 21.0, 17.0, 10.0, 5.0, 11.0, 5.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -21.20263671875, -20.3583984375, -19.51416015625, -18.669921875, -17.82568359375, -16.9814453125, -16.13720703125, -15.29296875, -14.44873046875, -13.6044921875, -12.76025390625, -11.916015625, -11.07177734375, -10.2275390625, -9.38330078125, -8.5390625, -7.69482421875, -6.8505859375, -6.00634765625, -5.162109375, -4.31787109375, -3.4736328125, -2.62939453125, -1.78515625, -0.94091796875, -0.0966796875, 0.74755859375, 1.591796875, 2.43603515625, 3.2802734375, 4.12451171875, 4.96875, 5.81298828125, 6.6572265625, 7.50146484375, 8.345703125, 9.18994140625, 10.0341796875, 10.87841796875, 11.72265625, 12.56689453125, 13.4111328125, 14.25537109375, 15.099609375, 15.94384765625, 16.7880859375, 17.63232421875, 18.4765625, 19.32080078125, 20.1650390625, 21.00927734375, 21.853515625, 22.69775390625, 23.5419921875, 24.38623046875, 25.23046875, 26.07470703125, 26.9189453125, 27.76318359375, 28.607421875, 29.45166015625, 30.2958984375, 31.14013671875, 31.984375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 18.0, 21.0, 44.0, 61.0, 100.0, 123.0, 209.0, 311.0, 462.0, 733.0, 1165.0, 1777.0, 2879.0, 4483.0, 7245.0, 11346.0, 18661.0, 29685.0, 48420.0, 78305.0, 127232.0, 205277.0, 324112.0, 489041.0, 655704.0, 684850.0, 535081.0, 361712.0, 230201.0, 143491.0, 87573.0, 54148.0, 33682.0, 20776.0, 12851.0, 8244.0, 5230.0, 3256.0, 2030.0, 1360.0, 815.0, 521.0, 372.0, 230.0, 175.0, 90.0, 69.0, 38.0, 30.0, 15.0, 7.0, 14.0, 3.0, 4.0, 1.0], "bins": [-32.5, -31.547607421875, -30.59521484375, -29.642822265625, -28.6904296875, -27.738037109375, -26.78564453125, -25.833251953125, -24.880859375, -23.928466796875, -22.97607421875, -22.023681640625, -21.0712890625, -20.118896484375, -19.16650390625, -18.214111328125, -17.26171875, -16.309326171875, -15.35693359375, -14.404541015625, -13.4521484375, -12.499755859375, -11.54736328125, -10.594970703125, -9.642578125, -8.690185546875, -7.73779296875, -6.785400390625, -5.8330078125, -4.880615234375, -3.92822265625, -2.975830078125, -2.0234375, -1.071044921875, -0.11865234375, 0.833740234375, 1.7861328125, 2.738525390625, 3.69091796875, 4.643310546875, 5.595703125, 6.548095703125, 7.50048828125, 8.452880859375, 9.4052734375, 10.357666015625, 11.31005859375, 12.262451171875, 13.21484375, 14.167236328125, 15.11962890625, 16.072021484375, 17.0244140625, 17.976806640625, 18.92919921875, 19.881591796875, 20.833984375, 21.786376953125, 22.73876953125, 23.691162109375, 24.6435546875, 25.595947265625, 26.54833984375, 27.500732421875, 28.453125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 8.0, 13.0, 21.0, 20.0, 28.0, 22.0, 38.0, 50.0, 63.0, 92.0, 98.0, 109.0, 123.0, 144.0, 176.0, 186.0, 211.0, 216.0, 255.0, 228.0, 212.0, 235.0, 206.0, 169.0, 184.0, 165.0, 119.0, 101.0, 104.0, 72.0, 81.0, 74.0, 58.0, 37.0, 39.0, 25.0, 11.0, 17.0, 16.0, 13.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.1593017578125, -9.787353515625, -9.4154052734375, -9.04345703125, -8.6715087890625, -8.299560546875, -7.9276123046875, -7.5556640625, -7.1837158203125, -6.811767578125, -6.4398193359375, -6.06787109375, -5.6959228515625, -5.323974609375, -4.9520263671875, -4.580078125, -4.2081298828125, -3.836181640625, -3.4642333984375, -3.09228515625, -2.7203369140625, -2.348388671875, -1.9764404296875, -1.6044921875, -1.2325439453125, -0.860595703125, -0.4886474609375, -0.11669921875, 0.2552490234375, 0.627197265625, 0.9991455078125, 1.37109375, 1.7430419921875, 2.114990234375, 2.4869384765625, 2.85888671875, 3.2308349609375, 3.602783203125, 3.9747314453125, 4.3466796875, 4.7186279296875, 5.090576171875, 5.4625244140625, 5.83447265625, 6.2064208984375, 6.578369140625, 6.9503173828125, 7.322265625, 7.6942138671875, 8.066162109375, 8.4381103515625, 8.81005859375, 9.1820068359375, 9.553955078125, 9.9259033203125, 10.2978515625, 10.6697998046875, 11.041748046875, 11.4136962890625, 11.78564453125, 12.1575927734375, 12.529541015625, 12.9014892578125, 13.2734375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 5.0, 10.0, 14.0, 13.0, 16.0, 15.0, 14.0, 21.0, 34.0, 26.0, 35.0, 49.0, 32.0, 44.0, 56.0, 52.0, 48.0, 51.0, 42.0, 38.0, 48.0, 39.0, 50.0, 35.0, 38.0, 24.0, 29.0, 16.0, 23.0, 15.0, 13.0, 5.0, 8.0, 7.0, 6.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.612056732177734, -33.548973083496094, -32.48588943481445, -31.422807693481445, -30.359725952148438, -29.296642303466797, -28.233558654785156, -27.170475006103516, -26.107393264770508, -25.044309616088867, -23.98122787475586, -22.91814422607422, -21.855060577392578, -20.79197883605957, -19.72889518737793, -18.665813446044922, -17.60272979736328, -16.53964614868164, -15.476564407348633, -14.413480758666992, -13.350398063659668, -12.287315368652344, -11.224231719970703, -10.161149024963379, -9.098066329956055, -8.03498363494873, -6.971900463104248, -5.908817291259766, -4.845734596252441, -3.782651901245117, -2.7195687294006348, -1.6564855575561523, -0.5934066772460938, 0.46967625617980957, 1.532759189605713, 2.595842123031616, 3.6589250564575195, 4.722007751464844, 5.785090923309326, 6.848174095153809, 7.911256790161133, 8.974339485168457, 10.037422180175781, 11.100505828857422, 12.163588523864746, 13.22667121887207, 14.289754867553711, 15.352837562561035, 16.41592025756836, 17.47900390625, 18.542085647583008, 19.60516929626465, 20.668251037597656, 21.731334686279297, 22.794418334960938, 23.857501983642578, 24.920583724975586, 25.983667373657227, 27.046749114990234, 28.109832763671875, 29.172916412353516, 30.235998153686523, 31.299081802368164, 32.36216354370117, 33.42524719238281]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 5.0, 7.0, 6.0, 8.0, 8.0, 22.0, 14.0, 18.0, 22.0, 23.0, 25.0, 30.0, 24.0, 28.0, 38.0, 43.0, 26.0, 37.0, 36.0, 49.0, 48.0, 44.0, 38.0, 31.0, 43.0, 23.0, 31.0, 33.0, 28.0, 37.0, 31.0, 21.0, 18.0, 19.0, 20.0, 11.0, 10.0, 7.0, 8.0, 10.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.538476943969727, -26.691091537475586, -25.843708038330078, -24.996322631835938, -24.14893913269043, -23.30155372619629, -22.45417022705078, -21.60678482055664, -20.7593994140625, -19.91201400756836, -19.06463050842285, -18.21724510192871, -17.369861602783203, -16.522476196289062, -15.675091743469238, -14.827707290649414, -13.980323791503906, -13.132939338684082, -12.285554885864258, -11.438169479370117, -10.59078598022461, -9.743400573730469, -8.896016120910645, -8.04863166809082, -7.201247215270996, -6.353862762451172, -5.506478309631348, -4.659093379974365, -3.811708927154541, -2.964324474334717, -2.1169395446777344, -1.2695550918579102, -0.42217254638671875, 0.425212025642395, 1.2725965976715088, 2.119981288909912, 2.9673657417297363, 3.8147501945495605, 4.662135124206543, 5.509519577026367, 6.356904029846191, 7.204288482666016, 8.05167293548584, 8.899057388305664, 9.746442794799805, 10.593826293945312, 11.441211700439453, 12.288596153259277, 13.135980606079102, 13.983365058898926, 14.83074951171875, 15.67813491821289, 16.5255184173584, 17.37290382385254, 18.220287322998047, 19.067672729492188, 19.915058135986328, 20.76244354248047, 21.609827041625977, 22.457212448120117, 23.304595947265625, 24.151981353759766, 24.999366760253906, 25.846750259399414, 26.694133758544922]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 7.0, 20.0, 9.0, 30.0, 26.0, 48.0, 81.0, 114.0, 181.0, 253.0, 380.0, 549.0, 820.0, 1283.0, 1896.0, 2997.0, 4818.0, 7873.0, 12666.0, 21286.0, 36502.0, 61695.0, 103255.0, 159695.0, 196084.0, 165530.0, 108256.0, 64892.0, 38710.0, 22810.0, 13456.0, 8252.0, 4936.0, 3211.0, 2003.0, 1330.0, 841.0, 589.0, 361.0, 266.0, 176.0, 99.0, 87.0, 55.0, 39.0, 24.0, 21.0, 11.0, 11.0, 8.0, 6.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-79.0, -76.49609375, -73.9921875, -71.48828125, -68.984375, -66.48046875, -63.9765625, -61.47265625, -58.96875, -56.46484375, -53.9609375, -51.45703125, -48.953125, -46.44921875, -43.9453125, -41.44140625, -38.9375, -36.43359375, -33.9296875, -31.42578125, -28.921875, -26.41796875, -23.9140625, -21.41015625, -18.90625, -16.40234375, -13.8984375, -11.39453125, -8.890625, -6.38671875, -3.8828125, -1.37890625, 1.125, 3.62890625, 6.1328125, 8.63671875, 11.140625, 13.64453125, 16.1484375, 18.65234375, 21.15625, 23.66015625, 26.1640625, 28.66796875, 31.171875, 33.67578125, 36.1796875, 38.68359375, 41.1875, 43.69140625, 46.1953125, 48.69921875, 51.203125, 53.70703125, 56.2109375, 58.71484375, 61.21875, 63.72265625, 66.2265625, 68.73046875, 71.234375, 73.73828125, 76.2421875, 78.74609375, 81.25]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 6.0, 6.0, 8.0, 9.0, 10.0, 6.0, 16.0, 20.0, 20.0, 27.0, 20.0, 21.0, 30.0, 35.0, 32.0, 34.0, 30.0, 37.0, 46.0, 37.0, 66.0, 49.0, 42.0, 39.0, 45.0, 27.0, 41.0, 32.0, 28.0, 27.0, 16.0, 25.0, 16.0, 26.0, 22.0, 12.0, 14.0, 8.0, 8.0, 6.0, 1.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-28.078125, -27.2275390625, -26.376953125, -25.5263671875, -24.67578125, -23.8251953125, -22.974609375, -22.1240234375, -21.2734375, -20.4228515625, -19.572265625, -18.7216796875, -17.87109375, -17.0205078125, -16.169921875, -15.3193359375, -14.46875, -13.6181640625, -12.767578125, -11.9169921875, -11.06640625, -10.2158203125, -9.365234375, -8.5146484375, -7.6640625, -6.8134765625, -5.962890625, -5.1123046875, -4.26171875, -3.4111328125, -2.560546875, -1.7099609375, -0.859375, -0.0087890625, 0.841796875, 1.6923828125, 2.54296875, 3.3935546875, 4.244140625, 5.0947265625, 5.9453125, 6.7958984375, 7.646484375, 8.4970703125, 9.34765625, 10.1982421875, 11.048828125, 11.8994140625, 12.75, 13.6005859375, 14.451171875, 15.3017578125, 16.15234375, 17.0029296875, 17.853515625, 18.7041015625, 19.5546875, 20.4052734375, 21.255859375, 22.1064453125, 22.95703125, 23.8076171875, 24.658203125, 25.5087890625, 26.359375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 14.0, 20.0, 28.0, 43.0, 73.0, 86.0, 167.0, 198.0, 298.0, 483.0, 659.0, 1043.0, 1682.0, 2660.0, 4420.0, 7454.0, 13150.0, 24861.0, 48597.0, 104016.0, 223955.0, 296027.0, 162721.0, 74891.0, 36202.0, 18989.0, 10283.0, 5901.0, 3512.0, 2151.0, 1347.0, 858.0, 574.0, 357.0, 288.0, 169.0, 112.0, 91.0, 52.0, 38.0, 27.0, 10.0, 15.0, 9.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-98.6875, -95.630859375, -92.57421875, -89.517578125, -86.4609375, -83.404296875, -80.34765625, -77.291015625, -74.234375, -71.177734375, -68.12109375, -65.064453125, -62.0078125, -58.951171875, -55.89453125, -52.837890625, -49.78125, -46.724609375, -43.66796875, -40.611328125, -37.5546875, -34.498046875, -31.44140625, -28.384765625, -25.328125, -22.271484375, -19.21484375, -16.158203125, -13.1015625, -10.044921875, -6.98828125, -3.931640625, -0.875, 2.181640625, 5.23828125, 8.294921875, 11.3515625, 14.408203125, 17.46484375, 20.521484375, 23.578125, 26.634765625, 29.69140625, 32.748046875, 35.8046875, 38.861328125, 41.91796875, 44.974609375, 48.03125, 51.087890625, 54.14453125, 57.201171875, 60.2578125, 63.314453125, 66.37109375, 69.427734375, 72.484375, 75.541015625, 78.59765625, 81.654296875, 84.7109375, 87.767578125, 90.82421875, 93.880859375, 96.9375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 13.0, 11.0, 6.0, 15.0, 13.0, 25.0, 16.0, 27.0, 29.0, 36.0, 40.0, 40.0, 42.0, 43.0, 58.0, 36.0, 37.0, 42.0, 37.0, 46.0, 42.0, 39.0, 41.0, 20.0, 28.0, 26.0, 37.0, 24.0, 24.0, 24.0, 10.0, 11.0, 8.0, 11.0, 6.0, 4.0, 7.0, 8.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.549072265625, -19.89501953125, -19.240966796875, -18.5869140625, -17.932861328125, -17.27880859375, -16.624755859375, -15.970703125, -15.316650390625, -14.66259765625, -14.008544921875, -13.3544921875, -12.700439453125, -12.04638671875, -11.392333984375, -10.73828125, -10.084228515625, -9.43017578125, -8.776123046875, -8.1220703125, -7.468017578125, -6.81396484375, -6.159912109375, -5.505859375, -4.851806640625, -4.19775390625, -3.543701171875, -2.8896484375, -2.235595703125, -1.58154296875, -0.927490234375, -0.2734375, 0.380615234375, 1.03466796875, 1.688720703125, 2.3427734375, 2.996826171875, 3.65087890625, 4.304931640625, 4.958984375, 5.613037109375, 6.26708984375, 6.921142578125, 7.5751953125, 8.229248046875, 8.88330078125, 9.537353515625, 10.19140625, 10.845458984375, 11.49951171875, 12.153564453125, 12.8076171875, 13.461669921875, 14.11572265625, 14.769775390625, 15.423828125, 16.077880859375, 16.73193359375, 17.385986328125, 18.0400390625, 18.694091796875, 19.34814453125, 20.002197265625, 20.65625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 11.0, 13.0, 18.0, 30.0, 24.0, 55.0, 75.0, 105.0, 145.0, 192.0, 309.0, 427.0, 616.0, 890.0, 1311.0, 2111.0, 3067.0, 4977.0, 8340.0, 15298.0, 32662.0, 109764.0, 596876.0, 184312.0, 42774.0, 18195.0, 9619.0, 5746.0, 3529.0, 2301.0, 1421.0, 990.0, 651.0, 499.0, 370.0, 251.0, 170.0, 122.0, 82.0, 62.0, 53.0, 27.0, 14.0, 17.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-152.375, -147.845703125, -143.31640625, -138.787109375, -134.2578125, -129.728515625, -125.19921875, -120.669921875, -116.140625, -111.611328125, -107.08203125, -102.552734375, -98.0234375, -93.494140625, -88.96484375, -84.435546875, -79.90625, -75.376953125, -70.84765625, -66.318359375, -61.7890625, -57.259765625, -52.73046875, -48.201171875, -43.671875, -39.142578125, -34.61328125, -30.083984375, -25.5546875, -21.025390625, -16.49609375, -11.966796875, -7.4375, -2.908203125, 1.62109375, 6.150390625, 10.6796875, 15.208984375, 19.73828125, 24.267578125, 28.796875, 33.326171875, 37.85546875, 42.384765625, 46.9140625, 51.443359375, 55.97265625, 60.501953125, 65.03125, 69.560546875, 74.08984375, 78.619140625, 83.1484375, 87.677734375, 92.20703125, 96.736328125, 101.265625, 105.794921875, 110.32421875, 114.853515625, 119.3828125, 123.912109375, 128.44140625, 132.970703125, 137.5]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 9.0, 8.0, 11.0, 13.0, 16.0, 25.0, 36.0, 95.0, 274.0, 269.0, 76.0, 42.0, 20.0, 19.0, 7.0, 8.0, 13.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0185546875, -0.01789093017578125, -0.0172271728515625, -0.01656341552734375, -0.015899658203125, -0.01523590087890625, -0.0145721435546875, -0.01390838623046875, -0.01324462890625, -0.01258087158203125, -0.0119171142578125, -0.01125335693359375, -0.010589599609375, -0.00992584228515625, -0.0092620849609375, -0.00859832763671875, -0.0079345703125, -0.00727081298828125, -0.0066070556640625, -0.00594329833984375, -0.005279541015625, -0.00461578369140625, -0.0039520263671875, -0.00328826904296875, -0.00262451171875, -0.00196075439453125, -0.0012969970703125, -0.00063323974609375, 3.0517578125e-05, 0.00069427490234375, 0.0013580322265625, 0.00202178955078125, 0.002685546875, 0.00334930419921875, 0.0040130615234375, 0.00467681884765625, 0.005340576171875, 0.00600433349609375, 0.0066680908203125, 0.00733184814453125, 0.00799560546875, 0.00865936279296875, 0.0093231201171875, 0.00998687744140625, 0.010650634765625, 0.01131439208984375, 0.0119781494140625, 0.01264190673828125, 0.0133056640625, 0.01396942138671875, 0.0146331787109375, 0.01529693603515625, 0.015960693359375, 0.01662445068359375, 0.0172882080078125, 0.01795196533203125, 0.01861572265625, 0.01927947998046875, 0.0199432373046875, 0.02060699462890625, 0.021270751953125, 0.02193450927734375, 0.0225982666015625, 0.02326202392578125, 0.02392578125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 9.0, 16.0, 23.0, 37.0, 46.0, 50.0, 72.0, 102.0, 162.0, 238.0, 344.0, 557.0, 813.0, 1285.0, 2061.0, 3373.0, 5559.0, 9355.0, 17526.0, 38478.0, 117393.0, 421733.0, 291464.0, 75171.0, 28342.0, 13998.0, 7888.0, 4624.0, 2910.0, 1717.0, 1024.0, 788.0, 475.0, 291.0, 197.0, 127.0, 84.0, 70.0, 47.0, 21.0, 18.0, 13.0, 8.0, 9.0, 13.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-95.0, -91.91796875, -88.8359375, -85.75390625, -82.671875, -79.58984375, -76.5078125, -73.42578125, -70.34375, -67.26171875, -64.1796875, -61.09765625, -58.015625, -54.93359375, -51.8515625, -48.76953125, -45.6875, -42.60546875, -39.5234375, -36.44140625, -33.359375, -30.27734375, -27.1953125, -24.11328125, -21.03125, -17.94921875, -14.8671875, -11.78515625, -8.703125, -5.62109375, -2.5390625, 0.54296875, 3.625, 6.70703125, 9.7890625, 12.87109375, 15.953125, 19.03515625, 22.1171875, 25.19921875, 28.28125, 31.36328125, 34.4453125, 37.52734375, 40.609375, 43.69140625, 46.7734375, 49.85546875, 52.9375, 56.01953125, 59.1015625, 62.18359375, 65.265625, 68.34765625, 71.4296875, 74.51171875, 77.59375, 80.67578125, 83.7578125, 86.83984375, 89.921875, 93.00390625, 96.0859375, 99.16796875, 102.25]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 9.0, 5.0, 10.0, 5.0, 6.0, 6.0, 12.0, 13.0, 21.0, 18.0, 24.0, 29.0, 55.0, 64.0, 87.0, 102.0, 106.0, 91.0, 69.0, 67.0, 37.0, 39.0, 20.0, 17.0, 15.0, 16.0, 9.0, 5.0, 6.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.59375, -23.880859375, -23.16796875, -22.455078125, -21.7421875, -21.029296875, -20.31640625, -19.603515625, -18.890625, -18.177734375, -17.46484375, -16.751953125, -16.0390625, -15.326171875, -14.61328125, -13.900390625, -13.1875, -12.474609375, -11.76171875, -11.048828125, -10.3359375, -9.623046875, -8.91015625, -8.197265625, -7.484375, -6.771484375, -6.05859375, -5.345703125, -4.6328125, -3.919921875, -3.20703125, -2.494140625, -1.78125, -1.068359375, -0.35546875, 0.357421875, 1.0703125, 1.783203125, 2.49609375, 3.208984375, 3.921875, 4.634765625, 5.34765625, 6.060546875, 6.7734375, 7.486328125, 8.19921875, 8.912109375, 9.625, 10.337890625, 11.05078125, 11.763671875, 12.4765625, 13.189453125, 13.90234375, 14.615234375, 15.328125, 16.041015625, 16.75390625, 17.466796875, 18.1796875, 18.892578125, 19.60546875, 20.318359375, 21.03125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 5.0, 14.0, 8.0, 16.0, 16.0, 25.0, 34.0, 33.0, 35.0, 52.0, 47.0, 55.0, 66.0, 65.0, 60.0, 55.0, 59.0, 45.0, 32.0, 42.0, 38.0, 33.0, 24.0, 21.0, 19.0, 25.0, 11.0, 9.0, 11.0, 11.0, 5.0, 3.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-45.637935638427734, -44.28535079956055, -42.93276596069336, -41.580177307128906, -40.22759246826172, -38.87500762939453, -37.522422790527344, -36.169837951660156, -34.81725311279297, -33.46466827392578, -32.112083435058594, -30.759496688842773, -29.406909942626953, -28.054325103759766, -26.701740264892578, -25.34915542602539, -23.996566772460938, -22.64398193359375, -21.29139518737793, -19.938810348510742, -18.586223602294922, -17.233638763427734, -15.881053924560547, -14.528468132019043, -13.175882339477539, -11.823296546936035, -10.470710754394531, -9.118125915527344, -7.76554012298584, -6.412954330444336, -5.060369491577148, -3.7077836990356445, -2.3552017211914062, -1.0026161670684814, 0.34996938705444336, 1.702554702758789, 3.055140495300293, 4.407726287841797, 5.760311126708984, 7.112896919250488, 8.465482711791992, 9.818068504333496, 11.170654296875, 12.523239135742188, 13.875824928283691, 15.228410720825195, 16.580995559692383, 17.933582305908203, 19.28616714477539, 20.638751983642578, 21.9913387298584, 23.343923568725586, 24.696510314941406, 26.049095153808594, 27.40167999267578, 28.75426483154297, 30.10685157775879, 31.459436416625977, 32.8120231628418, 34.164608001708984, 35.51719284057617, 36.869781494140625, 38.22236633300781, 39.574951171875, 40.92753601074219]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 6.0, 10.0, 14.0, 16.0, 16.0, 20.0, 23.0, 29.0, 27.0, 32.0, 43.0, 36.0, 32.0, 38.0, 41.0, 46.0, 38.0, 47.0, 47.0, 43.0, 62.0, 32.0, 35.0, 36.0, 27.0, 25.0, 25.0, 23.0, 21.0, 17.0, 20.0, 14.0, 8.0, 9.0, 5.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-39.595787048339844, -38.51987075805664, -37.44395446777344, -36.368038177490234, -35.29212188720703, -34.21620178222656, -33.14028549194336, -32.064369201660156, -30.988452911376953, -29.91253662109375, -28.836620330810547, -27.76070213317871, -26.684785842895508, -25.608869552612305, -24.53295135498047, -23.457035064697266, -22.381118774414062, -21.30520248413086, -20.229286193847656, -19.15336799621582, -18.077451705932617, -17.001535415649414, -15.925618171691895, -14.849700927734375, -13.773784637451172, -12.697868347167969, -11.62195110321045, -10.54603385925293, -9.470117568969727, -8.394201278686523, -7.318284034729004, -6.242367267608643, -5.166454315185547, -4.0905375480651855, -3.014620780944824, -1.938704013824463, -0.8627872467041016, 0.21312952041625977, 1.289046287536621, 2.3649630546569824, 3.4408798217773438, 4.516796588897705, 5.592713356018066, 6.668630123138428, 7.744546890258789, 8.820463180541992, 9.896380424499512, 10.972297668457031, 12.048213958740234, 13.124130249023438, 14.200047492980957, 15.275964736938477, 16.35188102722168, 17.427797317504883, 18.50371551513672, 19.579631805419922, 20.655548095703125, 21.731464385986328, 22.80738067626953, 23.883298873901367, 24.95921516418457, 26.035131454467773, 27.11104965209961, 28.186965942382812, 29.262882232666016]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [6.0, 5.0, 9.0, 7.0, 15.0, 13.0, 33.0, 40.0, 47.0, 88.0, 115.0, 203.0, 281.0, 459.0, 731.0, 1130.0, 1688.0, 2607.0, 3929.0, 6137.0, 9498.0, 14248.0, 21715.0, 32473.0, 48252.0, 70061.0, 97450.0, 126277.0, 140873.0, 131171.0, 104490.0, 76280.0, 53360.0, 35864.0, 24035.0, 15502.0, 10347.0, 6799.0, 4300.0, 2815.0, 1815.0, 1201.0, 744.0, 511.0, 342.0, 215.0, 142.0, 81.0, 55.0, 29.0, 24.0, 23.0, 18.0, 4.0, 3.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.53125, -36.2197265625, -34.908203125, -33.5966796875, -32.28515625, -30.9736328125, -29.662109375, -28.3505859375, -27.0390625, -25.7275390625, -24.416015625, -23.1044921875, -21.79296875, -20.4814453125, -19.169921875, -17.8583984375, -16.546875, -15.2353515625, -13.923828125, -12.6123046875, -11.30078125, -9.9892578125, -8.677734375, -7.3662109375, -6.0546875, -4.7431640625, -3.431640625, -2.1201171875, -0.80859375, 0.5029296875, 1.814453125, 3.1259765625, 4.4375, 5.7490234375, 7.060546875, 8.3720703125, 9.68359375, 10.9951171875, 12.306640625, 13.6181640625, 14.9296875, 16.2412109375, 17.552734375, 18.8642578125, 20.17578125, 21.4873046875, 22.798828125, 24.1103515625, 25.421875, 26.7333984375, 28.044921875, 29.3564453125, 30.66796875, 31.9794921875, 33.291015625, 34.6025390625, 35.9140625, 37.2255859375, 38.537109375, 39.8486328125, 41.16015625, 42.4716796875, 43.783203125, 45.0947265625, 46.40625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 5.0, 10.0, 5.0, 13.0, 13.0, 22.0, 20.0, 21.0, 22.0, 23.0, 30.0, 31.0, 24.0, 37.0, 44.0, 46.0, 40.0, 44.0, 47.0, 48.0, 52.0, 37.0, 55.0, 37.0, 39.0, 32.0, 27.0, 28.0, 26.0, 22.0, 22.0, 14.0, 12.0, 10.0, 7.0, 4.0, 9.0, 4.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0], "bins": [-37.46875, -36.496826171875, -35.52490234375, -34.552978515625, -33.5810546875, -32.609130859375, -31.63720703125, -30.665283203125, -29.693359375, -28.721435546875, -27.74951171875, -26.777587890625, -25.8056640625, -24.833740234375, -23.86181640625, -22.889892578125, -21.91796875, -20.946044921875, -19.97412109375, -19.002197265625, -18.0302734375, -17.058349609375, -16.08642578125, -15.114501953125, -14.142578125, -13.170654296875, -12.19873046875, -11.226806640625, -10.2548828125, -9.282958984375, -8.31103515625, -7.339111328125, -6.3671875, -5.395263671875, -4.42333984375, -3.451416015625, -2.4794921875, -1.507568359375, -0.53564453125, 0.436279296875, 1.408203125, 2.380126953125, 3.35205078125, 4.323974609375, 5.2958984375, 6.267822265625, 7.23974609375, 8.211669921875, 9.18359375, 10.155517578125, 11.12744140625, 12.099365234375, 13.0712890625, 14.043212890625, 15.01513671875, 15.987060546875, 16.958984375, 17.930908203125, 18.90283203125, 19.874755859375, 20.8466796875, 21.818603515625, 22.79052734375, 23.762451171875, 24.734375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 2.0, 7.0, 14.0, 13.0, 26.0, 37.0, 57.0, 76.0, 140.0, 191.0, 283.0, 438.0, 597.0, 930.0, 1404.0, 2122.0, 3163.0, 4835.0, 7439.0, 11390.0, 17023.0, 26123.0, 38746.0, 56874.0, 80550.0, 107483.0, 129412.0, 134885.0, 119646.0, 94251.0, 68688.0, 47649.0, 31730.0, 21249.0, 13945.0, 9156.0, 6016.0, 4072.0, 2640.0, 1739.0, 1165.0, 840.0, 526.0, 327.0, 235.0, 154.0, 94.0, 53.0, 36.0, 29.0, 15.0, 14.0, 15.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-35.0, -33.84326171875, -32.6865234375, -31.52978515625, -30.373046875, -29.21630859375, -28.0595703125, -26.90283203125, -25.74609375, -24.58935546875, -23.4326171875, -22.27587890625, -21.119140625, -19.96240234375, -18.8056640625, -17.64892578125, -16.4921875, -15.33544921875, -14.1787109375, -13.02197265625, -11.865234375, -10.70849609375, -9.5517578125, -8.39501953125, -7.23828125, -6.08154296875, -4.9248046875, -3.76806640625, -2.611328125, -1.45458984375, -0.2978515625, 0.85888671875, 2.015625, 3.17236328125, 4.3291015625, 5.48583984375, 6.642578125, 7.79931640625, 8.9560546875, 10.11279296875, 11.26953125, 12.42626953125, 13.5830078125, 14.73974609375, 15.896484375, 17.05322265625, 18.2099609375, 19.36669921875, 20.5234375, 21.68017578125, 22.8369140625, 23.99365234375, 25.150390625, 26.30712890625, 27.4638671875, 28.62060546875, 29.77734375, 30.93408203125, 32.0908203125, 33.24755859375, 34.404296875, 35.56103515625, 36.7177734375, 37.87451171875, 39.03125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 8.0, 14.0, 17.0, 16.0, 21.0, 23.0, 23.0, 22.0, 33.0, 29.0, 31.0, 49.0, 28.0, 36.0, 34.0, 35.0, 47.0, 51.0, 30.0, 44.0, 37.0, 43.0, 40.0, 35.0, 21.0, 34.0, 23.0, 30.0, 25.0, 19.0, 13.0, 12.0, 13.0, 10.0, 12.0, 6.0, 10.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.265625, -19.647705078125, -19.02978515625, -18.411865234375, -17.7939453125, -17.176025390625, -16.55810546875, -15.940185546875, -15.322265625, -14.704345703125, -14.08642578125, -13.468505859375, -12.8505859375, -12.232666015625, -11.61474609375, -10.996826171875, -10.37890625, -9.760986328125, -9.14306640625, -8.525146484375, -7.9072265625, -7.289306640625, -6.67138671875, -6.053466796875, -5.435546875, -4.817626953125, -4.19970703125, -3.581787109375, -2.9638671875, -2.345947265625, -1.72802734375, -1.110107421875, -0.4921875, 0.125732421875, 0.74365234375, 1.361572265625, 1.9794921875, 2.597412109375, 3.21533203125, 3.833251953125, 4.451171875, 5.069091796875, 5.68701171875, 6.304931640625, 6.9228515625, 7.540771484375, 8.15869140625, 8.776611328125, 9.39453125, 10.012451171875, 10.63037109375, 11.248291015625, 11.8662109375, 12.484130859375, 13.10205078125, 13.719970703125, 14.337890625, 14.955810546875, 15.57373046875, 16.191650390625, 16.8095703125, 17.427490234375, 18.04541015625, 18.663330078125, 19.28125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 7.0, 9.0, 17.0, 33.0, 43.0, 54.0, 90.0, 135.0, 209.0, 285.0, 448.0, 707.0, 1080.0, 1896.0, 3032.0, 5143.0, 9103.0, 16372.0, 31125.0, 61358.0, 123914.0, 223624.0, 250382.0, 154832.0, 78180.0, 39308.0, 20326.0, 11189.0, 6207.0, 3626.0, 2092.0, 1374.0, 842.0, 557.0, 303.0, 228.0, 139.0, 102.0, 53.0, 39.0, 27.0, 18.0, 13.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-47.125, -45.66015625, -44.1953125, -42.73046875, -41.265625, -39.80078125, -38.3359375, -36.87109375, -35.40625, -33.94140625, -32.4765625, -31.01171875, -29.546875, -28.08203125, -26.6171875, -25.15234375, -23.6875, -22.22265625, -20.7578125, -19.29296875, -17.828125, -16.36328125, -14.8984375, -13.43359375, -11.96875, -10.50390625, -9.0390625, -7.57421875, -6.109375, -4.64453125, -3.1796875, -1.71484375, -0.25, 1.21484375, 2.6796875, 4.14453125, 5.609375, 7.07421875, 8.5390625, 10.00390625, 11.46875, 12.93359375, 14.3984375, 15.86328125, 17.328125, 18.79296875, 20.2578125, 21.72265625, 23.1875, 24.65234375, 26.1171875, 27.58203125, 29.046875, 30.51171875, 31.9765625, 33.44140625, 34.90625, 36.37109375, 37.8359375, 39.30078125, 40.765625, 42.23046875, 43.6953125, 45.16015625, 46.625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 5.0, 1.0, 4.0, 6.0, 0.0, 6.0, 7.0, 12.0, 8.0, 11.0, 15.0, 11.0, 26.0, 33.0, 34.0, 37.0, 47.0, 61.0, 61.0, 51.0, 57.0, 64.0, 58.0, 59.0, 48.0, 46.0, 29.0, 33.0, 36.0, 29.0, 23.0, 18.0, 15.0, 11.0, 10.0, 11.0, 3.0, 7.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0034732818603515625, -0.0033621788024902344, -0.0032510757446289062, -0.003139972686767578, -0.00302886962890625, -0.002917766571044922, -0.0028066635131835938, -0.0026955604553222656, -0.0025844573974609375, -0.0024733543395996094, -0.0023622512817382812, -0.002251148223876953, -0.002140045166015625, -0.002028942108154297, -0.0019178390502929688, -0.0018067359924316406, -0.0016956329345703125, -0.0015845298767089844, -0.0014734268188476562, -0.0013623237609863281, -0.001251220703125, -0.0011401176452636719, -0.0010290145874023438, -0.0009179115295410156, -0.0008068084716796875, -0.0006957054138183594, -0.0005846023559570312, -0.0004734992980957031, -0.000362396240234375, -0.0002512931823730469, -0.00014019012451171875, -2.9087066650390625e-05, 8.20159912109375e-05, 0.00019311904907226562, 0.00030422210693359375, 0.0004153251647949219, 0.00052642822265625, 0.0006375312805175781, 0.0007486343383789062, 0.0008597373962402344, 0.0009708404541015625, 0.0010819435119628906, 0.0011930465698242188, 0.0013041496276855469, 0.001415252685546875, 0.0015263557434082031, 0.0016374588012695312, 0.0017485618591308594, 0.0018596649169921875, 0.0019707679748535156, 0.0020818710327148438, 0.002192974090576172, 0.0023040771484375, 0.002415180206298828, 0.0025262832641601562, 0.0026373863220214844, 0.0027484893798828125, 0.0028595924377441406, 0.0029706954956054688, 0.003081798553466797, 0.003192901611328125, 0.003304004669189453, 0.0034151077270507812, 0.0035262107849121094, 0.0036373138427734375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 11.0, 8.0, 17.0, 31.0, 35.0, 39.0, 78.0, 120.0, 160.0, 236.0, 332.0, 512.0, 781.0, 1132.0, 1726.0, 2714.0, 4193.0, 6529.0, 10633.0, 17356.0, 29805.0, 51521.0, 91241.0, 157171.0, 219909.0, 185428.0, 111903.0, 63240.0, 35918.0, 21156.0, 12641.0, 7891.0, 4928.0, 3121.0, 2042.0, 1289.0, 861.0, 593.0, 410.0, 271.0, 174.0, 121.0, 105.0, 58.0, 47.0, 28.0, 14.0, 9.0, 3.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.125, -36.88232421875, -35.6396484375, -34.39697265625, -33.154296875, -31.91162109375, -30.6689453125, -29.42626953125, -28.18359375, -26.94091796875, -25.6982421875, -24.45556640625, -23.212890625, -21.97021484375, -20.7275390625, -19.48486328125, -18.2421875, -16.99951171875, -15.7568359375, -14.51416015625, -13.271484375, -12.02880859375, -10.7861328125, -9.54345703125, -8.30078125, -7.05810546875, -5.8154296875, -4.57275390625, -3.330078125, -2.08740234375, -0.8447265625, 0.39794921875, 1.640625, 2.88330078125, 4.1259765625, 5.36865234375, 6.611328125, 7.85400390625, 9.0966796875, 10.33935546875, 11.58203125, 12.82470703125, 14.0673828125, 15.31005859375, 16.552734375, 17.79541015625, 19.0380859375, 20.28076171875, 21.5234375, 22.76611328125, 24.0087890625, 25.25146484375, 26.494140625, 27.73681640625, 28.9794921875, 30.22216796875, 31.46484375, 32.70751953125, 33.9501953125, 35.19287109375, 36.435546875, 37.67822265625, 38.9208984375, 40.16357421875, 41.40625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 7.0, 5.0, 7.0, 11.0, 14.0, 22.0, 14.0, 20.0, 25.0, 35.0, 36.0, 35.0, 45.0, 58.0, 73.0, 71.0, 62.0, 58.0, 56.0, 56.0, 49.0, 38.0, 28.0, 31.0, 19.0, 22.0, 15.0, 12.0, 9.0, 19.0, 6.0, 9.0, 5.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.2265625, -12.818603515625, -12.41064453125, -12.002685546875, -11.5947265625, -11.186767578125, -10.77880859375, -10.370849609375, -9.962890625, -9.554931640625, -9.14697265625, -8.739013671875, -8.3310546875, -7.923095703125, -7.51513671875, -7.107177734375, -6.69921875, -6.291259765625, -5.88330078125, -5.475341796875, -5.0673828125, -4.659423828125, -4.25146484375, -3.843505859375, -3.435546875, -3.027587890625, -2.61962890625, -2.211669921875, -1.8037109375, -1.395751953125, -0.98779296875, -0.579833984375, -0.171875, 0.236083984375, 0.64404296875, 1.052001953125, 1.4599609375, 1.867919921875, 2.27587890625, 2.683837890625, 3.091796875, 3.499755859375, 3.90771484375, 4.315673828125, 4.7236328125, 5.131591796875, 5.53955078125, 5.947509765625, 6.35546875, 6.763427734375, 7.17138671875, 7.579345703125, 7.9873046875, 8.395263671875, 8.80322265625, 9.211181640625, 9.619140625, 10.027099609375, 10.43505859375, 10.843017578125, 11.2509765625, 11.658935546875, 12.06689453125, 12.474853515625, 12.8828125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 12.0, 13.0, 8.0, 14.0, 20.0, 20.0, 27.0, 42.0, 40.0, 49.0, 65.0, 51.0, 58.0, 55.0, 52.0, 49.0, 62.0, 47.0, 49.0, 36.0, 35.0, 39.0, 24.0, 23.0, 17.0, 14.0, 18.0, 10.0, 8.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-40.51506423950195, -39.29050827026367, -38.065956115722656, -36.841400146484375, -35.616844177246094, -34.39228820800781, -33.16773223876953, -31.943180084228516, -30.718624114990234, -29.494068145751953, -28.269514083862305, -27.044960021972656, -25.820404052734375, -24.595848083496094, -23.371294021606445, -22.146739959716797, -20.922183990478516, -19.697628021240234, -18.473073959350586, -17.248519897460938, -16.023963928222656, -14.799408912658691, -13.574853897094727, -12.350298881530762, -11.125743865966797, -9.901188850402832, -8.676633834838867, -7.452078819274902, -6.2275238037109375, -5.002968788146973, -3.778413772583008, -2.553858757019043, -1.3293075561523438, -0.1047525405883789, 1.119802474975586, 2.344357490539551, 3.5689125061035156, 4.7934675216674805, 6.018022537231445, 7.24257755279541, 8.467132568359375, 9.69168758392334, 10.916242599487305, 12.14079761505127, 13.365352630615234, 14.5899076461792, 15.814462661743164, 17.039016723632812, 18.263572692871094, 19.488128662109375, 20.712682723999023, 21.937236785888672, 23.161792755126953, 24.386348724365234, 25.610902786254883, 26.83545684814453, 28.060012817382812, 29.284568786621094, 30.509122848510742, 31.73367691040039, 32.95823287963867, 34.18278884887695, 35.40734100341797, 36.63189697265625, 37.85645294189453]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 6.0, 9.0, 13.0, 15.0, 16.0, 22.0, 21.0, 24.0, 28.0, 26.0, 25.0, 38.0, 34.0, 36.0, 37.0, 29.0, 38.0, 44.0, 38.0, 55.0, 41.0, 33.0, 45.0, 36.0, 29.0, 33.0, 35.0, 27.0, 20.0, 23.0, 15.0, 20.0, 17.0, 14.0, 11.0, 5.0, 10.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.519691467285156, -35.51594924926758, -34.51220703125, -33.50846481323242, -32.504722595214844, -31.500980377197266, -30.497238159179688, -29.49349594116211, -28.48975372314453, -27.486011505126953, -26.482269287109375, -25.478527069091797, -24.47478485107422, -23.47104263305664, -22.467300415039062, -21.463558197021484, -20.459814071655273, -19.456071853637695, -18.452329635620117, -17.44858741760254, -16.44484519958496, -15.441102981567383, -14.437359809875488, -13.43361759185791, -12.429875373840332, -11.426133155822754, -10.422390937805176, -9.418647766113281, -8.414905548095703, -7.411163806915283, -6.407421112060547, -5.403678894042969, -4.399938583374023, -3.3961963653564453, -2.392453908920288, -1.3887114524841309, -0.38496923446655273, 0.6187729835510254, 1.6225156784057617, 2.62625789642334, 3.630000114440918, 4.633742332458496, 5.637484550476074, 6.6412272453308105, 7.644969463348389, 8.648712158203125, 9.652454376220703, 10.656196594238281, 11.65993881225586, 12.663681030273438, 13.667423248291016, 14.671165466308594, 15.674907684326172, 16.67864990234375, 17.682392120361328, 18.686134338378906, 19.689876556396484, 20.693618774414062, 21.69736099243164, 22.70110321044922, 23.704845428466797, 24.708587646484375, 25.712329864501953, 26.71607208251953, 27.719816207885742]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 10.0, 14.0, 21.0, 33.0, 59.0, 99.0, 137.0, 191.0, 320.0, 511.0, 854.0, 1313.0, 2147.0, 3508.0, 5504.0, 8579.0, 14706.0, 24391.0, 42282.0, 75697.0, 140901.0, 280759.0, 587076.0, 982941.0, 939322.0, 535048.0, 254687.0, 128304.0, 69311.0, 38612.0, 22349.0, 13485.0, 8205.0, 4786.0, 2991.0, 1909.0, 1282.0, 755.0, 445.0, 289.0, 171.0, 112.0, 69.0, 35.0, 26.0, 14.0, 14.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-38.59375, -37.51953125, -36.4453125, -35.37109375, -34.296875, -33.22265625, -32.1484375, -31.07421875, -30.0, -28.92578125, -27.8515625, -26.77734375, -25.703125, -24.62890625, -23.5546875, -22.48046875, -21.40625, -20.33203125, -19.2578125, -18.18359375, -17.109375, -16.03515625, -14.9609375, -13.88671875, -12.8125, -11.73828125, -10.6640625, -9.58984375, -8.515625, -7.44140625, -6.3671875, -5.29296875, -4.21875, -3.14453125, -2.0703125, -0.99609375, 0.078125, 1.15234375, 2.2265625, 3.30078125, 4.375, 5.44921875, 6.5234375, 7.59765625, 8.671875, 9.74609375, 10.8203125, 11.89453125, 12.96875, 14.04296875, 15.1171875, 16.19140625, 17.265625, 18.33984375, 19.4140625, 20.48828125, 21.5625, 22.63671875, 23.7109375, 24.78515625, 25.859375, 26.93359375, 28.0078125, 29.08203125, 30.15625]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 9.0, 6.0, 11.0, 12.0, 11.0, 19.0, 11.0, 26.0, 14.0, 27.0, 23.0, 31.0, 28.0, 32.0, 32.0, 35.0, 32.0, 48.0, 32.0, 35.0, 36.0, 41.0, 35.0, 39.0, 46.0, 31.0, 38.0, 34.0, 28.0, 38.0, 27.0, 18.0, 22.0, 18.0, 18.0, 8.0, 12.0, 13.0, 7.0, 2.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-24.234375, -23.551025390625, -22.86767578125, -22.184326171875, -21.5009765625, -20.817626953125, -20.13427734375, -19.450927734375, -18.767578125, -18.084228515625, -17.40087890625, -16.717529296875, -16.0341796875, -15.350830078125, -14.66748046875, -13.984130859375, -13.30078125, -12.617431640625, -11.93408203125, -11.250732421875, -10.5673828125, -9.884033203125, -9.20068359375, -8.517333984375, -7.833984375, -7.150634765625, -6.46728515625, -5.783935546875, -5.1005859375, -4.417236328125, -3.73388671875, -3.050537109375, -2.3671875, -1.683837890625, -1.00048828125, -0.317138671875, 0.3662109375, 1.049560546875, 1.73291015625, 2.416259765625, 3.099609375, 3.782958984375, 4.46630859375, 5.149658203125, 5.8330078125, 6.516357421875, 7.19970703125, 7.883056640625, 8.56640625, 9.249755859375, 9.93310546875, 10.616455078125, 11.2998046875, 11.983154296875, 12.66650390625, 13.349853515625, 14.033203125, 14.716552734375, 15.39990234375, 16.083251953125, 16.7666015625, 17.449951171875, 18.13330078125, 18.816650390625, 19.5]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 7.0, 11.0, 30.0, 38.0, 70.0, 89.0, 124.0, 201.0, 325.0, 484.0, 804.0, 1177.0, 2106.0, 3283.0, 5291.0, 8904.0, 14671.0, 25677.0, 44909.0, 79651.0, 145315.0, 270014.0, 501757.0, 852290.0, 926745.0, 595443.0, 322807.0, 172219.0, 93901.0, 52435.0, 29862.0, 17075.0, 10211.0, 6169.0, 3887.0, 2285.0, 1445.0, 932.0, 579.0, 376.0, 258.0, 140.0, 94.0, 66.0, 46.0, 29.0, 17.0, 11.0, 9.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.9375, -32.8115234375, -31.685546875, -30.5595703125, -29.43359375, -28.3076171875, -27.181640625, -26.0556640625, -24.9296875, -23.8037109375, -22.677734375, -21.5517578125, -20.42578125, -19.2998046875, -18.173828125, -17.0478515625, -15.921875, -14.7958984375, -13.669921875, -12.5439453125, -11.41796875, -10.2919921875, -9.166015625, -8.0400390625, -6.9140625, -5.7880859375, -4.662109375, -3.5361328125, -2.41015625, -1.2841796875, -0.158203125, 0.9677734375, 2.09375, 3.2197265625, 4.345703125, 5.4716796875, 6.59765625, 7.7236328125, 8.849609375, 9.9755859375, 11.1015625, 12.2275390625, 13.353515625, 14.4794921875, 15.60546875, 16.7314453125, 17.857421875, 18.9833984375, 20.109375, 21.2353515625, 22.361328125, 23.4873046875, 24.61328125, 25.7392578125, 26.865234375, 27.9912109375, 29.1171875, 30.2431640625, 31.369140625, 32.4951171875, 33.62109375, 34.7470703125, 35.873046875, 36.9990234375, 38.125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 6.0, 18.0, 10.0, 15.0, 20.0, 38.0, 28.0, 49.0, 53.0, 56.0, 84.0, 97.0, 125.0, 144.0, 182.0, 206.0, 226.0, 264.0, 273.0, 303.0, 264.0, 252.0, 216.0, 165.0, 181.0, 140.0, 122.0, 111.0, 86.0, 71.0, 48.0, 48.0, 39.0, 31.0, 15.0, 11.0, 20.0, 11.0, 11.0, 11.0, 4.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.234375, -11.8409423828125, -11.447509765625, -11.0540771484375, -10.66064453125, -10.2672119140625, -9.873779296875, -9.4803466796875, -9.0869140625, -8.6934814453125, -8.300048828125, -7.9066162109375, -7.51318359375, -7.1197509765625, -6.726318359375, -6.3328857421875, -5.939453125, -5.5460205078125, -5.152587890625, -4.7591552734375, -4.36572265625, -3.9722900390625, -3.578857421875, -3.1854248046875, -2.7919921875, -2.3985595703125, -2.005126953125, -1.6116943359375, -1.21826171875, -0.8248291015625, -0.431396484375, -0.0379638671875, 0.35546875, 0.7489013671875, 1.142333984375, 1.5357666015625, 1.92919921875, 2.3226318359375, 2.716064453125, 3.1094970703125, 3.5029296875, 3.8963623046875, 4.289794921875, 4.6832275390625, 5.07666015625, 5.4700927734375, 5.863525390625, 6.2569580078125, 6.650390625, 7.0438232421875, 7.437255859375, 7.8306884765625, 8.22412109375, 8.6175537109375, 9.010986328125, 9.4044189453125, 9.7978515625, 10.1912841796875, 10.584716796875, 10.9781494140625, 11.37158203125, 11.7650146484375, 12.158447265625, 12.5518798828125, 12.9453125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 9.0, 7.0, 13.0, 19.0, 14.0, 16.0, 25.0, 20.0, 33.0, 43.0, 45.0, 57.0, 78.0, 54.0, 61.0, 81.0, 53.0, 65.0, 43.0, 44.0, 29.0, 41.0, 31.0, 27.0, 16.0, 12.0, 19.0, 9.0, 9.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.2911491394043, -36.08531951904297, -34.87948989868164, -33.67366027832031, -32.46782684326172, -31.26199722290039, -30.056167602539062, -28.850337982177734, -27.644508361816406, -26.438678741455078, -25.232847213745117, -24.02701759338379, -22.82118797302246, -21.6153564453125, -20.409526824951172, -19.203697204589844, -17.997865676879883, -16.792036056518555, -15.58620548248291, -14.380374908447266, -13.174545288085938, -11.968714714050293, -10.762884140014648, -9.55705451965332, -8.351223945617676, -7.1453938484191895, -5.939563751220703, -4.733733177185059, -3.5279030799865723, -2.322072982788086, -1.1162424087524414, 0.08958721160888672, 1.2954177856445312, 2.5012478828430176, 3.707078218460083, 4.912908554077148, 6.118738651275635, 7.324568748474121, 8.530399322509766, 9.736228942871094, 10.942059516906738, 12.147890090942383, 13.353719711303711, 14.559550285339355, 15.765380859375, 16.971210479736328, 18.177040100097656, 19.382869720458984, 20.588701248168945, 21.794530868530273, 23.000362396240234, 24.206192016601562, 25.41202163696289, 26.61785125732422, 27.82368278503418, 29.029512405395508, 30.23534393310547, 31.441173553466797, 32.647003173828125, 33.85283660888672, 35.05866622924805, 36.264495849609375, 37.4703254699707, 38.67615509033203, 39.88198471069336]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 9.0, 14.0, 12.0, 24.0, 15.0, 18.0, 25.0, 22.0, 22.0, 26.0, 34.0, 36.0, 39.0, 37.0, 43.0, 54.0, 49.0, 49.0, 48.0, 31.0, 49.0, 32.0, 46.0, 35.0, 34.0, 29.0, 18.0, 12.0, 21.0, 16.0, 13.0, 16.0, 14.0, 7.0, 9.0, 3.0, 5.0, 7.0, 6.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.34120559692383, -32.357147216796875, -31.373088836669922, -30.38903045654297, -29.404972076416016, -28.420913696289062, -27.436853408813477, -26.452795028686523, -25.46873664855957, -24.484678268432617, -23.500619888305664, -22.51656150817871, -21.532501220703125, -20.548442840576172, -19.56438446044922, -18.580326080322266, -17.596267700195312, -16.61220932006836, -15.628150939941406, -14.644091606140137, -13.660033226013184, -12.67597484588623, -11.691915512084961, -10.707857131958008, -9.723798751831055, -8.739740371704102, -7.75568151473999, -6.771622657775879, -5.787564277648926, -4.803505897521973, -3.8194470405578613, -2.83538818359375, -1.8513317108154297, -0.8672730922698975, 0.11678552627563477, 1.100844144821167, 2.084902763366699, 3.0689611434936523, 4.053020000457764, 5.037078857421875, 6.021137237548828, 7.005195617675781, 7.989254474639893, 8.973313331604004, 9.957371711730957, 10.94143009185791, 11.92548942565918, 12.909547805786133, 13.893606185913086, 14.877664566040039, 15.861722946166992, 16.845781326293945, 17.82984161376953, 18.813899993896484, 19.797958374023438, 20.78201675415039, 21.766075134277344, 22.750133514404297, 23.73419189453125, 24.718250274658203, 25.702308654785156, 26.68636703491211, 27.670427322387695, 28.65448570251465, 29.6385440826416]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 9.0, 7.0, 10.0, 25.0, 33.0, 46.0, 53.0, 69.0, 100.0, 146.0, 222.0, 295.0, 408.0, 681.0, 984.0, 1401.0, 2304.0, 3941.0, 6564.0, 12318.0, 25783.0, 62724.0, 173512.0, 379890.0, 228695.0, 81377.0, 32166.0, 14897.0, 7704.0, 4450.0, 2662.0, 1728.0, 1093.0, 676.0, 468.0, 325.0, 230.0, 166.0, 106.0, 77.0, 59.0, 61.0, 31.0, 19.0, 17.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-100.875, -97.58203125, -94.2890625, -90.99609375, -87.703125, -84.41015625, -81.1171875, -77.82421875, -74.53125, -71.23828125, -67.9453125, -64.65234375, -61.359375, -58.06640625, -54.7734375, -51.48046875, -48.1875, -44.89453125, -41.6015625, -38.30859375, -35.015625, -31.72265625, -28.4296875, -25.13671875, -21.84375, -18.55078125, -15.2578125, -11.96484375, -8.671875, -5.37890625, -2.0859375, 1.20703125, 4.5, 7.79296875, 11.0859375, 14.37890625, 17.671875, 20.96484375, 24.2578125, 27.55078125, 30.84375, 34.13671875, 37.4296875, 40.72265625, 44.015625, 47.30859375, 50.6015625, 53.89453125, 57.1875, 60.48046875, 63.7734375, 67.06640625, 70.359375, 73.65234375, 76.9453125, 80.23828125, 83.53125, 86.82421875, 90.1171875, 93.41015625, 96.703125, 99.99609375, 103.2890625, 106.58203125, 109.875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 9.0, 7.0, 6.0, 15.0, 8.0, 18.0, 19.0, 20.0, 31.0, 25.0, 29.0, 28.0, 25.0, 46.0, 60.0, 51.0, 51.0, 43.0, 53.0, 45.0, 43.0, 46.0, 36.0, 46.0, 41.0, 42.0, 29.0, 12.0, 21.0, 17.0, 14.0, 7.0, 12.0, 12.0, 9.0, 4.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.71875, -33.695556640625, -32.67236328125, -31.649169921875, -30.6259765625, -29.602783203125, -28.57958984375, -27.556396484375, -26.533203125, -25.510009765625, -24.48681640625, -23.463623046875, -22.4404296875, -21.417236328125, -20.39404296875, -19.370849609375, -18.34765625, -17.324462890625, -16.30126953125, -15.278076171875, -14.2548828125, -13.231689453125, -12.20849609375, -11.185302734375, -10.162109375, -9.138916015625, -8.11572265625, -7.092529296875, -6.0693359375, -5.046142578125, -4.02294921875, -2.999755859375, -1.9765625, -0.953369140625, 0.06982421875, 1.093017578125, 2.1162109375, 3.139404296875, 4.16259765625, 5.185791015625, 6.208984375, 7.232177734375, 8.25537109375, 9.278564453125, 10.3017578125, 11.324951171875, 12.34814453125, 13.371337890625, 14.39453125, 15.417724609375, 16.44091796875, 17.464111328125, 18.4873046875, 19.510498046875, 20.53369140625, 21.556884765625, 22.580078125, 23.603271484375, 24.62646484375, 25.649658203125, 26.6728515625, 27.696044921875, 28.71923828125, 29.742431640625, 30.765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 11.0, 11.0, 30.0, 27.0, 32.0, 77.0, 93.0, 153.0, 210.0, 311.0, 495.0, 726.0, 1094.0, 1823.0, 2958.0, 5358.0, 10496.0, 21978.0, 54372.0, 165032.0, 437918.0, 221991.0, 68901.0, 26761.0, 12339.0, 6274.0, 3382.0, 2046.0, 1253.0, 789.0, 563.0, 351.0, 228.0, 162.0, 90.0, 65.0, 45.0, 33.0, 24.0, 17.0, 6.0, 10.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.5, -92.4794921875, -89.458984375, -86.4384765625, -83.41796875, -80.3974609375, -77.376953125, -74.3564453125, -71.3359375, -68.3154296875, -65.294921875, -62.2744140625, -59.25390625, -56.2333984375, -53.212890625, -50.1923828125, -47.171875, -44.1513671875, -41.130859375, -38.1103515625, -35.08984375, -32.0693359375, -29.048828125, -26.0283203125, -23.0078125, -19.9873046875, -16.966796875, -13.9462890625, -10.92578125, -7.9052734375, -4.884765625, -1.8642578125, 1.15625, 4.1767578125, 7.197265625, 10.2177734375, 13.23828125, 16.2587890625, 19.279296875, 22.2998046875, 25.3203125, 28.3408203125, 31.361328125, 34.3818359375, 37.40234375, 40.4228515625, 43.443359375, 46.4638671875, 49.484375, 52.5048828125, 55.525390625, 58.5458984375, 61.56640625, 64.5869140625, 67.607421875, 70.6279296875, 73.6484375, 76.6689453125, 79.689453125, 82.7099609375, 85.73046875, 88.7509765625, 91.771484375, 94.7919921875, 97.8125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 8.0, 9.0, 6.0, 16.0, 13.0, 13.0, 23.0, 23.0, 29.0, 30.0, 31.0, 39.0, 40.0, 44.0, 40.0, 54.0, 46.0, 52.0, 57.0, 42.0, 45.0, 33.0, 41.0, 35.0, 31.0, 31.0, 31.0, 24.0, 28.0, 11.0, 13.0, 7.0, 9.0, 9.0, 5.0, 10.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.375, -18.74267578125, -18.1103515625, -17.47802734375, -16.845703125, -16.21337890625, -15.5810546875, -14.94873046875, -14.31640625, -13.68408203125, -13.0517578125, -12.41943359375, -11.787109375, -11.15478515625, -10.5224609375, -9.89013671875, -9.2578125, -8.62548828125, -7.9931640625, -7.36083984375, -6.728515625, -6.09619140625, -5.4638671875, -4.83154296875, -4.19921875, -3.56689453125, -2.9345703125, -2.30224609375, -1.669921875, -1.03759765625, -0.4052734375, 0.22705078125, 0.859375, 1.49169921875, 2.1240234375, 2.75634765625, 3.388671875, 4.02099609375, 4.6533203125, 5.28564453125, 5.91796875, 6.55029296875, 7.1826171875, 7.81494140625, 8.447265625, 9.07958984375, 9.7119140625, 10.34423828125, 10.9765625, 11.60888671875, 12.2412109375, 12.87353515625, 13.505859375, 14.13818359375, 14.7705078125, 15.40283203125, 16.03515625, 16.66748046875, 17.2998046875, 17.93212890625, 18.564453125, 19.19677734375, 19.8291015625, 20.46142578125, 21.09375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 6.0, 9.0, 8.0, 11.0, 19.0, 28.0, 33.0, 49.0, 74.0, 107.0, 161.0, 213.0, 312.0, 402.0, 655.0, 901.0, 1253.0, 1954.0, 3145.0, 4936.0, 8708.0, 18372.0, 45134.0, 158957.0, 499271.0, 202486.0, 55154.0, 20727.0, 10085.0, 5526.0, 3310.0, 2162.0, 1323.0, 912.0, 635.0, 434.0, 306.0, 227.0, 162.0, 120.0, 77.0, 52.0, 39.0, 39.0, 15.0, 13.0, 7.0, 9.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-44.90625, -43.43798828125, -41.9697265625, -40.50146484375, -39.033203125, -37.56494140625, -36.0966796875, -34.62841796875, -33.16015625, -31.69189453125, -30.2236328125, -28.75537109375, -27.287109375, -25.81884765625, -24.3505859375, -22.88232421875, -21.4140625, -19.94580078125, -18.4775390625, -17.00927734375, -15.541015625, -14.07275390625, -12.6044921875, -11.13623046875, -9.66796875, -8.19970703125, -6.7314453125, -5.26318359375, -3.794921875, -2.32666015625, -0.8583984375, 0.60986328125, 2.078125, 3.54638671875, 5.0146484375, 6.48291015625, 7.951171875, 9.41943359375, 10.8876953125, 12.35595703125, 13.82421875, 15.29248046875, 16.7607421875, 18.22900390625, 19.697265625, 21.16552734375, 22.6337890625, 24.10205078125, 25.5703125, 27.03857421875, 28.5068359375, 29.97509765625, 31.443359375, 32.91162109375, 34.3798828125, 35.84814453125, 37.31640625, 38.78466796875, 40.2529296875, 41.72119140625, 43.189453125, 44.65771484375, 46.1259765625, 47.59423828125, 49.0625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 9.0, 6.0, 2.0, 9.0, 8.0, 15.0, 20.0, 26.0, 51.0, 73.0, 110.0, 155.0, 132.0, 120.0, 82.0, 48.0, 31.0, 21.0, 16.0, 7.0, 7.0, 4.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.004055023193359375, -0.003932058811187744, -0.0038090944290161133, -0.0036861300468444824, -0.0035631656646728516, -0.0034402012825012207, -0.00331723690032959, -0.003194272518157959, -0.003071308135986328, -0.0029483437538146973, -0.0028253793716430664, -0.0027024149894714355, -0.0025794506072998047, -0.002456486225128174, -0.002333521842956543, -0.002210557460784912, -0.0020875930786132812, -0.0019646286964416504, -0.0018416643142700195, -0.0017186999320983887, -0.0015957355499267578, -0.001472771167755127, -0.001349806785583496, -0.0012268424034118652, -0.0011038780212402344, -0.0009809136390686035, -0.0008579492568969727, -0.0007349848747253418, -0.0006120204925537109, -0.0004890561103820801, -0.0003660917282104492, -0.00024312734603881836, -0.0001201629638671875, 2.8014183044433594e-06, 0.00012576580047607422, 0.0002487301826477051, 0.00037169456481933594, 0.0004946589469909668, 0.0006176233291625977, 0.0007405877113342285, 0.0008635520935058594, 0.0009865164756774902, 0.001109480857849121, 0.001232445240020752, 0.0013554096221923828, 0.0014783740043640137, 0.0016013383865356445, 0.0017243027687072754, 0.0018472671508789062, 0.001970231533050537, 0.002093195915222168, 0.002216160297393799, 0.0023391246795654297, 0.0024620890617370605, 0.0025850534439086914, 0.0027080178260803223, 0.002830982208251953, 0.002953946590423584, 0.003076910972595215, 0.0031998753547668457, 0.0033228397369384766, 0.0034458041191101074, 0.0035687685012817383, 0.003691732883453369, 0.003814697265625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 6.0, 20.0, 26.0, 53.0, 76.0, 126.0, 210.0, 350.0, 603.0, 1074.0, 1806.0, 3358.0, 6389.0, 13971.0, 36775.0, 115577.0, 333728.0, 344638.0, 122126.0, 38570.0, 14410.0, 6621.0, 3498.0, 1881.0, 1135.0, 614.0, 343.0, 225.0, 112.0, 71.0, 50.0, 30.0, 20.0, 15.0, 8.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.5625, -42.2021484375, -40.841796875, -39.4814453125, -38.12109375, -36.7607421875, -35.400390625, -34.0400390625, -32.6796875, -31.3193359375, -29.958984375, -28.5986328125, -27.23828125, -25.8779296875, -24.517578125, -23.1572265625, -21.796875, -20.4365234375, -19.076171875, -17.7158203125, -16.35546875, -14.9951171875, -13.634765625, -12.2744140625, -10.9140625, -9.5537109375, -8.193359375, -6.8330078125, -5.47265625, -4.1123046875, -2.751953125, -1.3916015625, -0.03125, 1.3291015625, 2.689453125, 4.0498046875, 5.41015625, 6.7705078125, 8.130859375, 9.4912109375, 10.8515625, 12.2119140625, 13.572265625, 14.9326171875, 16.29296875, 17.6533203125, 19.013671875, 20.3740234375, 21.734375, 23.0947265625, 24.455078125, 25.8154296875, 27.17578125, 28.5361328125, 29.896484375, 31.2568359375, 32.6171875, 33.9775390625, 35.337890625, 36.6982421875, 38.05859375, 39.4189453125, 40.779296875, 42.1396484375, 43.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 10.0, 2.0, 11.0, 12.0, 14.0, 11.0, 20.0, 27.0, 28.0, 48.0, 52.0, 81.0, 103.0, 86.0, 92.0, 77.0, 74.0, 62.0, 46.0, 47.0, 22.0, 17.0, 17.0, 11.0, 7.0, 5.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.5389404296875, -8.195068359375, -7.8511962890625, -7.50732421875, -7.1634521484375, -6.819580078125, -6.4757080078125, -6.1318359375, -5.7879638671875, -5.444091796875, -5.1002197265625, -4.75634765625, -4.4124755859375, -4.068603515625, -3.7247314453125, -3.380859375, -3.0369873046875, -2.693115234375, -2.3492431640625, -2.00537109375, -1.6614990234375, -1.317626953125, -0.9737548828125, -0.6298828125, -0.2860107421875, 0.057861328125, 0.4017333984375, 0.74560546875, 1.0894775390625, 1.433349609375, 1.7772216796875, 2.12109375, 2.4649658203125, 2.808837890625, 3.1527099609375, 3.49658203125, 3.8404541015625, 4.184326171875, 4.5281982421875, 4.8720703125, 5.2159423828125, 5.559814453125, 5.9036865234375, 6.24755859375, 6.5914306640625, 6.935302734375, 7.2791748046875, 7.623046875, 7.9669189453125, 8.310791015625, 8.6546630859375, 8.99853515625, 9.3424072265625, 9.686279296875, 10.0301513671875, 10.3740234375, 10.7178955078125, 11.061767578125, 11.4056396484375, 11.74951171875, 12.0933837890625, 12.437255859375, 12.7811279296875, 13.125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 5.0, 8.0, 3.0, 9.0, 10.0, 8.0, 10.0, 21.0, 25.0, 38.0, 36.0, 39.0, 45.0, 45.0, 54.0, 62.0, 60.0, 72.0, 57.0, 63.0, 66.0, 49.0, 42.0, 36.0, 20.0, 24.0, 22.0, 22.0, 16.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.1842155456543, -35.0134162902832, -33.84261703491211, -32.67182159423828, -31.501022338867188, -30.330223083496094, -29.159423828125, -27.988624572753906, -26.817827224731445, -25.64702796936035, -24.47623062133789, -23.305431365966797, -22.134632110595703, -20.963834762573242, -19.79303550720215, -18.622238159179688, -17.451438903808594, -16.2806396484375, -15.109842300415039, -13.939043045043945, -12.768244743347168, -11.59744644165039, -10.426647186279297, -9.25584888458252, -8.085050582885742, -6.914252281188965, -5.743453502655029, -4.572654724121094, -3.4018564224243164, -2.231058120727539, -1.0602593421936035, 0.11053943634033203, 1.2813339233398438, 2.4521324634552, 3.6229310035705566, 4.793729782104492, 5.9645280838012695, 7.135326385498047, 8.30612564086914, 9.476923942565918, 10.647722244262695, 11.818520545959473, 12.98931884765625, 14.160118103027344, 15.330916404724121, 16.5017147064209, 17.672513961791992, 18.843311309814453, 20.014110565185547, 21.18490982055664, 22.3557071685791, 23.526506423950195, 24.697303771972656, 25.86810302734375, 27.038902282714844, 28.209701538085938, 29.3804988861084, 30.551298141479492, 31.722095489501953, 32.89289474487305, 34.06369400024414, 35.23448944091797, 36.40528869628906, 37.576087951660156, 38.74688720703125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 12.0, 10.0, 11.0, 12.0, 11.0, 18.0, 24.0, 18.0, 12.0, 19.0, 32.0, 28.0, 33.0, 41.0, 29.0, 38.0, 36.0, 45.0, 41.0, 47.0, 60.0, 35.0, 34.0, 33.0, 34.0, 43.0, 28.0, 30.0, 27.0, 23.0, 13.0, 13.0, 19.0, 9.0, 21.0, 6.0, 10.0, 14.0, 7.0, 4.0, 2.0, 2.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-30.263290405273438, -29.37462043762207, -28.485952377319336, -27.59728240966797, -26.708614349365234, -25.819944381713867, -24.931276321411133, -24.042606353759766, -23.15393829345703, -22.265268325805664, -21.37660026550293, -20.487930297851562, -19.599262237548828, -18.71059226989746, -17.821924209594727, -16.93325424194336, -16.044586181640625, -15.155917167663574, -14.267248153686523, -13.378579139709473, -12.489910125732422, -11.601240158081055, -10.71257209777832, -9.823902130126953, -8.935232162475586, -8.046563148498535, -7.157894134521484, -6.269225120544434, -5.380556106567383, -4.491886615753174, -3.603217601776123, -2.7145485877990723, -1.8258800506591797, -0.9372109770774841, -0.048541903495788574, 0.8401272296905518, 1.7287962436676025, 2.6174654960632324, 3.506134510040283, 4.394803524017334, 5.283472537994385, 6.1721415519714355, 7.060810565948486, 7.949480056762695, 8.838149070739746, 9.726818084716797, 10.615487098693848, 11.504156112670898, 12.39282512664795, 13.281494140625, 14.17016315460205, 15.058832168579102, 15.947501182556152, 16.836170196533203, 17.72484016418457, 18.613508224487305, 19.502178192138672, 20.39084815979004, 21.279516220092773, 22.16818618774414, 23.056854248046875, 23.945524215698242, 24.834192276000977, 25.722862243652344, 26.611530303955078]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 10.0, 12.0, 17.0, 34.0, 44.0, 53.0, 109.0, 148.0, 246.0, 385.0, 629.0, 1233.0, 2072.0, 3737.0, 6860.0, 12526.0, 22583.0, 42165.0, 77115.0, 132199.0, 196563.0, 205253.0, 148819.0, 88658.0, 48857.0, 26171.0, 14276.0, 7855.0, 4309.0, 2354.0, 1369.0, 759.0, 469.0, 251.0, 143.0, 102.0, 55.0, 30.0, 29.0, 30.0, 14.0, 14.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.75, -49.119140625, -47.48828125, -45.857421875, -44.2265625, -42.595703125, -40.96484375, -39.333984375, -37.703125, -36.072265625, -34.44140625, -32.810546875, -31.1796875, -29.548828125, -27.91796875, -26.287109375, -24.65625, -23.025390625, -21.39453125, -19.763671875, -18.1328125, -16.501953125, -14.87109375, -13.240234375, -11.609375, -9.978515625, -8.34765625, -6.716796875, -5.0859375, -3.455078125, -1.82421875, -0.193359375, 1.4375, 3.068359375, 4.69921875, 6.330078125, 7.9609375, 9.591796875, 11.22265625, 12.853515625, 14.484375, 16.115234375, 17.74609375, 19.376953125, 21.0078125, 22.638671875, 24.26953125, 25.900390625, 27.53125, 29.162109375, 30.79296875, 32.423828125, 34.0546875, 35.685546875, 37.31640625, 38.947265625, 40.578125, 42.208984375, 43.83984375, 45.470703125, 47.1015625, 48.732421875, 50.36328125, 51.994140625, 53.625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 10.0, 10.0, 10.0, 9.0, 13.0, 23.0, 12.0, 18.0, 25.0, 18.0, 27.0, 36.0, 40.0, 45.0, 39.0, 39.0, 50.0, 44.0, 47.0, 40.0, 42.0, 33.0, 32.0, 37.0, 37.0, 37.0, 28.0, 23.0, 15.0, 28.0, 18.0, 13.0, 10.0, 15.0, 10.0, 12.0, 13.0, 7.0, 5.0, 4.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.90625, -23.09521484375, -22.2841796875, -21.47314453125, -20.662109375, -19.85107421875, -19.0400390625, -18.22900390625, -17.41796875, -16.60693359375, -15.7958984375, -14.98486328125, -14.173828125, -13.36279296875, -12.5517578125, -11.74072265625, -10.9296875, -10.11865234375, -9.3076171875, -8.49658203125, -7.685546875, -6.87451171875, -6.0634765625, -5.25244140625, -4.44140625, -3.63037109375, -2.8193359375, -2.00830078125, -1.197265625, -0.38623046875, 0.4248046875, 1.23583984375, 2.046875, 2.85791015625, 3.6689453125, 4.47998046875, 5.291015625, 6.10205078125, 6.9130859375, 7.72412109375, 8.53515625, 9.34619140625, 10.1572265625, 10.96826171875, 11.779296875, 12.59033203125, 13.4013671875, 14.21240234375, 15.0234375, 15.83447265625, 16.6455078125, 17.45654296875, 18.267578125, 19.07861328125, 19.8896484375, 20.70068359375, 21.51171875, 22.32275390625, 23.1337890625, 23.94482421875, 24.755859375, 25.56689453125, 26.3779296875, 27.18896484375, 28.0]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 9.0, 11.0, 14.0, 26.0, 43.0, 50.0, 65.0, 113.0, 182.0, 240.0, 383.0, 525.0, 830.0, 1275.0, 1849.0, 2827.0, 4277.0, 6741.0, 10153.0, 15625.0, 24287.0, 36858.0, 56354.0, 82826.0, 115327.0, 142103.0, 146501.0, 124229.0, 91796.0, 63134.0, 41867.0, 27285.0, 17552.0, 11273.0, 7538.0, 4844.0, 3155.0, 2112.0, 1343.0, 976.0, 668.0, 451.0, 286.0, 184.0, 130.0, 76.0, 39.0, 46.0, 33.0, 18.0, 15.0, 8.0, 3.0, 0.0, 3.0, 1.0, 5.0], "bins": [-33.375, -32.367919921875, -31.36083984375, -30.353759765625, -29.3466796875, -28.339599609375, -27.33251953125, -26.325439453125, -25.318359375, -24.311279296875, -23.30419921875, -22.297119140625, -21.2900390625, -20.282958984375, -19.27587890625, -18.268798828125, -17.26171875, -16.254638671875, -15.24755859375, -14.240478515625, -13.2333984375, -12.226318359375, -11.21923828125, -10.212158203125, -9.205078125, -8.197998046875, -7.19091796875, -6.183837890625, -5.1767578125, -4.169677734375, -3.16259765625, -2.155517578125, -1.1484375, -0.141357421875, 0.86572265625, 1.872802734375, 2.8798828125, 3.886962890625, 4.89404296875, 5.901123046875, 6.908203125, 7.915283203125, 8.92236328125, 9.929443359375, 10.9365234375, 11.943603515625, 12.95068359375, 13.957763671875, 14.96484375, 15.971923828125, 16.97900390625, 17.986083984375, 18.9931640625, 20.000244140625, 21.00732421875, 22.014404296875, 23.021484375, 24.028564453125, 25.03564453125, 26.042724609375, 27.0498046875, 28.056884765625, 29.06396484375, 30.071044921875, 31.078125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 6.0, 9.0, 9.0, 13.0, 10.0, 18.0, 23.0, 26.0, 30.0, 25.0, 32.0, 29.0, 33.0, 41.0, 32.0, 46.0, 53.0, 51.0, 49.0, 45.0, 30.0, 37.0, 42.0, 50.0, 36.0, 40.0, 34.0, 21.0, 19.0, 15.0, 15.0, 18.0, 9.0, 15.0, 9.0, 5.0, 11.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.25, -18.64208984375, -18.0341796875, -17.42626953125, -16.818359375, -16.21044921875, -15.6025390625, -14.99462890625, -14.38671875, -13.77880859375, -13.1708984375, -12.56298828125, -11.955078125, -11.34716796875, -10.7392578125, -10.13134765625, -9.5234375, -8.91552734375, -8.3076171875, -7.69970703125, -7.091796875, -6.48388671875, -5.8759765625, -5.26806640625, -4.66015625, -4.05224609375, -3.4443359375, -2.83642578125, -2.228515625, -1.62060546875, -1.0126953125, -0.40478515625, 0.203125, 0.81103515625, 1.4189453125, 2.02685546875, 2.634765625, 3.24267578125, 3.8505859375, 4.45849609375, 5.06640625, 5.67431640625, 6.2822265625, 6.89013671875, 7.498046875, 8.10595703125, 8.7138671875, 9.32177734375, 9.9296875, 10.53759765625, 11.1455078125, 11.75341796875, 12.361328125, 12.96923828125, 13.5771484375, 14.18505859375, 14.79296875, 15.40087890625, 16.0087890625, 16.61669921875, 17.224609375, 17.83251953125, 18.4404296875, 19.04833984375, 19.65625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 10.0, 30.0, 29.0, 58.0, 70.0, 110.0, 165.0, 260.0, 406.0, 590.0, 864.0, 1496.0, 2345.0, 3779.0, 6262.0, 10702.0, 19060.0, 34165.0, 65331.0, 128135.0, 227584.0, 241200.0, 143637.0, 73256.0, 38184.0, 20859.0, 11842.0, 6944.0, 4199.0, 2573.0, 1573.0, 1019.0, 632.0, 405.0, 245.0, 172.0, 105.0, 78.0, 60.0, 32.0, 23.0, 23.0, 8.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-31.609375, -30.624267578125, -29.63916015625, -28.654052734375, -27.6689453125, -26.683837890625, -25.69873046875, -24.713623046875, -23.728515625, -22.743408203125, -21.75830078125, -20.773193359375, -19.7880859375, -18.802978515625, -17.81787109375, -16.832763671875, -15.84765625, -14.862548828125, -13.87744140625, -12.892333984375, -11.9072265625, -10.922119140625, -9.93701171875, -8.951904296875, -7.966796875, -6.981689453125, -5.99658203125, -5.011474609375, -4.0263671875, -3.041259765625, -2.05615234375, -1.071044921875, -0.0859375, 0.899169921875, 1.88427734375, 2.869384765625, 3.8544921875, 4.839599609375, 5.82470703125, 6.809814453125, 7.794921875, 8.780029296875, 9.76513671875, 10.750244140625, 11.7353515625, 12.720458984375, 13.70556640625, 14.690673828125, 15.67578125, 16.660888671875, 17.64599609375, 18.631103515625, 19.6162109375, 20.601318359375, 21.58642578125, 22.571533203125, 23.556640625, 24.541748046875, 25.52685546875, 26.511962890625, 27.4970703125, 28.482177734375, 29.46728515625, 30.452392578125, 31.4375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 10.0, 7.0, 12.0, 17.0, 15.0, 17.0, 23.0, 39.0, 40.0, 46.0, 65.0, 71.0, 65.0, 71.0, 70.0, 73.0, 73.0, 49.0, 49.0, 38.0, 24.0, 23.0, 9.0, 19.0, 13.0, 10.0, 11.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002910614013671875, -0.002819061279296875, -0.002727508544921875, -0.002635955810546875, -0.002544403076171875, -0.002452850341796875, -0.002361297607421875, -0.002269744873046875, -0.002178192138671875, -0.002086639404296875, -0.001995086669921875, -0.001903533935546875, -0.001811981201171875, -0.001720428466796875, -0.001628875732421875, -0.001537322998046875, -0.001445770263671875, -0.001354217529296875, -0.001262664794921875, -0.001171112060546875, -0.001079559326171875, -0.000988006591796875, -0.000896453857421875, -0.000804901123046875, -0.000713348388671875, -0.000621795654296875, -0.000530242919921875, -0.000438690185546875, -0.000347137451171875, -0.000255584716796875, -0.000164031982421875, -7.2479248046875e-05, 1.9073486328125e-05, 0.000110626220703125, 0.000202178955078125, 0.000293731689453125, 0.000385284423828125, 0.000476837158203125, 0.000568389892578125, 0.000659942626953125, 0.000751495361328125, 0.000843048095703125, 0.000934600830078125, 0.001026153564453125, 0.001117706298828125, 0.001209259033203125, 0.001300811767578125, 0.001392364501953125, 0.001483917236328125, 0.001575469970703125, 0.001667022705078125, 0.001758575439453125, 0.001850128173828125, 0.001941680908203125, 0.002033233642578125, 0.002124786376953125, 0.002216339111328125, 0.002307891845703125, 0.002399444580078125, 0.002490997314453125, 0.002582550048828125, 0.002674102783203125, 0.002765655517578125, 0.002857208251953125, 0.002948760986328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 3.0, 7.0, 11.0, 25.0, 25.0, 30.0, 45.0, 55.0, 89.0, 156.0, 216.0, 296.0, 476.0, 751.0, 1073.0, 1798.0, 3001.0, 4828.0, 8299.0, 15280.0, 29221.0, 59803.0, 125905.0, 241303.0, 263066.0, 147400.0, 70518.0, 33623.0, 17496.0, 9493.0, 5405.0, 3328.0, 1963.0, 1244.0, 743.0, 541.0, 338.0, 220.0, 159.0, 117.0, 81.0, 44.0, 21.0, 22.0, 9.0, 10.0, 4.0, 4.0, 11.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.953125, -28.887451171875, -27.82177734375, -26.756103515625, -25.6904296875, -24.624755859375, -23.55908203125, -22.493408203125, -21.427734375, -20.362060546875, -19.29638671875, -18.230712890625, -17.1650390625, -16.099365234375, -15.03369140625, -13.968017578125, -12.90234375, -11.836669921875, -10.77099609375, -9.705322265625, -8.6396484375, -7.573974609375, -6.50830078125, -5.442626953125, -4.376953125, -3.311279296875, -2.24560546875, -1.179931640625, -0.1142578125, 0.951416015625, 2.01708984375, 3.082763671875, 4.1484375, 5.214111328125, 6.27978515625, 7.345458984375, 8.4111328125, 9.476806640625, 10.54248046875, 11.608154296875, 12.673828125, 13.739501953125, 14.80517578125, 15.870849609375, 16.9365234375, 18.002197265625, 19.06787109375, 20.133544921875, 21.19921875, 22.264892578125, 23.33056640625, 24.396240234375, 25.4619140625, 26.527587890625, 27.59326171875, 28.658935546875, 29.724609375, 30.790283203125, 31.85595703125, 32.921630859375, 33.9873046875, 35.052978515625, 36.11865234375, 37.184326171875, 38.25]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 7.0, 6.0, 9.0, 22.0, 14.0, 43.0, 50.0, 60.0, 75.0, 101.0, 120.0, 97.0, 84.0, 76.0, 57.0, 45.0, 37.0, 18.0, 21.0, 19.0, 7.0, 7.0, 4.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.4375, -15.982177734375, -15.52685546875, -15.071533203125, -14.6162109375, -14.160888671875, -13.70556640625, -13.250244140625, -12.794921875, -12.339599609375, -11.88427734375, -11.428955078125, -10.9736328125, -10.518310546875, -10.06298828125, -9.607666015625, -9.15234375, -8.697021484375, -8.24169921875, -7.786376953125, -7.3310546875, -6.875732421875, -6.42041015625, -5.965087890625, -5.509765625, -5.054443359375, -4.59912109375, -4.143798828125, -3.6884765625, -3.233154296875, -2.77783203125, -2.322509765625, -1.8671875, -1.411865234375, -0.95654296875, -0.501220703125, -0.0458984375, 0.409423828125, 0.86474609375, 1.320068359375, 1.775390625, 2.230712890625, 2.68603515625, 3.141357421875, 3.5966796875, 4.052001953125, 4.50732421875, 4.962646484375, 5.41796875, 5.873291015625, 6.32861328125, 6.783935546875, 7.2392578125, 7.694580078125, 8.14990234375, 8.605224609375, 9.060546875, 9.515869140625, 9.97119140625, 10.426513671875, 10.8818359375, 11.337158203125, 11.79248046875, 12.247802734375, 12.703125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 13.0, 7.0, 6.0, 10.0, 20.0, 17.0, 28.0, 28.0, 29.0, 35.0, 32.0, 32.0, 47.0, 54.0, 53.0, 56.0, 59.0, 46.0, 58.0, 54.0, 41.0, 39.0, 48.0, 30.0, 22.0, 22.0, 15.0, 18.0, 13.0, 5.0, 10.0, 10.0, 8.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-28.695228576660156, -27.745759963989258, -26.796293258666992, -25.846824645996094, -24.897357940673828, -23.94788932800293, -22.998422622680664, -22.048954010009766, -21.0994873046875, -20.1500186920166, -19.200551986694336, -18.251083374023438, -17.301616668701172, -16.352148056030273, -15.402681350708008, -14.45321273803711, -13.503745079040527, -12.554277420043945, -11.604809761047363, -10.655342102050781, -9.7058744430542, -8.756406784057617, -7.806938648223877, -6.857470989227295, -5.908003330230713, -4.958535671234131, -4.009068012237549, -3.0596001148223877, -2.1101324558258057, -1.1606645584106445, -0.2111968994140625, 0.7382707595825195, 1.6877384185791016, 2.6372060775756836, 3.5866737365722656, 4.536141395568848, 5.48560905456543, 6.43507719039917, 7.384544849395752, 8.334012985229492, 9.283479690551758, 10.23294734954834, 11.182415008544922, 12.131882667541504, 13.081350326538086, 14.030818939208984, 14.98028564453125, 15.929754257202148, 16.879222869873047, 17.828691482543945, 18.77815818786621, 19.72762680053711, 20.677093505859375, 21.626562118530273, 22.57602882385254, 23.525497436523438, 24.474964141845703, 25.4244327545166, 26.373899459838867, 27.323368072509766, 28.27283477783203, 29.22230339050293, 30.171770095825195, 31.121238708496094, 32.07070541381836]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 8.0, 7.0, 11.0, 12.0, 18.0, 7.0, 21.0, 28.0, 24.0, 28.0, 29.0, 31.0, 36.0, 38.0, 23.0, 34.0, 42.0, 36.0, 31.0, 43.0, 34.0, 50.0, 33.0, 46.0, 41.0, 27.0, 29.0, 42.0, 28.0, 25.0, 17.0, 19.0, 18.0, 16.0, 14.0, 10.0, 3.0, 8.0, 6.0, 3.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.04069709777832, -26.171142578125, -25.30158805847168, -24.43203353881836, -23.562477111816406, -22.69292449951172, -21.823368072509766, -20.953813552856445, -20.084259033203125, -19.214704513549805, -18.345149993896484, -17.475595474243164, -16.606040954589844, -15.736485481262207, -14.86693000793457, -13.99737548828125, -13.12782096862793, -12.25826644897461, -11.388711929321289, -10.519156455993652, -9.649601936340332, -8.780047416687012, -7.910492420196533, -7.040937423706055, -6.171382904052734, -5.301828384399414, -4.4322733879089355, -3.562718629837036, -2.6931638717651367, -1.8236093521118164, -0.9540543556213379, -0.08449935913085938, 0.7850532531738281, 1.6546080112457275, 2.524162769317627, 3.3937175273895264, 4.263272285461426, 5.132826805114746, 6.002381801605225, 6.871936798095703, 7.741491317749023, 8.611045837402344, 9.480600357055664, 10.3501558303833, 11.219710350036621, 12.089264869689941, 12.958820343017578, 13.828374862670898, 14.697929382324219, 15.567483901977539, 16.43703842163086, 17.30659294128418, 18.1761474609375, 19.045703887939453, 19.915258407592773, 20.784812927246094, 21.654367446899414, 22.523921966552734, 23.393476486206055, 24.263031005859375, 25.132587432861328, 26.002140045166016, 26.87169647216797, 27.74125099182129, 28.61080551147461]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 7.0, 13.0, 23.0, 43.0, 62.0, 59.0, 132.0, 158.0, 244.0, 368.0, 502.0, 779.0, 1131.0, 1789.0, 2623.0, 4073.0, 6447.0, 10273.0, 16601.0, 27857.0, 48004.0, 86112.0, 166367.0, 353826.0, 760560.0, 1105716.0, 817969.0, 389793.0, 179536.0, 90582.0, 49403.0, 28314.0, 16822.0, 10228.0, 6476.0, 4001.0, 2612.0, 1592.0, 1040.0, 770.0, 434.0, 344.0, 197.0, 122.0, 102.0, 68.0, 42.0, 30.0, 17.0, 10.0, 6.0, 5.0, 0.0, 4.0], "bins": [-33.78125, -32.8310546875, -31.880859375, -30.9306640625, -29.98046875, -29.0302734375, -28.080078125, -27.1298828125, -26.1796875, -25.2294921875, -24.279296875, -23.3291015625, -22.37890625, -21.4287109375, -20.478515625, -19.5283203125, -18.578125, -17.6279296875, -16.677734375, -15.7275390625, -14.77734375, -13.8271484375, -12.876953125, -11.9267578125, -10.9765625, -10.0263671875, -9.076171875, -8.1259765625, -7.17578125, -6.2255859375, -5.275390625, -4.3251953125, -3.375, -2.4248046875, -1.474609375, -0.5244140625, 0.42578125, 1.3759765625, 2.326171875, 3.2763671875, 4.2265625, 5.1767578125, 6.126953125, 7.0771484375, 8.02734375, 8.9775390625, 9.927734375, 10.8779296875, 11.828125, 12.7783203125, 13.728515625, 14.6787109375, 15.62890625, 16.5791015625, 17.529296875, 18.4794921875, 19.4296875, 20.3798828125, 21.330078125, 22.2802734375, 23.23046875, 24.1806640625, 25.130859375, 26.0810546875, 27.03125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 8.0, 8.0, 17.0, 21.0, 18.0, 11.0, 22.0, 25.0, 19.0, 20.0, 36.0, 37.0, 37.0, 42.0, 37.0, 32.0, 39.0, 47.0, 37.0, 35.0, 58.0, 39.0, 42.0, 33.0, 29.0, 33.0, 27.0, 36.0, 24.0, 19.0, 14.0, 19.0, 9.0, 17.0, 8.0, 7.0, 6.0, 9.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.38330078125, -18.7822265625, -18.18115234375, -17.580078125, -16.97900390625, -16.3779296875, -15.77685546875, -15.17578125, -14.57470703125, -13.9736328125, -13.37255859375, -12.771484375, -12.17041015625, -11.5693359375, -10.96826171875, -10.3671875, -9.76611328125, -9.1650390625, -8.56396484375, -7.962890625, -7.36181640625, -6.7607421875, -6.15966796875, -5.55859375, -4.95751953125, -4.3564453125, -3.75537109375, -3.154296875, -2.55322265625, -1.9521484375, -1.35107421875, -0.75, -0.14892578125, 0.4521484375, 1.05322265625, 1.654296875, 2.25537109375, 2.8564453125, 3.45751953125, 4.05859375, 4.65966796875, 5.2607421875, 5.86181640625, 6.462890625, 7.06396484375, 7.6650390625, 8.26611328125, 8.8671875, 9.46826171875, 10.0693359375, 10.67041015625, 11.271484375, 11.87255859375, 12.4736328125, 13.07470703125, 13.67578125, 14.27685546875, 14.8779296875, 15.47900390625, 16.080078125, 16.68115234375, 17.2822265625, 17.88330078125, 18.484375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 7.0, 8.0, 22.0, 21.0, 38.0, 67.0, 119.0, 152.0, 250.0, 371.0, 533.0, 838.0, 1258.0, 1825.0, 2897.0, 4563.0, 7433.0, 12340.0, 21072.0, 35952.0, 64460.0, 118962.0, 226504.0, 439647.0, 803748.0, 1009987.0, 674667.0, 355172.0, 183734.0, 97283.0, 53682.0, 30527.0, 17777.0, 10702.0, 6321.0, 4009.0, 2494.0, 1613.0, 1050.0, 719.0, 470.0, 290.0, 223.0, 151.0, 99.0, 88.0, 38.0, 32.0, 22.0, 10.0, 11.0, 9.0, 7.0, 2.0, 6.0, 2.0, 2.0], "bins": [-31.09375, -30.13232421875, -29.1708984375, -28.20947265625, -27.248046875, -26.28662109375, -25.3251953125, -24.36376953125, -23.40234375, -22.44091796875, -21.4794921875, -20.51806640625, -19.556640625, -18.59521484375, -17.6337890625, -16.67236328125, -15.7109375, -14.74951171875, -13.7880859375, -12.82666015625, -11.865234375, -10.90380859375, -9.9423828125, -8.98095703125, -8.01953125, -7.05810546875, -6.0966796875, -5.13525390625, -4.173828125, -3.21240234375, -2.2509765625, -1.28955078125, -0.328125, 0.63330078125, 1.5947265625, 2.55615234375, 3.517578125, 4.47900390625, 5.4404296875, 6.40185546875, 7.36328125, 8.32470703125, 9.2861328125, 10.24755859375, 11.208984375, 12.17041015625, 13.1318359375, 14.09326171875, 15.0546875, 16.01611328125, 16.9775390625, 17.93896484375, 18.900390625, 19.86181640625, 20.8232421875, 21.78466796875, 22.74609375, 23.70751953125, 24.6689453125, 25.63037109375, 26.591796875, 27.55322265625, 28.5146484375, 29.47607421875, 30.4375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 9.0, 7.0, 13.0, 14.0, 12.0, 21.0, 22.0, 39.0, 37.0, 53.0, 79.0, 89.0, 105.0, 166.0, 168.0, 175.0, 240.0, 302.0, 325.0, 349.0, 297.0, 268.0, 216.0, 201.0, 163.0, 166.0, 112.0, 104.0, 76.0, 54.0, 39.0, 32.0, 29.0, 16.0, 18.0, 9.0, 15.0, 4.0, 5.0, 6.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5234375, -11.14599609375, -10.7685546875, -10.39111328125, -10.013671875, -9.63623046875, -9.2587890625, -8.88134765625, -8.50390625, -8.12646484375, -7.7490234375, -7.37158203125, -6.994140625, -6.61669921875, -6.2392578125, -5.86181640625, -5.484375, -5.10693359375, -4.7294921875, -4.35205078125, -3.974609375, -3.59716796875, -3.2197265625, -2.84228515625, -2.46484375, -2.08740234375, -1.7099609375, -1.33251953125, -0.955078125, -0.57763671875, -0.2001953125, 0.17724609375, 0.5546875, 0.93212890625, 1.3095703125, 1.68701171875, 2.064453125, 2.44189453125, 2.8193359375, 3.19677734375, 3.57421875, 3.95166015625, 4.3291015625, 4.70654296875, 5.083984375, 5.46142578125, 5.8388671875, 6.21630859375, 6.59375, 6.97119140625, 7.3486328125, 7.72607421875, 8.103515625, 8.48095703125, 8.8583984375, 9.23583984375, 9.61328125, 9.99072265625, 10.3681640625, 10.74560546875, 11.123046875, 11.50048828125, 11.8779296875, 12.25537109375, 12.6328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 11.0, 14.0, 9.0, 20.0, 18.0, 24.0, 28.0, 27.0, 39.0, 36.0, 56.0, 44.0, 53.0, 49.0, 56.0, 56.0, 55.0, 52.0, 50.0, 45.0, 45.0, 32.0, 28.0, 23.0, 20.0, 20.0, 12.0, 10.0, 5.0, 13.0, 4.0, 8.0, 8.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-32.94244384765625, -32.026336669921875, -31.110227584838867, -30.19411849975586, -29.278011322021484, -28.361902236938477, -27.44579315185547, -26.529685974121094, -25.613576889038086, -24.697467803955078, -23.781360626220703, -22.865251541137695, -21.949142456054688, -21.033035278320312, -20.116926193237305, -19.200817108154297, -18.284709930419922, -17.368600845336914, -16.45249366760254, -15.536384582519531, -14.62027645111084, -13.704168319702148, -12.78805923461914, -11.87195110321045, -10.955842971801758, -10.039734840393066, -9.123626708984375, -8.207517623901367, -7.291409492492676, -6.375301361083984, -5.459192752838135, -4.543084144592285, -3.626974105834961, -2.7108657360076904, -1.79475736618042, -0.8786489963531494, 0.037459373474121094, 0.9535675048828125, 1.869676113128662, 2.7857847213745117, 3.701892852783203, 4.6180009841918945, 5.534109592437744, 6.450218200683594, 7.366326332092285, 8.282434463500977, 9.198543548583984, 10.114651679992676, 11.030759811401367, 11.946867942810059, 12.86297607421875, 13.779085159301758, 14.69519329071045, 15.61130142211914, 16.52741050720215, 17.443519592285156, 18.35962677001953, 19.27573585510254, 20.191843032836914, 21.107952117919922, 22.024059295654297, 22.940168380737305, 23.856277465820312, 24.772384643554688, 25.688493728637695]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 5.0, 6.0, 9.0, 8.0, 10.0, 7.0, 13.0, 9.0, 14.0, 17.0, 24.0, 18.0, 15.0, 19.0, 25.0, 28.0, 36.0, 36.0, 34.0, 37.0, 44.0, 38.0, 29.0, 34.0, 34.0, 43.0, 46.0, 42.0, 26.0, 33.0, 24.0, 25.0, 19.0, 25.0, 24.0, 17.0, 13.0, 19.0, 14.0, 15.0, 7.0, 9.0, 14.0, 7.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.238008499145508, -23.473983764648438, -22.7099609375, -21.94593620300293, -21.18191146850586, -20.41788673400879, -19.65386199951172, -18.88983917236328, -18.12581443786621, -17.36178970336914, -16.597766876220703, -15.833742141723633, -15.069717407226562, -14.305692672729492, -13.541668891906738, -12.777645111083984, -12.013620376586914, -11.249595642089844, -10.48557186126709, -9.721548080444336, -8.957523345947266, -8.193498611450195, -7.429474830627441, -6.665450572967529, -5.901426315307617, -5.137402057647705, -4.373377799987793, -3.609353542327881, -2.8453292846679688, -2.0813050270080566, -1.3172807693481445, -0.5532565116882324, 0.2107696533203125, 0.9747939109802246, 1.7388181686401367, 2.502842426300049, 3.266866683959961, 4.030890941619873, 4.794915199279785, 5.558939456939697, 6.322963714599609, 7.0869879722595215, 7.851012229919434, 8.615036010742188, 9.379060745239258, 10.143085479736328, 10.907109260559082, 11.671133041381836, 12.435157775878906, 13.199182510375977, 13.96320629119873, 14.727230072021484, 15.491254806518555, 16.255279541015625, 17.019302368164062, 17.783327102661133, 18.547351837158203, 19.311376571655273, 20.075401306152344, 20.83942413330078, 21.60344886779785, 22.367473602294922, 23.13149642944336, 23.89552116394043, 24.6595458984375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 9.0, 8.0, 10.0, 26.0, 24.0, 45.0, 55.0, 78.0, 134.0, 202.0, 314.0, 426.0, 674.0, 1000.0, 1470.0, 2185.0, 3453.0, 5416.0, 8505.0, 14178.0, 23495.0, 40416.0, 71634.0, 127461.0, 200170.0, 210690.0, 141321.0, 80729.0, 45499.0, 26478.0, 15654.0, 9691.0, 5938.0, 3927.0, 2446.0, 1631.0, 1085.0, 690.0, 460.0, 303.0, 195.0, 122.0, 102.0, 66.0, 56.0, 32.0, 17.0, 12.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.0, -32.94091796875, -31.8818359375, -30.82275390625, -29.763671875, -28.70458984375, -27.6455078125, -26.58642578125, -25.52734375, -24.46826171875, -23.4091796875, -22.35009765625, -21.291015625, -20.23193359375, -19.1728515625, -18.11376953125, -17.0546875, -15.99560546875, -14.9365234375, -13.87744140625, -12.818359375, -11.75927734375, -10.7001953125, -9.64111328125, -8.58203125, -7.52294921875, -6.4638671875, -5.40478515625, -4.345703125, -3.28662109375, -2.2275390625, -1.16845703125, -0.109375, 0.94970703125, 2.0087890625, 3.06787109375, 4.126953125, 5.18603515625, 6.2451171875, 7.30419921875, 8.36328125, 9.42236328125, 10.4814453125, 11.54052734375, 12.599609375, 13.65869140625, 14.7177734375, 15.77685546875, 16.8359375, 17.89501953125, 18.9541015625, 20.01318359375, 21.072265625, 22.13134765625, 23.1904296875, 24.24951171875, 25.30859375, 26.36767578125, 27.4267578125, 28.48583984375, 29.544921875, 30.60400390625, 31.6630859375, 32.72216796875, 33.78125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 4.0, 7.0, 6.0, 9.0, 13.0, 14.0, 8.0, 9.0, 17.0, 21.0, 26.0, 15.0, 26.0, 26.0, 24.0, 32.0, 32.0, 38.0, 48.0, 39.0, 34.0, 34.0, 24.0, 43.0, 60.0, 43.0, 38.0, 28.0, 26.0, 31.0, 24.0, 19.0, 24.0, 25.0, 13.0, 13.0, 11.0, 15.0, 9.0, 6.0, 11.0, 10.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.203125, -22.439208984375, -21.67529296875, -20.911376953125, -20.1474609375, -19.383544921875, -18.61962890625, -17.855712890625, -17.091796875, -16.327880859375, -15.56396484375, -14.800048828125, -14.0361328125, -13.272216796875, -12.50830078125, -11.744384765625, -10.98046875, -10.216552734375, -9.45263671875, -8.688720703125, -7.9248046875, -7.160888671875, -6.39697265625, -5.633056640625, -4.869140625, -4.105224609375, -3.34130859375, -2.577392578125, -1.8134765625, -1.049560546875, -0.28564453125, 0.478271484375, 1.2421875, 2.006103515625, 2.77001953125, 3.533935546875, 4.2978515625, 5.061767578125, 5.82568359375, 6.589599609375, 7.353515625, 8.117431640625, 8.88134765625, 9.645263671875, 10.4091796875, 11.173095703125, 11.93701171875, 12.700927734375, 13.46484375, 14.228759765625, 14.99267578125, 15.756591796875, 16.5205078125, 17.284423828125, 18.04833984375, 18.812255859375, 19.576171875, 20.340087890625, 21.10400390625, 21.867919921875, 22.6318359375, 23.395751953125, 24.15966796875, 24.923583984375, 25.6875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 10.0, 11.0, 13.0, 18.0, 24.0, 27.0, 47.0, 67.0, 102.0, 136.0, 174.0, 240.0, 365.0, 553.0, 787.0, 1148.0, 1964.0, 2883.0, 4853.0, 8771.0, 16792.0, 36609.0, 93884.0, 271205.0, 364846.0, 141723.0, 51611.0, 22245.0, 11003.0, 6198.0, 3607.0, 2197.0, 1440.0, 957.0, 620.0, 432.0, 303.0, 190.0, 157.0, 110.0, 76.0, 42.0, 37.0, 30.0, 17.0, 21.0, 6.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-58.28125, -56.525390625, -54.76953125, -53.013671875, -51.2578125, -49.501953125, -47.74609375, -45.990234375, -44.234375, -42.478515625, -40.72265625, -38.966796875, -37.2109375, -35.455078125, -33.69921875, -31.943359375, -30.1875, -28.431640625, -26.67578125, -24.919921875, -23.1640625, -21.408203125, -19.65234375, -17.896484375, -16.140625, -14.384765625, -12.62890625, -10.873046875, -9.1171875, -7.361328125, -5.60546875, -3.849609375, -2.09375, -0.337890625, 1.41796875, 3.173828125, 4.9296875, 6.685546875, 8.44140625, 10.197265625, 11.953125, 13.708984375, 15.46484375, 17.220703125, 18.9765625, 20.732421875, 22.48828125, 24.244140625, 26.0, 27.755859375, 29.51171875, 31.267578125, 33.0234375, 34.779296875, 36.53515625, 38.291015625, 40.046875, 41.802734375, 43.55859375, 45.314453125, 47.0703125, 48.826171875, 50.58203125, 52.337890625, 54.09375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 6.0, 13.0, 14.0, 8.0, 15.0, 10.0, 18.0, 13.0, 13.0, 23.0, 20.0, 30.0, 35.0, 44.0, 25.0, 34.0, 41.0, 37.0, 43.0, 49.0, 38.0, 34.0, 41.0, 44.0, 34.0, 16.0, 39.0, 26.0, 33.0, 28.0, 25.0, 22.0, 21.0, 17.0, 17.0, 16.0, 10.0, 9.0, 7.0, 11.0, 3.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.875, -14.3944091796875, -13.913818359375, -13.4332275390625, -12.95263671875, -12.4720458984375, -11.991455078125, -11.5108642578125, -11.0302734375, -10.5496826171875, -10.069091796875, -9.5885009765625, -9.10791015625, -8.6273193359375, -8.146728515625, -7.6661376953125, -7.185546875, -6.7049560546875, -6.224365234375, -5.7437744140625, -5.26318359375, -4.7825927734375, -4.302001953125, -3.8214111328125, -3.3408203125, -2.8602294921875, -2.379638671875, -1.8990478515625, -1.41845703125, -0.9378662109375, -0.457275390625, 0.0233154296875, 0.50390625, 0.9844970703125, 1.465087890625, 1.9456787109375, 2.42626953125, 2.9068603515625, 3.387451171875, 3.8680419921875, 4.3486328125, 4.8292236328125, 5.309814453125, 5.7904052734375, 6.27099609375, 6.7515869140625, 7.232177734375, 7.7127685546875, 8.193359375, 8.6739501953125, 9.154541015625, 9.6351318359375, 10.11572265625, 10.5963134765625, 11.076904296875, 11.5574951171875, 12.0380859375, 12.5186767578125, 12.999267578125, 13.4798583984375, 13.96044921875, 14.4410400390625, 14.921630859375, 15.4022216796875, 15.8828125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 11.0, 21.0, 18.0, 29.0, 33.0, 55.0, 74.0, 89.0, 127.0, 169.0, 291.0, 399.0, 626.0, 894.0, 1480.0, 2274.0, 3906.0, 7191.0, 13999.0, 31392.0, 81848.0, 251586.0, 404664.0, 150164.0, 51526.0, 21201.0, 10288.0, 5509.0, 3170.0, 1925.0, 1153.0, 789.0, 484.0, 358.0, 237.0, 168.0, 118.0, 71.0, 63.0, 46.0, 25.0, 21.0, 15.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-23.28125, -22.536865234375, -21.79248046875, -21.048095703125, -20.3037109375, -19.559326171875, -18.81494140625, -18.070556640625, -17.326171875, -16.581787109375, -15.83740234375, -15.093017578125, -14.3486328125, -13.604248046875, -12.85986328125, -12.115478515625, -11.37109375, -10.626708984375, -9.88232421875, -9.137939453125, -8.3935546875, -7.649169921875, -6.90478515625, -6.160400390625, -5.416015625, -4.671630859375, -3.92724609375, -3.182861328125, -2.4384765625, -1.694091796875, -0.94970703125, -0.205322265625, 0.5390625, 1.283447265625, 2.02783203125, 2.772216796875, 3.5166015625, 4.260986328125, 5.00537109375, 5.749755859375, 6.494140625, 7.238525390625, 7.98291015625, 8.727294921875, 9.4716796875, 10.216064453125, 10.96044921875, 11.704833984375, 12.44921875, 13.193603515625, 13.93798828125, 14.682373046875, 15.4267578125, 16.171142578125, 16.91552734375, 17.659912109375, 18.404296875, 19.148681640625, 19.89306640625, 20.637451171875, 21.3818359375, 22.126220703125, 22.87060546875, 23.614990234375, 24.359375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 3.0, 11.0, 23.0, 31.0, 55.0, 95.0, 114.0, 171.0, 160.0, 119.0, 65.0, 43.0, 34.0, 18.0, 15.0, 11.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002227783203125, -0.002148240804672241, -0.0020686984062194824, -0.0019891560077667236, -0.0019096136093139648, -0.001830071210861206, -0.0017505288124084473, -0.0016709864139556885, -0.0015914440155029297, -0.001511901617050171, -0.0014323592185974121, -0.0013528168201446533, -0.0012732744216918945, -0.0011937320232391357, -0.001114189624786377, -0.0010346472263336182, -0.0009551048278808594, -0.0008755624294281006, -0.0007960200309753418, -0.000716477632522583, -0.0006369352340698242, -0.0005573928356170654, -0.00047785043716430664, -0.00039830803871154785, -0.00031876564025878906, -0.00023922324180603027, -0.00015968084335327148, -8.01384449005127e-05, -5.960464477539062e-07, 7.894635200500488e-05, 0.00015848875045776367, 0.00023803114891052246, 0.00031757354736328125, 0.00039711594581604004, 0.00047665834426879883, 0.0005562007427215576, 0.0006357431411743164, 0.0007152855396270752, 0.000794827938079834, 0.0008743703365325928, 0.0009539127349853516, 0.0010334551334381104, 0.0011129975318908691, 0.001192539930343628, 0.0012720823287963867, 0.0013516247272491455, 0.0014311671257019043, 0.001510709524154663, 0.0015902519226074219, 0.0016697943210601807, 0.0017493367195129395, 0.0018288791179656982, 0.001908421516418457, 0.001987963914871216, 0.0020675063133239746, 0.0021470487117767334, 0.002226591110229492, 0.002306133508682251, 0.0023856759071350098, 0.0024652183055877686, 0.0025447607040405273, 0.002624303102493286, 0.002703845500946045, 0.0027833878993988037, 0.0028629302978515625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 8.0, 18.0, 16.0, 28.0, 33.0, 39.0, 77.0, 105.0, 135.0, 193.0, 253.0, 341.0, 513.0, 773.0, 1180.0, 1789.0, 2878.0, 4337.0, 7461.0, 12984.0, 23460.0, 45649.0, 93299.0, 190333.0, 273352.0, 192067.0, 94409.0, 45878.0, 23462.0, 13141.0, 7384.0, 4438.0, 2811.0, 1842.0, 1247.0, 766.0, 549.0, 404.0, 279.0, 167.0, 129.0, 95.0, 62.0, 58.0, 41.0, 24.0, 15.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-17.453125, -16.899169921875, -16.34521484375, -15.791259765625, -15.2373046875, -14.683349609375, -14.12939453125, -13.575439453125, -13.021484375, -12.467529296875, -11.91357421875, -11.359619140625, -10.8056640625, -10.251708984375, -9.69775390625, -9.143798828125, -8.58984375, -8.035888671875, -7.48193359375, -6.927978515625, -6.3740234375, -5.820068359375, -5.26611328125, -4.712158203125, -4.158203125, -3.604248046875, -3.05029296875, -2.496337890625, -1.9423828125, -1.388427734375, -0.83447265625, -0.280517578125, 0.2734375, 0.827392578125, 1.38134765625, 1.935302734375, 2.4892578125, 3.043212890625, 3.59716796875, 4.151123046875, 4.705078125, 5.259033203125, 5.81298828125, 6.366943359375, 6.9208984375, 7.474853515625, 8.02880859375, 8.582763671875, 9.13671875, 9.690673828125, 10.24462890625, 10.798583984375, 11.3525390625, 11.906494140625, 12.46044921875, 13.014404296875, 13.568359375, 14.122314453125, 14.67626953125, 15.230224609375, 15.7841796875, 16.338134765625, 16.89208984375, 17.446044921875, 18.0]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 10.0, 5.0, 13.0, 24.0, 14.0, 27.0, 42.0, 44.0, 46.0, 64.0, 86.0, 83.0, 84.0, 92.0, 81.0, 56.0, 56.0, 53.0, 25.0, 22.0, 16.0, 10.0, 11.0, 8.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.11590576171875, -5.8997802734375, -5.68365478515625, -5.467529296875, -5.25140380859375, -5.0352783203125, -4.81915283203125, -4.60302734375, -4.38690185546875, -4.1707763671875, -3.95465087890625, -3.738525390625, -3.52239990234375, -3.3062744140625, -3.09014892578125, -2.8740234375, -2.65789794921875, -2.4417724609375, -2.22564697265625, -2.009521484375, -1.79339599609375, -1.5772705078125, -1.36114501953125, -1.14501953125, -0.92889404296875, -0.7127685546875, -0.49664306640625, -0.280517578125, -0.06439208984375, 0.1517333984375, 0.36785888671875, 0.583984375, 0.80010986328125, 1.0162353515625, 1.23236083984375, 1.448486328125, 1.66461181640625, 1.8807373046875, 2.09686279296875, 2.31298828125, 2.52911376953125, 2.7452392578125, 2.96136474609375, 3.177490234375, 3.39361572265625, 3.6097412109375, 3.82586669921875, 4.0419921875, 4.25811767578125, 4.4742431640625, 4.69036865234375, 4.906494140625, 5.12261962890625, 5.3387451171875, 5.55487060546875, 5.77099609375, 5.98712158203125, 6.2032470703125, 6.41937255859375, 6.635498046875, 6.85162353515625, 7.0677490234375, 7.28387451171875, 7.5]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 3.0, 7.0, 7.0, 4.0, 7.0, 13.0, 20.0, 32.0, 23.0, 33.0, 26.0, 52.0, 65.0, 57.0, 61.0, 73.0, 73.0, 62.0, 58.0, 51.0, 54.0, 44.0, 39.0, 23.0, 27.0, 22.0, 14.0, 11.0, 11.0, 2.0, 2.0, 9.0, 9.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.64973831176758, -37.58329772949219, -36.51686096191406, -35.45042037963867, -34.38397979736328, -33.317543029785156, -32.251102447509766, -31.184663772583008, -30.11822509765625, -29.051786422729492, -27.985347747802734, -26.918907165527344, -25.852468490600586, -24.786029815673828, -23.719589233398438, -22.65315055847168, -21.586711883544922, -20.520273208618164, -19.453834533691406, -18.387393951416016, -17.320955276489258, -16.2545166015625, -15.188076972961426, -14.121637344360352, -13.055198669433594, -11.988759994506836, -10.922320365905762, -9.855880737304688, -8.78944206237793, -7.723002910614014, -6.656563758850098, -5.590124607086182, -4.523689270019531, -3.4572501182556152, -2.390810966491699, -1.3243718147277832, -0.2579326629638672, 0.8085064888000488, 1.8749456405639648, 2.941384792327881, 4.007823944091797, 5.074263095855713, 6.140702247619629, 7.207141399383545, 8.273580551147461, 9.340019226074219, 10.406458854675293, 11.472898483276367, 12.539337158203125, 13.605775833129883, 14.672215461730957, 15.738655090332031, 16.80509376525879, 17.871532440185547, 18.937973022460938, 20.004411697387695, 21.070850372314453, 22.13728904724121, 23.20372772216797, 24.27016830444336, 25.336606979370117, 26.403045654296875, 27.469486236572266, 28.535924911499023, 29.60236358642578]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 7.0, 11.0, 9.0, 7.0, 10.0, 8.0, 15.0, 13.0, 16.0, 13.0, 19.0, 19.0, 23.0, 20.0, 23.0, 27.0, 26.0, 42.0, 37.0, 33.0, 33.0, 29.0, 41.0, 31.0, 38.0, 37.0, 32.0, 40.0, 44.0, 26.0, 24.0, 22.0, 21.0, 19.0, 19.0, 19.0, 16.0, 16.0, 23.0, 5.0, 14.0, 12.0, 9.0, 10.0, 6.0, 6.0, 8.0, 4.0, 2.0, 5.0, 5.0, 0.0, 1.0, 2.0, 5.0, 1.0], "bins": [-21.573646545410156, -20.88542938232422, -20.19721221923828, -19.508995056152344, -18.820775985717773, -18.132558822631836, -17.4443416595459, -16.75612449645996, -16.06790542602539, -15.379688262939453, -14.6914701461792, -14.003252983093262, -13.315034866333008, -12.62681770324707, -11.938600540161133, -11.250383377075195, -10.562166213989258, -9.87394905090332, -9.185730934143066, -8.497513771057129, -7.809296131134033, -7.1210784912109375, -6.432861328125, -5.744643688201904, -5.056426048278809, -4.368208408355713, -3.6799910068511963, -2.9917736053466797, -2.303555965423584, -1.6153383255004883, -0.9271211624145508, -0.23890352249145508, 0.44931602478027344, 1.1375335454940796, 1.8257510662078857, 2.5139684677124023, 3.202186107635498, 3.8904037475585938, 4.578620910644531, 5.266838550567627, 5.955056190490723, 6.643273830413818, 7.331491470336914, 8.019708633422852, 8.707925796508789, 9.396143913269043, 10.08436107635498, 10.772579193115234, 11.460796356201172, 12.14901351928711, 12.837231636047363, 13.5254487991333, 14.213666915893555, 14.901884078979492, 15.59010124206543, 16.278318405151367, 16.966537475585938, 17.654754638671875, 18.342971801757812, 19.03118896484375, 19.71940803527832, 20.407625198364258, 21.095842361450195, 21.784059524536133, 22.47227668762207]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 2.0, 6.0, 18.0, 14.0, 20.0, 25.0, 43.0, 54.0, 80.0, 147.0, 209.0, 332.0, 560.0, 939.0, 1608.0, 2865.0, 4711.0, 8638.0, 15448.0, 29074.0, 55112.0, 102144.0, 172028.0, 221212.0, 185136.0, 114001.0, 61455.0, 32741.0, 17334.0, 9473.0, 5431.0, 3153.0, 1786.0, 1074.0, 625.0, 379.0, 220.0, 143.0, 114.0, 72.0, 36.0, 21.0, 16.0, 11.0, 12.0, 6.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-46.53125, -45.103515625, -43.67578125, -42.248046875, -40.8203125, -39.392578125, -37.96484375, -36.537109375, -35.109375, -33.681640625, -32.25390625, -30.826171875, -29.3984375, -27.970703125, -26.54296875, -25.115234375, -23.6875, -22.259765625, -20.83203125, -19.404296875, -17.9765625, -16.548828125, -15.12109375, -13.693359375, -12.265625, -10.837890625, -9.41015625, -7.982421875, -6.5546875, -5.126953125, -3.69921875, -2.271484375, -0.84375, 0.583984375, 2.01171875, 3.439453125, 4.8671875, 6.294921875, 7.72265625, 9.150390625, 10.578125, 12.005859375, 13.43359375, 14.861328125, 16.2890625, 17.716796875, 19.14453125, 20.572265625, 22.0, 23.427734375, 24.85546875, 26.283203125, 27.7109375, 29.138671875, 30.56640625, 31.994140625, 33.421875, 34.849609375, 36.27734375, 37.705078125, 39.1328125, 40.560546875, 41.98828125, 43.416015625, 44.84375]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 8.0, 7.0, 10.0, 6.0, 17.0, 12.0, 16.0, 8.0, 24.0, 18.0, 24.0, 30.0, 17.0, 41.0, 33.0, 33.0, 44.0, 36.0, 38.0, 29.0, 26.0, 45.0, 36.0, 46.0, 47.0, 29.0, 32.0, 32.0, 30.0, 21.0, 27.0, 22.0, 21.0, 20.0, 11.0, 19.0, 14.0, 9.0, 11.0, 13.0, 1.0, 8.0, 4.0, 6.0, 2.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.3125, -20.622802734375, -19.93310546875, -19.243408203125, -18.5537109375, -17.864013671875, -17.17431640625, -16.484619140625, -15.794921875, -15.105224609375, -14.41552734375, -13.725830078125, -13.0361328125, -12.346435546875, -11.65673828125, -10.967041015625, -10.27734375, -9.587646484375, -8.89794921875, -8.208251953125, -7.5185546875, -6.828857421875, -6.13916015625, -5.449462890625, -4.759765625, -4.070068359375, -3.38037109375, -2.690673828125, -2.0009765625, -1.311279296875, -0.62158203125, 0.068115234375, 0.7578125, 1.447509765625, 2.13720703125, 2.826904296875, 3.5166015625, 4.206298828125, 4.89599609375, 5.585693359375, 6.275390625, 6.965087890625, 7.65478515625, 8.344482421875, 9.0341796875, 9.723876953125, 10.41357421875, 11.103271484375, 11.79296875, 12.482666015625, 13.17236328125, 13.862060546875, 14.5517578125, 15.241455078125, 15.93115234375, 16.620849609375, 17.310546875, 18.000244140625, 18.68994140625, 19.379638671875, 20.0693359375, 20.759033203125, 21.44873046875, 22.138427734375, 22.828125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 8.0, 8.0, 10.0, 15.0, 22.0, 34.0, 52.0, 72.0, 117.0, 178.0, 245.0, 385.0, 580.0, 920.0, 1447.0, 2152.0, 3354.0, 5352.0, 8276.0, 13269.0, 20618.0, 32850.0, 51662.0, 79269.0, 114072.0, 146385.0, 155756.0, 133467.0, 97386.0, 65522.0, 42208.0, 26447.0, 17062.0, 10433.0, 6662.0, 4265.0, 2755.0, 1833.0, 1152.0, 775.0, 464.0, 332.0, 221.0, 156.0, 107.0, 69.0, 51.0, 27.0, 13.0, 17.0, 14.0, 7.0, 5.0, 4.0, 0.0, 1.0, 3.0], "bins": [-28.421875, -27.567626953125, -26.71337890625, -25.859130859375, -25.0048828125, -24.150634765625, -23.29638671875, -22.442138671875, -21.587890625, -20.733642578125, -19.87939453125, -19.025146484375, -18.1708984375, -17.316650390625, -16.46240234375, -15.608154296875, -14.75390625, -13.899658203125, -13.04541015625, -12.191162109375, -11.3369140625, -10.482666015625, -9.62841796875, -8.774169921875, -7.919921875, -7.065673828125, -6.21142578125, -5.357177734375, -4.5029296875, -3.648681640625, -2.79443359375, -1.940185546875, -1.0859375, -0.231689453125, 0.62255859375, 1.476806640625, 2.3310546875, 3.185302734375, 4.03955078125, 4.893798828125, 5.748046875, 6.602294921875, 7.45654296875, 8.310791015625, 9.1650390625, 10.019287109375, 10.87353515625, 11.727783203125, 12.58203125, 13.436279296875, 14.29052734375, 15.144775390625, 15.9990234375, 16.853271484375, 17.70751953125, 18.561767578125, 19.416015625, 20.270263671875, 21.12451171875, 21.978759765625, 22.8330078125, 23.687255859375, 24.54150390625, 25.395751953125, 26.25]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 10.0, 3.0, 7.0, 12.0, 13.0, 16.0, 21.0, 19.0, 18.0, 29.0, 25.0, 37.0, 28.0, 33.0, 41.0, 48.0, 39.0, 32.0, 46.0, 40.0, 53.0, 40.0, 48.0, 41.0, 42.0, 32.0, 34.0, 39.0, 25.0, 20.0, 18.0, 19.0, 14.0, 19.0, 11.0, 6.0, 9.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.1953125, -14.7066650390625, -14.218017578125, -13.7293701171875, -13.24072265625, -12.7520751953125, -12.263427734375, -11.7747802734375, -11.2861328125, -10.7974853515625, -10.308837890625, -9.8201904296875, -9.33154296875, -8.8428955078125, -8.354248046875, -7.8656005859375, -7.376953125, -6.8883056640625, -6.399658203125, -5.9110107421875, -5.42236328125, -4.9337158203125, -4.445068359375, -3.9564208984375, -3.4677734375, -2.9791259765625, -2.490478515625, -2.0018310546875, -1.51318359375, -1.0245361328125, -0.535888671875, -0.0472412109375, 0.44140625, 0.9300537109375, 1.418701171875, 1.9073486328125, 2.39599609375, 2.8846435546875, 3.373291015625, 3.8619384765625, 4.3505859375, 4.8392333984375, 5.327880859375, 5.8165283203125, 6.30517578125, 6.7938232421875, 7.282470703125, 7.7711181640625, 8.259765625, 8.7484130859375, 9.237060546875, 9.7257080078125, 10.21435546875, 10.7030029296875, 11.191650390625, 11.6802978515625, 12.1689453125, 12.6575927734375, 13.146240234375, 13.6348876953125, 14.12353515625, 14.6121826171875, 15.100830078125, 15.5894775390625, 16.078125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 9.0, 21.0, 28.0, 35.0, 59.0, 73.0, 97.0, 190.0, 232.0, 330.0, 534.0, 828.0, 1427.0, 2299.0, 4072.0, 7399.0, 15171.0, 33170.0, 81085.0, 199448.0, 328346.0, 215336.0, 87728.0, 35572.0, 16185.0, 8062.0, 4261.0, 2454.0, 1506.0, 907.0, 613.0, 339.0, 248.0, 151.0, 106.0, 68.0, 34.0, 44.0, 20.0, 11.0, 18.0, 16.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.921875, -25.978759765625, -25.03564453125, -24.092529296875, -23.1494140625, -22.206298828125, -21.26318359375, -20.320068359375, -19.376953125, -18.433837890625, -17.49072265625, -16.547607421875, -15.6044921875, -14.661376953125, -13.71826171875, -12.775146484375, -11.83203125, -10.888916015625, -9.94580078125, -9.002685546875, -8.0595703125, -7.116455078125, -6.17333984375, -5.230224609375, -4.287109375, -3.343994140625, -2.40087890625, -1.457763671875, -0.5146484375, 0.428466796875, 1.37158203125, 2.314697265625, 3.2578125, 4.200927734375, 5.14404296875, 6.087158203125, 7.0302734375, 7.973388671875, 8.91650390625, 9.859619140625, 10.802734375, 11.745849609375, 12.68896484375, 13.632080078125, 14.5751953125, 15.518310546875, 16.46142578125, 17.404541015625, 18.34765625, 19.290771484375, 20.23388671875, 21.177001953125, 22.1201171875, 23.063232421875, 24.00634765625, 24.949462890625, 25.892578125, 26.835693359375, 27.77880859375, 28.721923828125, 29.6650390625, 30.608154296875, 31.55126953125, 32.494384765625, 33.4375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 6.0, 13.0, 11.0, 15.0, 18.0, 22.0, 29.0, 38.0, 61.0, 43.0, 56.0, 62.0, 75.0, 81.0, 71.0, 72.0, 70.0, 46.0, 44.0, 29.0, 21.0, 23.0, 13.0, 18.0, 13.0, 10.0, 6.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018987655639648438, -0.0018338114023208618, -0.0017688572406768799, -0.001703903079032898, -0.001638948917388916, -0.001573994755744934, -0.0015090405941009521, -0.0014440864324569702, -0.0013791322708129883, -0.0013141781091690063, -0.0012492239475250244, -0.0011842697858810425, -0.0011193156242370605, -0.0010543614625930786, -0.0009894073009490967, -0.0009244531393051147, -0.0008594989776611328, -0.0007945448160171509, -0.0007295906543731689, -0.000664636492729187, -0.0005996823310852051, -0.0005347281694412231, -0.0004697740077972412, -0.0004048198461532593, -0.00033986568450927734, -0.0002749115228652954, -0.00020995736122131348, -0.00014500319957733154, -8.004903793334961e-05, -1.5094876289367676e-05, 4.985928535461426e-05, 0.00011481344699859619, 0.00017976760864257812, 0.00024472177028656006, 0.000309675931930542, 0.0003746300935745239, 0.00043958425521850586, 0.0005045384168624878, 0.0005694925785064697, 0.0006344467401504517, 0.0006994009017944336, 0.0007643550634384155, 0.0008293092250823975, 0.0008942633867263794, 0.0009592175483703613, 0.0010241717100143433, 0.0010891258716583252, 0.0011540800333023071, 0.001219034194946289, 0.001283988356590271, 0.001348942518234253, 0.0014138966798782349, 0.0014788508415222168, 0.0015438050031661987, 0.0016087591648101807, 0.0016737133264541626, 0.0017386674880981445, 0.0018036216497421265, 0.0018685758113861084, 0.0019335299730300903, 0.0019984841346740723, 0.002063438296318054, 0.002128392457962036, 0.002193346619606018, 0.00225830078125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 15.0, 10.0, 24.0, 30.0, 45.0, 65.0, 104.0, 144.0, 204.0, 288.0, 411.0, 655.0, 1031.0, 1535.0, 2497.0, 4234.0, 7410.0, 13860.0, 28001.0, 58628.0, 124370.0, 228737.0, 257271.0, 162911.0, 78495.0, 36481.0, 17881.0, 9517.0, 5127.0, 3026.0, 1922.0, 1218.0, 796.0, 525.0, 337.0, 239.0, 161.0, 111.0, 69.0, 55.0, 37.0, 34.0, 15.0, 15.0, 9.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.59375, -23.852783203125, -23.11181640625, -22.370849609375, -21.6298828125, -20.888916015625, -20.14794921875, -19.406982421875, -18.666015625, -17.925048828125, -17.18408203125, -16.443115234375, -15.7021484375, -14.961181640625, -14.22021484375, -13.479248046875, -12.73828125, -11.997314453125, -11.25634765625, -10.515380859375, -9.7744140625, -9.033447265625, -8.29248046875, -7.551513671875, -6.810546875, -6.069580078125, -5.32861328125, -4.587646484375, -3.8466796875, -3.105712890625, -2.36474609375, -1.623779296875, -0.8828125, -0.141845703125, 0.59912109375, 1.340087890625, 2.0810546875, 2.822021484375, 3.56298828125, 4.303955078125, 5.044921875, 5.785888671875, 6.52685546875, 7.267822265625, 8.0087890625, 8.749755859375, 9.49072265625, 10.231689453125, 10.97265625, 11.713623046875, 12.45458984375, 13.195556640625, 13.9365234375, 14.677490234375, 15.41845703125, 16.159423828125, 16.900390625, 17.641357421875, 18.38232421875, 19.123291015625, 19.8642578125, 20.605224609375, 21.34619140625, 22.087158203125, 22.828125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 4.0, 7.0, 1.0, 4.0, 5.0, 16.0, 18.0, 18.0, 24.0, 38.0, 44.0, 51.0, 65.0, 67.0, 69.0, 72.0, 74.0, 68.0, 77.0, 59.0, 47.0, 52.0, 37.0, 19.0, 23.0, 9.0, 10.0, 4.0, 7.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.84375, -7.599609375, -7.35546875, -7.111328125, -6.8671875, -6.623046875, -6.37890625, -6.134765625, -5.890625, -5.646484375, -5.40234375, -5.158203125, -4.9140625, -4.669921875, -4.42578125, -4.181640625, -3.9375, -3.693359375, -3.44921875, -3.205078125, -2.9609375, -2.716796875, -2.47265625, -2.228515625, -1.984375, -1.740234375, -1.49609375, -1.251953125, -1.0078125, -0.763671875, -0.51953125, -0.275390625, -0.03125, 0.212890625, 0.45703125, 0.701171875, 0.9453125, 1.189453125, 1.43359375, 1.677734375, 1.921875, 2.166015625, 2.41015625, 2.654296875, 2.8984375, 3.142578125, 3.38671875, 3.630859375, 3.875, 4.119140625, 4.36328125, 4.607421875, 4.8515625, 5.095703125, 5.33984375, 5.583984375, 5.828125, 6.072265625, 6.31640625, 6.560546875, 6.8046875, 7.048828125, 7.29296875, 7.537109375, 7.78125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 1.0, 4.0, 2.0, 11.0, 13.0, 6.0, 18.0, 11.0, 21.0, 21.0, 37.0, 42.0, 45.0, 54.0, 61.0, 37.0, 64.0, 69.0, 62.0, 62.0, 52.0, 55.0, 42.0, 37.0, 37.0, 36.0, 19.0, 20.0, 9.0, 9.0, 8.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.54153060913086, -29.627031326293945, -28.71253204345703, -27.798032760620117, -26.883533477783203, -25.969036102294922, -25.054536819458008, -24.140037536621094, -23.22553825378418, -22.311038970947266, -21.39653968811035, -20.482040405273438, -19.567543029785156, -18.65304183959961, -17.738544464111328, -16.824045181274414, -15.9095458984375, -14.995046615600586, -14.080547332763672, -13.166049003601074, -12.25154972076416, -11.337050437927246, -10.422552108764648, -9.508052825927734, -8.59355354309082, -7.679054260253906, -6.76455545425415, -5.8500566482543945, -4.9355573654174805, -4.021058082580566, -3.1065592765808105, -2.1920604705810547, -1.2775592803955078, -0.36306023597717285, 0.5514388084411621, 1.465937852859497, 2.380436897277832, 3.294936180114746, 4.209434986114502, 5.123933792114258, 6.038433074951172, 6.952932357788086, 7.867431163787842, 8.781929969787598, 9.696429252624512, 10.610928535461426, 11.525426864624023, 12.439926147460938, 13.354425430297852, 14.268924713134766, 15.18342399597168, 16.097923278808594, 17.012420654296875, 17.926921844482422, 18.841419219970703, 19.755918502807617, 20.67041778564453, 21.584917068481445, 22.49941635131836, 23.413915634155273, 24.328414916992188, 25.24291229248047, 26.157411575317383, 27.071910858154297, 27.98641014099121]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 7.0, 13.0, 15.0, 15.0, 16.0, 19.0, 16.0, 18.0, 20.0, 24.0, 35.0, 29.0, 22.0, 35.0, 37.0, 32.0, 30.0, 37.0, 41.0, 42.0, 42.0, 31.0, 38.0, 40.0, 43.0, 22.0, 32.0, 24.0, 28.0, 23.0, 27.0, 16.0, 12.0, 11.0, 15.0, 15.0, 11.0, 9.0, 8.0, 8.0, 4.0, 7.0, 4.0, 8.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.380128860473633, -20.699838638305664, -20.019548416137695, -19.339258193969727, -18.658967971801758, -17.97867774963379, -17.298389434814453, -16.618099212646484, -15.9378080368042, -15.25751781463623, -14.577227592468262, -13.89693832397461, -13.21664810180664, -12.536357879638672, -11.856067657470703, -11.175777435302734, -10.495487213134766, -9.815196990966797, -9.134906768798828, -8.45461654663086, -7.774326801300049, -7.09403657913208, -6.4137468338012695, -5.733456611633301, -5.053166389465332, -4.372876167297363, -3.6925861835479736, -3.012296199798584, -2.3320059776306152, -1.6517157554626465, -0.9714260101318359, -0.2911357879638672, 0.38915443420410156, 1.0694445371627808, 1.74973464012146, 2.4300246238708496, 3.1103148460388184, 3.790605068206787, 4.470894813537598, 5.151185035705566, 5.831475257873535, 6.511765480041504, 7.192055702209473, 7.872345447540283, 8.552635192871094, 9.232925415039062, 9.913215637207031, 10.593505859375, 11.273796081542969, 11.954086303710938, 12.634376525878906, 13.314666748046875, 13.994956970214844, 14.675247192382812, 15.355536460876465, 16.03582763671875, 16.71611785888672, 17.396408081054688, 18.076698303222656, 18.756988525390625, 19.437278747558594, 20.117568969726562, 20.79785919189453, 21.4781494140625, 22.158437728881836]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 8.0, 13.0, 15.0, 27.0, 47.0, 81.0, 125.0, 180.0, 304.0, 497.0, 809.0, 1332.0, 2214.0, 3590.0, 6102.0, 10400.0, 18062.0, 33305.0, 62867.0, 127469.0, 296389.0, 747645.0, 1287171.0, 915094.0, 370714.0, 151622.0, 72225.0, 37897.0, 20423.0, 11429.0, 6597.0, 3805.0, 2256.0, 1368.0, 829.0, 515.0, 323.0, 185.0, 125.0, 88.0, 44.0, 37.0, 24.0, 8.0, 14.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-30.375, -29.44384765625, -28.5126953125, -27.58154296875, -26.650390625, -25.71923828125, -24.7880859375, -23.85693359375, -22.92578125, -21.99462890625, -21.0634765625, -20.13232421875, -19.201171875, -18.27001953125, -17.3388671875, -16.40771484375, -15.4765625, -14.54541015625, -13.6142578125, -12.68310546875, -11.751953125, -10.82080078125, -9.8896484375, -8.95849609375, -8.02734375, -7.09619140625, -6.1650390625, -5.23388671875, -4.302734375, -3.37158203125, -2.4404296875, -1.50927734375, -0.578125, 0.35302734375, 1.2841796875, 2.21533203125, 3.146484375, 4.07763671875, 5.0087890625, 5.93994140625, 6.87109375, 7.80224609375, 8.7333984375, 9.66455078125, 10.595703125, 11.52685546875, 12.4580078125, 13.38916015625, 14.3203125, 15.25146484375, 16.1826171875, 17.11376953125, 18.044921875, 18.97607421875, 19.9072265625, 20.83837890625, 21.76953125, 22.70068359375, 23.6318359375, 24.56298828125, 25.494140625, 26.42529296875, 27.3564453125, 28.28759765625, 29.21875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 12.0, 6.0, 11.0, 17.0, 4.0, 17.0, 18.0, 18.0, 23.0, 17.0, 26.0, 30.0, 31.0, 38.0, 29.0, 32.0, 35.0, 40.0, 38.0, 35.0, 34.0, 39.0, 37.0, 45.0, 41.0, 29.0, 30.0, 30.0, 17.0, 36.0, 23.0, 21.0, 22.0, 10.0, 12.0, 16.0, 11.0, 9.0, 6.0, 7.0, 6.0, 7.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-15.046875, -14.593505859375, -14.14013671875, -13.686767578125, -13.2333984375, -12.780029296875, -12.32666015625, -11.873291015625, -11.419921875, -10.966552734375, -10.51318359375, -10.059814453125, -9.6064453125, -9.153076171875, -8.69970703125, -8.246337890625, -7.79296875, -7.339599609375, -6.88623046875, -6.432861328125, -5.9794921875, -5.526123046875, -5.07275390625, -4.619384765625, -4.166015625, -3.712646484375, -3.25927734375, -2.805908203125, -2.3525390625, -1.899169921875, -1.44580078125, -0.992431640625, -0.5390625, -0.085693359375, 0.36767578125, 0.821044921875, 1.2744140625, 1.727783203125, 2.18115234375, 2.634521484375, 3.087890625, 3.541259765625, 3.99462890625, 4.447998046875, 4.9013671875, 5.354736328125, 5.80810546875, 6.261474609375, 6.71484375, 7.168212890625, 7.62158203125, 8.074951171875, 8.5283203125, 8.981689453125, 9.43505859375, 9.888427734375, 10.341796875, 10.795166015625, 11.24853515625, 11.701904296875, 12.1552734375, 12.608642578125, 13.06201171875, 13.515380859375, 13.96875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 14.0, 7.0, 29.0, 43.0, 59.0, 81.0, 141.0, 187.0, 326.0, 527.0, 826.0, 1407.0, 2393.0, 4096.0, 7037.0, 12258.0, 22276.0, 40195.0, 75436.0, 145883.0, 291993.0, 593150.0, 1029057.0, 941153.0, 505559.0, 249119.0, 125115.0, 65405.0, 34923.0, 19357.0, 10768.0, 6219.0, 3561.0, 2130.0, 1277.0, 824.0, 513.0, 325.0, 188.0, 136.0, 94.0, 68.0, 46.0, 28.0, 18.0, 9.0, 11.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.96875, -24.13330078125, -23.2978515625, -22.46240234375, -21.626953125, -20.79150390625, -19.9560546875, -19.12060546875, -18.28515625, -17.44970703125, -16.6142578125, -15.77880859375, -14.943359375, -14.10791015625, -13.2724609375, -12.43701171875, -11.6015625, -10.76611328125, -9.9306640625, -9.09521484375, -8.259765625, -7.42431640625, -6.5888671875, -5.75341796875, -4.91796875, -4.08251953125, -3.2470703125, -2.41162109375, -1.576171875, -0.74072265625, 0.0947265625, 0.93017578125, 1.765625, 2.60107421875, 3.4365234375, 4.27197265625, 5.107421875, 5.94287109375, 6.7783203125, 7.61376953125, 8.44921875, 9.28466796875, 10.1201171875, 10.95556640625, 11.791015625, 12.62646484375, 13.4619140625, 14.29736328125, 15.1328125, 15.96826171875, 16.8037109375, 17.63916015625, 18.474609375, 19.31005859375, 20.1455078125, 20.98095703125, 21.81640625, 22.65185546875, 23.4873046875, 24.32275390625, 25.158203125, 25.99365234375, 26.8291015625, 27.66455078125, 28.5]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 2.0, 5.0, 4.0, 9.0, 9.0, 9.0, 18.0, 21.0, 27.0, 41.0, 41.0, 48.0, 58.0, 90.0, 94.0, 115.0, 122.0, 135.0, 182.0, 218.0, 276.0, 300.0, 283.0, 309.0, 288.0, 248.0, 209.0, 158.0, 152.0, 126.0, 109.0, 64.0, 71.0, 53.0, 30.0, 40.0, 26.0, 19.0, 24.0, 9.0, 11.0, 9.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-9.8125, -9.528564453125, -9.24462890625, -8.960693359375, -8.6767578125, -8.392822265625, -8.10888671875, -7.824951171875, -7.541015625, -7.257080078125, -6.97314453125, -6.689208984375, -6.4052734375, -6.121337890625, -5.83740234375, -5.553466796875, -5.26953125, -4.985595703125, -4.70166015625, -4.417724609375, -4.1337890625, -3.849853515625, -3.56591796875, -3.281982421875, -2.998046875, -2.714111328125, -2.43017578125, -2.146240234375, -1.8623046875, -1.578369140625, -1.29443359375, -1.010498046875, -0.7265625, -0.442626953125, -0.15869140625, 0.125244140625, 0.4091796875, 0.693115234375, 0.97705078125, 1.260986328125, 1.544921875, 1.828857421875, 2.11279296875, 2.396728515625, 2.6806640625, 2.964599609375, 3.24853515625, 3.532470703125, 3.81640625, 4.100341796875, 4.38427734375, 4.668212890625, 4.9521484375, 5.236083984375, 5.52001953125, 5.803955078125, 6.087890625, 6.371826171875, 6.65576171875, 6.939697265625, 7.2236328125, 7.507568359375, 7.79150390625, 8.075439453125, 8.359375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 4.0, 3.0, 6.0, 16.0, 16.0, 14.0, 25.0, 33.0, 36.0, 48.0, 47.0, 69.0, 76.0, 71.0, 85.0, 70.0, 82.0, 54.0, 53.0, 40.0, 39.0, 27.0, 22.0, 18.0, 15.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.57342529296875, -34.563270568847656, -33.5531120300293, -32.5429573059082, -31.53280258178711, -30.522645950317383, -29.512489318847656, -28.502334594726562, -27.492177963256836, -26.48202133178711, -25.471866607666016, -24.46170997619629, -23.451553344726562, -22.44139862060547, -21.431241989135742, -20.421085357666016, -19.410930633544922, -18.400774002075195, -17.3906192779541, -16.380462646484375, -15.370306968688965, -14.360151290893555, -13.349994659423828, -12.339838981628418, -11.329683303833008, -10.319527626037598, -9.309371948242188, -8.299215316772461, -7.289059638977051, -6.278903961181641, -5.268747806549072, -4.258591651916504, -3.248432159423828, -2.238276243209839, -1.2281203269958496, -0.21796441078186035, 0.7921915054321289, 1.802347183227539, 2.8125033378601074, 3.822659492492676, 4.832815170288086, 5.842970848083496, 6.8531270027160645, 7.863283157348633, 8.873438835144043, 9.883594512939453, 10.89375114440918, 11.90390682220459, 12.9140625, 13.92421817779541, 14.93437385559082, 15.944530487060547, 16.95468521118164, 17.964841842651367, 18.974998474121094, 19.985153198242188, 20.995309829711914, 22.00546646118164, 23.015621185302734, 24.02577781677246, 25.035934448242188, 26.04608917236328, 27.056245803833008, 28.066402435302734, 29.076557159423828]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 8.0, 10.0, 12.0, 16.0, 8.0, 14.0, 19.0, 16.0, 29.0, 24.0, 21.0, 28.0, 38.0, 42.0, 32.0, 32.0, 51.0, 43.0, 40.0, 33.0, 35.0, 40.0, 39.0, 52.0, 36.0, 33.0, 19.0, 23.0, 24.0, 18.0, 19.0, 20.0, 18.0, 20.0, 18.0, 11.0, 14.0, 9.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-20.64584732055664, -20.00339698791504, -19.360946655273438, -18.71849822998047, -18.076047897338867, -17.433597564697266, -16.791149139404297, -16.148698806762695, -15.506248474121094, -14.863798141479492, -14.221348762512207, -13.578899383544922, -12.93644905090332, -12.293998718261719, -11.651549339294434, -11.009099960327148, -10.366649627685547, -9.724199295043945, -9.08174991607666, -8.439300537109375, -7.796850204467773, -7.15440034866333, -6.511950492858887, -5.869500637054443, -5.22705078125, -4.584600925445557, -3.9421510696411133, -3.29970121383667, -2.6572513580322266, -2.014801502227783, -1.3723516464233398, -0.7299017906188965, -0.08745193481445312, 0.5549979209899902, 1.1974477767944336, 1.839897632598877, 2.4823474884033203, 3.1247973442077637, 3.767247200012207, 4.40969705581665, 5.052146911621094, 5.694596767425537, 6.3370466232299805, 6.979496479034424, 7.621946334838867, 8.264396667480469, 8.906846046447754, 9.549295425415039, 10.19174575805664, 10.834196090698242, 11.476645469665527, 12.119094848632812, 12.761545181274414, 13.403995513916016, 14.0464448928833, 14.688894271850586, 15.331344604492188, 15.973794937133789, 16.61624526977539, 17.25869369506836, 17.90114402770996, 18.543594360351562, 19.18604278564453, 19.828493118286133, 20.470943450927734]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 13.0, 10.0, 21.0, 17.0, 42.0, 46.0, 83.0, 91.0, 188.0, 241.0, 349.0, 553.0, 775.0, 1239.0, 1865.0, 3104.0, 4937.0, 8022.0, 13539.0, 23809.0, 44951.0, 87947.0, 173445.0, 260211.0, 199595.0, 103846.0, 52240.0, 27816.0, 15416.0, 9000.0, 5564.0, 3292.0, 2139.0, 1379.0, 943.0, 586.0, 385.0, 278.0, 184.0, 112.0, 86.0, 46.0, 41.0, 30.0, 25.0, 20.0, 5.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-29.1875, -28.292724609375, -27.39794921875, -26.503173828125, -25.6083984375, -24.713623046875, -23.81884765625, -22.924072265625, -22.029296875, -21.134521484375, -20.23974609375, -19.344970703125, -18.4501953125, -17.555419921875, -16.66064453125, -15.765869140625, -14.87109375, -13.976318359375, -13.08154296875, -12.186767578125, -11.2919921875, -10.397216796875, -9.50244140625, -8.607666015625, -7.712890625, -6.818115234375, -5.92333984375, -5.028564453125, -4.1337890625, -3.239013671875, -2.34423828125, -1.449462890625, -0.5546875, 0.340087890625, 1.23486328125, 2.129638671875, 3.0244140625, 3.919189453125, 4.81396484375, 5.708740234375, 6.603515625, 7.498291015625, 8.39306640625, 9.287841796875, 10.1826171875, 11.077392578125, 11.97216796875, 12.866943359375, 13.76171875, 14.656494140625, 15.55126953125, 16.446044921875, 17.3408203125, 18.235595703125, 19.13037109375, 20.025146484375, 20.919921875, 21.814697265625, 22.70947265625, 23.604248046875, 24.4990234375, 25.393798828125, 26.28857421875, 27.183349609375, 28.078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 8.0, 1.0, 8.0, 15.0, 16.0, 15.0, 29.0, 24.0, 27.0, 23.0, 36.0, 35.0, 39.0, 25.0, 42.0, 34.0, 58.0, 46.0, 34.0, 59.0, 39.0, 52.0, 49.0, 33.0, 27.0, 33.0, 26.0, 20.0, 28.0, 9.0, 17.0, 19.0, 17.0, 8.0, 12.0, 3.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.375, -21.67138671875, -20.9677734375, -20.26416015625, -19.560546875, -18.85693359375, -18.1533203125, -17.44970703125, -16.74609375, -16.04248046875, -15.3388671875, -14.63525390625, -13.931640625, -13.22802734375, -12.5244140625, -11.82080078125, -11.1171875, -10.41357421875, -9.7099609375, -9.00634765625, -8.302734375, -7.59912109375, -6.8955078125, -6.19189453125, -5.48828125, -4.78466796875, -4.0810546875, -3.37744140625, -2.673828125, -1.97021484375, -1.2666015625, -0.56298828125, 0.140625, 0.84423828125, 1.5478515625, 2.25146484375, 2.955078125, 3.65869140625, 4.3623046875, 5.06591796875, 5.76953125, 6.47314453125, 7.1767578125, 7.88037109375, 8.583984375, 9.28759765625, 9.9912109375, 10.69482421875, 11.3984375, 12.10205078125, 12.8056640625, 13.50927734375, 14.212890625, 14.91650390625, 15.6201171875, 16.32373046875, 17.02734375, 17.73095703125, 18.4345703125, 19.13818359375, 19.841796875, 20.54541015625, 21.2490234375, 21.95263671875, 22.65625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 10.0, 18.0, 23.0, 17.0, 29.0, 28.0, 51.0, 75.0, 112.0, 151.0, 231.0, 305.0, 498.0, 720.0, 1099.0, 1665.0, 2764.0, 4615.0, 8312.0, 16142.0, 35204.0, 90886.0, 262570.0, 370165.0, 149504.0, 54028.0, 22750.0, 10966.0, 6015.0, 3427.0, 2110.0, 1363.0, 836.0, 565.0, 389.0, 276.0, 181.0, 137.0, 92.0, 58.0, 40.0, 35.0, 20.0, 21.0, 11.0, 13.0, 8.0, 10.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.625, -36.337890625, -35.05078125, -33.763671875, -32.4765625, -31.189453125, -29.90234375, -28.615234375, -27.328125, -26.041015625, -24.75390625, -23.466796875, -22.1796875, -20.892578125, -19.60546875, -18.318359375, -17.03125, -15.744140625, -14.45703125, -13.169921875, -11.8828125, -10.595703125, -9.30859375, -8.021484375, -6.734375, -5.447265625, -4.16015625, -2.873046875, -1.5859375, -0.298828125, 0.98828125, 2.275390625, 3.5625, 4.849609375, 6.13671875, 7.423828125, 8.7109375, 9.998046875, 11.28515625, 12.572265625, 13.859375, 15.146484375, 16.43359375, 17.720703125, 19.0078125, 20.294921875, 21.58203125, 22.869140625, 24.15625, 25.443359375, 26.73046875, 28.017578125, 29.3046875, 30.591796875, 31.87890625, 33.166015625, 34.453125, 35.740234375, 37.02734375, 38.314453125, 39.6015625, 40.888671875, 42.17578125, 43.462890625, 44.75]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 6.0, 13.0, 4.0, 12.0, 14.0, 18.0, 21.0, 15.0, 26.0, 21.0, 22.0, 29.0, 21.0, 43.0, 32.0, 38.0, 26.0, 35.0, 30.0, 40.0, 28.0, 29.0, 25.0, 45.0, 23.0, 32.0, 23.0, 21.0, 26.0, 31.0, 27.0, 24.0, 32.0, 19.0, 17.0, 17.0, 18.0, 14.0, 15.0, 6.0, 5.0, 3.0, 5.0, 3.0, 4.0, 3.0, 8.0, 3.0, 2.0, 4.0, 1.0], "bins": [-10.921875, -10.59521484375, -10.2685546875, -9.94189453125, -9.615234375, -9.28857421875, -8.9619140625, -8.63525390625, -8.30859375, -7.98193359375, -7.6552734375, -7.32861328125, -7.001953125, -6.67529296875, -6.3486328125, -6.02197265625, -5.6953125, -5.36865234375, -5.0419921875, -4.71533203125, -4.388671875, -4.06201171875, -3.7353515625, -3.40869140625, -3.08203125, -2.75537109375, -2.4287109375, -2.10205078125, -1.775390625, -1.44873046875, -1.1220703125, -0.79541015625, -0.46875, -0.14208984375, 0.1845703125, 0.51123046875, 0.837890625, 1.16455078125, 1.4912109375, 1.81787109375, 2.14453125, 2.47119140625, 2.7978515625, 3.12451171875, 3.451171875, 3.77783203125, 4.1044921875, 4.43115234375, 4.7578125, 5.08447265625, 5.4111328125, 5.73779296875, 6.064453125, 6.39111328125, 6.7177734375, 7.04443359375, 7.37109375, 7.69775390625, 8.0244140625, 8.35107421875, 8.677734375, 9.00439453125, 9.3310546875, 9.65771484375, 9.984375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 11.0, 10.0, 20.0, 24.0, 31.0, 49.0, 75.0, 103.0, 166.0, 214.0, 327.0, 473.0, 747.0, 1063.0, 1727.0, 2801.0, 4450.0, 7558.0, 13695.0, 26917.0, 59508.0, 152028.0, 358886.0, 244497.0, 90704.0, 38305.0, 18526.0, 10080.0, 5664.0, 3469.0, 2175.0, 1419.0, 881.0, 584.0, 432.0, 265.0, 200.0, 142.0, 93.0, 65.0, 62.0, 31.0, 20.0, 12.0, 16.0, 11.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.53125, -13.117919921875, -12.70458984375, -12.291259765625, -11.8779296875, -11.464599609375, -11.05126953125, -10.637939453125, -10.224609375, -9.811279296875, -9.39794921875, -8.984619140625, -8.5712890625, -8.157958984375, -7.74462890625, -7.331298828125, -6.91796875, -6.504638671875, -6.09130859375, -5.677978515625, -5.2646484375, -4.851318359375, -4.43798828125, -4.024658203125, -3.611328125, -3.197998046875, -2.78466796875, -2.371337890625, -1.9580078125, -1.544677734375, -1.13134765625, -0.718017578125, -0.3046875, 0.108642578125, 0.52197265625, 0.935302734375, 1.3486328125, 1.761962890625, 2.17529296875, 2.588623046875, 3.001953125, 3.415283203125, 3.82861328125, 4.241943359375, 4.6552734375, 5.068603515625, 5.48193359375, 5.895263671875, 6.30859375, 6.721923828125, 7.13525390625, 7.548583984375, 7.9619140625, 8.375244140625, 8.78857421875, 9.201904296875, 9.615234375, 10.028564453125, 10.44189453125, 10.855224609375, 11.2685546875, 11.681884765625, 12.09521484375, 12.508544921875, 12.921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 5.0, 11.0, 13.0, 13.0, 21.0, 36.0, 44.0, 72.0, 86.0, 117.0, 111.0, 106.0, 98.0, 54.0, 49.0, 37.0, 29.0, 15.0, 18.0, 11.0, 13.0, 8.0, 2.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011739730834960938, -0.001140102744102478, -0.0011062324047088623, -0.0010723620653152466, -0.0010384917259216309, -0.0010046213865280151, -0.0009707510471343994, -0.0009368807077407837, -0.000903010368347168, -0.0008691400289535522, -0.0008352696895599365, -0.0008013993501663208, -0.0007675290107727051, -0.0007336586713790894, -0.0006997883319854736, -0.0006659179925918579, -0.0006320476531982422, -0.0005981773138046265, -0.0005643069744110107, -0.000530436635017395, -0.0004965662956237793, -0.0004626959562301636, -0.00042882561683654785, -0.00039495527744293213, -0.0003610849380493164, -0.0003272145986557007, -0.00029334425926208496, -0.00025947391986846924, -0.00022560358047485352, -0.0001917332410812378, -0.00015786290168762207, -0.00012399256229400635, -9.012222290039062e-05, -5.62518835067749e-05, -2.238154411315918e-05, 1.1488795280456543e-05, 4.5359134674072266e-05, 7.922947406768799e-05, 0.00011309981346130371, 0.00014697015285491943, 0.00018084049224853516, 0.00021471083164215088, 0.0002485811710357666, 0.0002824515104293823, 0.00031632184982299805, 0.00035019218921661377, 0.0003840625286102295, 0.0004179328680038452, 0.00045180320739746094, 0.00048567354679107666, 0.0005195438861846924, 0.0005534142255783081, 0.0005872845649719238, 0.0006211549043655396, 0.0006550252437591553, 0.000688895583152771, 0.0007227659225463867, 0.0007566362619400024, 0.0007905066013336182, 0.0008243769407272339, 0.0008582472801208496, 0.0008921176195144653, 0.0009259879589080811, 0.0009598582983016968, 0.0009937286376953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 11.0, 14.0, 16.0, 13.0, 23.0, 39.0, 51.0, 91.0, 124.0, 152.0, 259.0, 362.0, 501.0, 768.0, 1072.0, 1670.0, 2570.0, 4233.0, 7364.0, 13400.0, 25690.0, 54222.0, 119218.0, 234953.0, 272051.0, 160756.0, 73813.0, 34349.0, 17124.0, 9267.0, 5229.0, 3196.0, 1999.0, 1306.0, 827.0, 562.0, 378.0, 264.0, 198.0, 112.0, 91.0, 67.0, 50.0, 38.0, 24.0, 13.0, 10.0, 9.0, 1.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.1328125, -11.7559814453125, -11.379150390625, -11.0023193359375, -10.62548828125, -10.2486572265625, -9.871826171875, -9.4949951171875, -9.1181640625, -8.7413330078125, -8.364501953125, -7.9876708984375, -7.61083984375, -7.2340087890625, -6.857177734375, -6.4803466796875, -6.103515625, -5.7266845703125, -5.349853515625, -4.9730224609375, -4.59619140625, -4.2193603515625, -3.842529296875, -3.4656982421875, -3.0888671875, -2.7120361328125, -2.335205078125, -1.9583740234375, -1.58154296875, -1.2047119140625, -0.827880859375, -0.4510498046875, -0.07421875, 0.3026123046875, 0.679443359375, 1.0562744140625, 1.43310546875, 1.8099365234375, 2.186767578125, 2.5635986328125, 2.9404296875, 3.3172607421875, 3.694091796875, 4.0709228515625, 4.44775390625, 4.8245849609375, 5.201416015625, 5.5782470703125, 5.955078125, 6.3319091796875, 6.708740234375, 7.0855712890625, 7.46240234375, 7.8392333984375, 8.216064453125, 8.5928955078125, 8.9697265625, 9.3465576171875, 9.723388671875, 10.1002197265625, 10.47705078125, 10.8538818359375, 11.230712890625, 11.6075439453125, 11.984375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 9.0, 10.0, 13.0, 15.0, 14.0, 22.0, 31.0, 34.0, 50.0, 53.0, 59.0, 52.0, 66.0, 59.0, 65.0, 65.0, 53.0, 58.0, 41.0, 46.0, 24.0, 30.0, 19.0, 18.0, 9.0, 11.0, 16.0, 11.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.73370361328125, -2.6314697265625, -2.52923583984375, -2.427001953125, -2.32476806640625, -2.2225341796875, -2.12030029296875, -2.01806640625, -1.91583251953125, -1.8135986328125, -1.71136474609375, -1.609130859375, -1.50689697265625, -1.4046630859375, -1.30242919921875, -1.2001953125, -1.09796142578125, -0.9957275390625, -0.89349365234375, -0.791259765625, -0.68902587890625, -0.5867919921875, -0.48455810546875, -0.38232421875, -0.28009033203125, -0.1778564453125, -0.07562255859375, 0.026611328125, 0.12884521484375, 0.2310791015625, 0.33331298828125, 0.435546875, 0.53778076171875, 0.6400146484375, 0.74224853515625, 0.844482421875, 0.94671630859375, 1.0489501953125, 1.15118408203125, 1.25341796875, 1.35565185546875, 1.4578857421875, 1.56011962890625, 1.662353515625, 1.76458740234375, 1.8668212890625, 1.96905517578125, 2.0712890625, 2.17352294921875, 2.2757568359375, 2.37799072265625, 2.480224609375, 2.58245849609375, 2.6846923828125, 2.78692626953125, 2.88916015625, 2.99139404296875, 3.0936279296875, 3.19586181640625, 3.298095703125, 3.40032958984375, 3.5025634765625, 3.60479736328125, 3.70703125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 3.0, 9.0, 9.0, 5.0, 14.0, 13.0, 31.0, 40.0, 49.0, 34.0, 61.0, 73.0, 93.0, 87.0, 80.0, 73.0, 70.0, 59.0, 50.0, 29.0, 33.0, 24.0, 21.0, 14.0, 9.0, 4.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.513336181640625, -39.43730163574219, -38.36126708984375, -37.28523635864258, -36.20920181274414, -35.1331672668457, -34.05713653564453, -32.981101989746094, -31.905067443847656, -30.82903289794922, -29.753000259399414, -28.67696762084961, -27.600933074951172, -26.524898529052734, -25.44886589050293, -24.372833251953125, -23.296798706054688, -22.22076416015625, -21.144731521606445, -20.06869888305664, -18.992664337158203, -17.916629791259766, -16.84059715270996, -15.76456356048584, -14.688529968261719, -13.612496376037598, -12.536462783813477, -11.460429191589355, -10.384395599365234, -9.308362007141113, -8.232328414916992, -7.156294822692871, -6.080257415771484, -5.004223823547363, -3.928190231323242, -2.852156639099121, -1.776123046875, -0.7000894546508789, 0.3759441375732422, 1.4519777297973633, 2.5280113220214844, 3.6040449142456055, 4.680078506469727, 5.756112098693848, 6.832145690917969, 7.90817928314209, 8.984212875366211, 10.060246467590332, 11.136280059814453, 12.212313652038574, 13.288347244262695, 14.364380836486816, 15.440414428710938, 16.516448974609375, 17.59248161315918, 18.668514251708984, 19.744548797607422, 20.82058334350586, 21.896615982055664, 22.97264862060547, 24.048683166503906, 25.124717712402344, 26.20075035095215, 27.276782989501953, 28.35281753540039]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 12.0, 8.0, 15.0, 10.0, 14.0, 8.0, 18.0, 18.0, 20.0, 29.0, 27.0, 32.0, 28.0, 33.0, 38.0, 31.0, 39.0, 54.0, 48.0, 33.0, 41.0, 31.0, 41.0, 49.0, 39.0, 35.0, 28.0, 21.0, 24.0, 19.0, 15.0, 25.0, 18.0, 16.0, 17.0, 11.0, 13.0, 6.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-20.40717124938965, -19.779266357421875, -19.15135955810547, -18.523454666137695, -17.895549774169922, -17.267642974853516, -16.639738082885742, -16.01183319091797, -15.383927345275879, -14.756021499633789, -14.128116607666016, -13.500210762023926, -12.872304916381836, -12.244400024414062, -11.616494178771973, -10.988588333129883, -10.36068344116211, -9.73277759552002, -9.104872703552246, -8.476966857910156, -7.849061489105225, -7.221156120300293, -6.593250274658203, -5.9653449058532715, -5.33743953704834, -4.709534168243408, -4.081628799438477, -3.4537229537963867, -2.825817584991455, -2.1979122161865234, -1.5700066089630127, -0.942101001739502, -0.3141975402832031, 0.31370794773101807, 0.9416134357452393, 1.5695189237594604, 2.1974244117736816, 2.8253297805786133, 3.453235387802124, 4.081140995025635, 4.709046363830566, 5.336951732635498, 5.96485710144043, 6.5927629470825195, 7.220668315887451, 7.848573684692383, 8.476479530334473, 9.104385375976562, 9.732290267944336, 10.360196113586426, 10.9881010055542, 11.616006851196289, 12.243911743164062, 12.871817588806152, 13.499723434448242, 14.127628326416016, 14.755534172058105, 15.383440017700195, 16.01134490966797, 16.639249801635742, 17.26715660095215, 17.895061492919922, 18.522966384887695, 19.1508731842041, 19.778778076171875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 16.0, 20.0, 32.0, 28.0, 46.0, 77.0, 113.0, 175.0, 243.0, 429.0, 647.0, 977.0, 1543.0, 2396.0, 3931.0, 6232.0, 10146.0, 16175.0, 27403.0, 45848.0, 76744.0, 123715.0, 172745.0, 182832.0, 142887.0, 92821.0, 55655.0, 32676.0, 19908.0, 12131.0, 7456.0, 4555.0, 2893.0, 1793.0, 1184.0, 725.0, 501.0, 318.0, 179.0, 105.0, 85.0, 61.0, 47.0, 24.0, 11.0, 13.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.73876953125, -25.7900390625, -24.84130859375, -23.892578125, -22.94384765625, -21.9951171875, -21.04638671875, -20.09765625, -19.14892578125, -18.2001953125, -17.25146484375, -16.302734375, -15.35400390625, -14.4052734375, -13.45654296875, -12.5078125, -11.55908203125, -10.6103515625, -9.66162109375, -8.712890625, -7.76416015625, -6.8154296875, -5.86669921875, -4.91796875, -3.96923828125, -3.0205078125, -2.07177734375, -1.123046875, -0.17431640625, 0.7744140625, 1.72314453125, 2.671875, 3.62060546875, 4.5693359375, 5.51806640625, 6.466796875, 7.41552734375, 8.3642578125, 9.31298828125, 10.26171875, 11.21044921875, 12.1591796875, 13.10791015625, 14.056640625, 15.00537109375, 15.9541015625, 16.90283203125, 17.8515625, 18.80029296875, 19.7490234375, 20.69775390625, 21.646484375, 22.59521484375, 23.5439453125, 24.49267578125, 25.44140625, 26.39013671875, 27.3388671875, 28.28759765625, 29.236328125, 30.18505859375, 31.1337890625, 32.08251953125, 33.03125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 11.0, 4.0, 9.0, 12.0, 11.0, 17.0, 19.0, 22.0, 23.0, 23.0, 31.0, 30.0, 42.0, 37.0, 38.0, 33.0, 39.0, 43.0, 43.0, 32.0, 43.0, 44.0, 49.0, 35.0, 31.0, 32.0, 22.0, 37.0, 18.0, 17.0, 23.0, 14.0, 12.0, 16.0, 16.0, 16.0, 11.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -17.97802734375, -17.3779296875, -16.77783203125, -16.177734375, -15.57763671875, -14.9775390625, -14.37744140625, -13.77734375, -13.17724609375, -12.5771484375, -11.97705078125, -11.376953125, -10.77685546875, -10.1767578125, -9.57666015625, -8.9765625, -8.37646484375, -7.7763671875, -7.17626953125, -6.576171875, -5.97607421875, -5.3759765625, -4.77587890625, -4.17578125, -3.57568359375, -2.9755859375, -2.37548828125, -1.775390625, -1.17529296875, -0.5751953125, 0.02490234375, 0.625, 1.22509765625, 1.8251953125, 2.42529296875, 3.025390625, 3.62548828125, 4.2255859375, 4.82568359375, 5.42578125, 6.02587890625, 6.6259765625, 7.22607421875, 7.826171875, 8.42626953125, 9.0263671875, 9.62646484375, 10.2265625, 10.82666015625, 11.4267578125, 12.02685546875, 12.626953125, 13.22705078125, 13.8271484375, 14.42724609375, 15.02734375, 15.62744140625, 16.2275390625, 16.82763671875, 17.427734375, 18.02783203125, 18.6279296875, 19.22802734375, 19.828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 13.0, 12.0, 20.0, 34.0, 66.0, 72.0, 118.0, 179.0, 231.0, 370.0, 583.0, 871.0, 1276.0, 1920.0, 3077.0, 4805.0, 7528.0, 11822.0, 19135.0, 31268.0, 49780.0, 77373.0, 115421.0, 151244.0, 162121.0, 137984.0, 98403.0, 63831.0, 40489.0, 25328.0, 15767.0, 9891.0, 6105.0, 3936.0, 2562.0, 1672.0, 1080.0, 669.0, 498.0, 321.0, 210.0, 153.0, 94.0, 82.0, 51.0, 22.0, 20.0, 12.0, 13.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.953125, -22.219482421875, -21.48583984375, -20.752197265625, -20.0185546875, -19.284912109375, -18.55126953125, -17.817626953125, -17.083984375, -16.350341796875, -15.61669921875, -14.883056640625, -14.1494140625, -13.415771484375, -12.68212890625, -11.948486328125, -11.21484375, -10.481201171875, -9.74755859375, -9.013916015625, -8.2802734375, -7.546630859375, -6.81298828125, -6.079345703125, -5.345703125, -4.612060546875, -3.87841796875, -3.144775390625, -2.4111328125, -1.677490234375, -0.94384765625, -0.210205078125, 0.5234375, 1.257080078125, 1.99072265625, 2.724365234375, 3.4580078125, 4.191650390625, 4.92529296875, 5.658935546875, 6.392578125, 7.126220703125, 7.85986328125, 8.593505859375, 9.3271484375, 10.060791015625, 10.79443359375, 11.528076171875, 12.26171875, 12.995361328125, 13.72900390625, 14.462646484375, 15.1962890625, 15.929931640625, 16.66357421875, 17.397216796875, 18.130859375, 18.864501953125, 19.59814453125, 20.331787109375, 21.0654296875, 21.799072265625, 22.53271484375, 23.266357421875, 24.0]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 11.0, 15.0, 10.0, 17.0, 19.0, 21.0, 19.0, 32.0, 31.0, 32.0, 38.0, 41.0, 43.0, 43.0, 50.0, 48.0, 48.0, 50.0, 48.0, 41.0, 41.0, 38.0, 39.0, 34.0, 37.0, 29.0, 11.0, 18.0, 16.0, 20.0, 13.0, 7.0, 5.0, 9.0, 7.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.2254638671875, -9.802490234375, -9.3795166015625, -8.95654296875, -8.5335693359375, -8.110595703125, -7.6876220703125, -7.2646484375, -6.8416748046875, -6.418701171875, -5.9957275390625, -5.57275390625, -5.1497802734375, -4.726806640625, -4.3038330078125, -3.880859375, -3.4578857421875, -3.034912109375, -2.6119384765625, -2.18896484375, -1.7659912109375, -1.343017578125, -0.9200439453125, -0.4970703125, -0.0740966796875, 0.348876953125, 0.7718505859375, 1.19482421875, 1.6177978515625, 2.040771484375, 2.4637451171875, 2.88671875, 3.3096923828125, 3.732666015625, 4.1556396484375, 4.57861328125, 5.0015869140625, 5.424560546875, 5.8475341796875, 6.2705078125, 6.6934814453125, 7.116455078125, 7.5394287109375, 7.96240234375, 8.3853759765625, 8.808349609375, 9.2313232421875, 9.654296875, 10.0772705078125, 10.500244140625, 10.9232177734375, 11.34619140625, 11.7691650390625, 12.192138671875, 12.6151123046875, 13.0380859375, 13.4610595703125, 13.884033203125, 14.3070068359375, 14.72998046875, 15.1529541015625, 15.575927734375, 15.9989013671875, 16.421875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 7.0, 4.0, 5.0, 9.0, 20.0, 25.0, 35.0, 52.0, 69.0, 104.0, 147.0, 234.0, 352.0, 525.0, 812.0, 1383.0, 2230.0, 3573.0, 6153.0, 10407.0, 19143.0, 37192.0, 77164.0, 160943.0, 264611.0, 226710.0, 117714.0, 55671.0, 27557.0, 14873.0, 8194.0, 4789.0, 2904.0, 1729.0, 1145.0, 664.0, 456.0, 296.0, 203.0, 149.0, 106.0, 60.0, 51.0, 34.0, 13.0, 16.0, 13.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.53125, -22.834716796875, -22.13818359375, -21.441650390625, -20.7451171875, -20.048583984375, -19.35205078125, -18.655517578125, -17.958984375, -17.262451171875, -16.56591796875, -15.869384765625, -15.1728515625, -14.476318359375, -13.77978515625, -13.083251953125, -12.38671875, -11.690185546875, -10.99365234375, -10.297119140625, -9.6005859375, -8.904052734375, -8.20751953125, -7.510986328125, -6.814453125, -6.117919921875, -5.42138671875, -4.724853515625, -4.0283203125, -3.331787109375, -2.63525390625, -1.938720703125, -1.2421875, -0.545654296875, 0.15087890625, 0.847412109375, 1.5439453125, 2.240478515625, 2.93701171875, 3.633544921875, 4.330078125, 5.026611328125, 5.72314453125, 6.419677734375, 7.1162109375, 7.812744140625, 8.50927734375, 9.205810546875, 9.90234375, 10.598876953125, 11.29541015625, 11.991943359375, 12.6884765625, 13.385009765625, 14.08154296875, 14.778076171875, 15.474609375, 16.171142578125, 16.86767578125, 17.564208984375, 18.2607421875, 18.957275390625, 19.65380859375, 20.350341796875, 21.046875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 10.0, 6.0, 5.0, 13.0, 12.0, 16.0, 16.0, 24.0, 42.0, 52.0, 60.0, 79.0, 85.0, 101.0, 93.0, 86.0, 65.0, 53.0, 52.0, 30.0, 29.0, 24.0, 15.0, 7.0, 5.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00269317626953125, -0.0026217252016067505, -0.002550274133682251, -0.0024788230657577515, -0.002407371997833252, -0.0023359209299087524, -0.002264469861984253, -0.0021930187940597534, -0.002121567726135254, -0.0020501166582107544, -0.001978665590286255, -0.0019072145223617554, -0.0018357634544372559, -0.0017643123865127563, -0.0016928613185882568, -0.0016214102506637573, -0.0015499591827392578, -0.0014785081148147583, -0.0014070570468902588, -0.0013356059789657593, -0.0012641549110412598, -0.0011927038431167603, -0.0011212527751922607, -0.0010498017072677612, -0.0009783506393432617, -0.0009068995714187622, -0.0008354485034942627, -0.0007639974355697632, -0.0006925463676452637, -0.0006210952997207642, -0.0005496442317962646, -0.00047819316387176514, -0.0004067420959472656, -0.0003352910280227661, -0.0002638399600982666, -0.0001923888921737671, -0.00012093782424926758, -4.9486756324768066e-05, 2.1964311599731445e-05, 9.341537952423096e-05, 0.00016486644744873047, 0.00023631751537322998, 0.0003077685832977295, 0.000379219651222229, 0.0004506707191467285, 0.000522121787071228, 0.0005935728549957275, 0.000665023922920227, 0.0007364749908447266, 0.0008079260587692261, 0.0008793771266937256, 0.0009508281946182251, 0.0010222792625427246, 0.0010937303304672241, 0.0011651813983917236, 0.0012366324663162231, 0.0013080835342407227, 0.0013795346021652222, 0.0014509856700897217, 0.0015224367380142212, 0.0015938878059387207, 0.0016653388738632202, 0.0017367899417877197, 0.0018082410097122192, 0.0018796920776367188]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 11.0, 11.0, 8.0, 16.0, 34.0, 47.0, 55.0, 93.0, 136.0, 191.0, 283.0, 439.0, 702.0, 1083.0, 1669.0, 2775.0, 4676.0, 7957.0, 13626.0, 25774.0, 50356.0, 101901.0, 192673.0, 257301.0, 185043.0, 96316.0, 48224.0, 24604.0, 13307.0, 7433.0, 4434.0, 2781.0, 1601.0, 1015.0, 673.0, 438.0, 267.0, 194.0, 137.0, 77.0, 63.0, 43.0, 22.0, 19.0, 17.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-21.96875, -21.331298828125, -20.69384765625, -20.056396484375, -19.4189453125, -18.781494140625, -18.14404296875, -17.506591796875, -16.869140625, -16.231689453125, -15.59423828125, -14.956787109375, -14.3193359375, -13.681884765625, -13.04443359375, -12.406982421875, -11.76953125, -11.132080078125, -10.49462890625, -9.857177734375, -9.2197265625, -8.582275390625, -7.94482421875, -7.307373046875, -6.669921875, -6.032470703125, -5.39501953125, -4.757568359375, -4.1201171875, -3.482666015625, -2.84521484375, -2.207763671875, -1.5703125, -0.932861328125, -0.29541015625, 0.342041015625, 0.9794921875, 1.616943359375, 2.25439453125, 2.891845703125, 3.529296875, 4.166748046875, 4.80419921875, 5.441650390625, 6.0791015625, 6.716552734375, 7.35400390625, 7.991455078125, 8.62890625, 9.266357421875, 9.90380859375, 10.541259765625, 11.1787109375, 11.816162109375, 12.45361328125, 13.091064453125, 13.728515625, 14.365966796875, 15.00341796875, 15.640869140625, 16.2783203125, 16.915771484375, 17.55322265625, 18.190673828125, 18.828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 3.0, 7.0, 13.0, 6.0, 22.0, 13.0, 20.0, 29.0, 23.0, 30.0, 42.0, 53.0, 46.0, 52.0, 80.0, 67.0, 48.0, 67.0, 54.0, 50.0, 55.0, 43.0, 30.0, 27.0, 25.0, 21.0, 9.0, 9.0, 12.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.66668701171875, -6.4622802734375, -6.25787353515625, -6.053466796875, -5.84906005859375, -5.6446533203125, -5.44024658203125, -5.23583984375, -5.03143310546875, -4.8270263671875, -4.62261962890625, -4.418212890625, -4.21380615234375, -4.0093994140625, -3.80499267578125, -3.6005859375, -3.39617919921875, -3.1917724609375, -2.98736572265625, -2.782958984375, -2.57855224609375, -2.3741455078125, -2.16973876953125, -1.96533203125, -1.76092529296875, -1.5565185546875, -1.35211181640625, -1.147705078125, -0.94329833984375, -0.7388916015625, -0.53448486328125, -0.330078125, -0.12567138671875, 0.0787353515625, 0.28314208984375, 0.487548828125, 0.69195556640625, 0.8963623046875, 1.10076904296875, 1.30517578125, 1.50958251953125, 1.7139892578125, 1.91839599609375, 2.122802734375, 2.32720947265625, 2.5316162109375, 2.73602294921875, 2.9404296875, 3.14483642578125, 3.3492431640625, 3.55364990234375, 3.758056640625, 3.96246337890625, 4.1668701171875, 4.37127685546875, 4.57568359375, 4.78009033203125, 4.9844970703125, 5.18890380859375, 5.393310546875, 5.59771728515625, 5.8021240234375, 6.00653076171875, 6.2109375]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 2.0, 6.0, 9.0, 10.0, 13.0, 14.0, 18.0, 12.0, 22.0, 46.0, 45.0, 58.0, 63.0, 48.0, 61.0, 65.0, 71.0, 68.0, 69.0, 51.0, 38.0, 48.0, 35.0, 31.0, 20.0, 25.0, 18.0, 8.0, 10.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-32.1630973815918, -31.305805206298828, -30.448514938354492, -29.591222763061523, -28.733930587768555, -27.87664031982422, -27.01934814453125, -26.16205596923828, -25.304763793945312, -24.447471618652344, -23.590181350708008, -22.73288917541504, -21.87559700012207, -21.018306732177734, -20.161014556884766, -19.303722381591797, -18.44643211364746, -17.589139938354492, -16.731849670410156, -15.874557495117188, -15.017265319824219, -14.159974098205566, -13.302682876586914, -12.445390701293945, -11.588099479675293, -10.73080825805664, -9.873516082763672, -9.01622486114502, -8.158933639526367, -7.301641464233398, -6.444350242614746, -5.5870585441589355, -4.729764938354492, -3.8724732398986816, -3.01518177986145, -2.1578903198242188, -1.3005986213684082, -0.44330692291259766, 0.4139842987060547, 1.2712759971618652, 2.128567695617676, 2.9858593940734863, 3.8431508541107178, 4.700442314147949, 5.55773401260376, 6.41502571105957, 7.272316932678223, 8.129608154296875, 8.986900329589844, 9.844191551208496, 10.701483726501465, 11.558774948120117, 12.416067123413086, 13.273358345031738, 14.13064956665039, 14.98794174194336, 15.845232963562012, 16.702524185180664, 17.559816360473633, 18.41710662841797, 19.274398803710938, 20.131690979003906, 20.988983154296875, 21.84627342224121, 22.70356559753418]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 7.0, 8.0, 18.0, 8.0, 18.0, 14.0, 17.0, 16.0, 25.0, 23.0, 37.0, 31.0, 44.0, 41.0, 41.0, 40.0, 33.0, 42.0, 36.0, 38.0, 32.0, 32.0, 35.0, 26.0, 29.0, 27.0, 24.0, 26.0, 24.0, 28.0, 23.0, 29.0, 15.0, 16.0, 12.0, 13.0, 9.0, 7.0, 8.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-17.78821563720703, -17.234272003173828, -16.680328369140625, -16.126384735107422, -15.572442054748535, -15.018498420715332, -14.464555740356445, -13.910612106323242, -13.356668472290039, -12.802724838256836, -12.248781204223633, -11.694838523864746, -11.140894889831543, -10.58695125579834, -10.033008575439453, -9.47906494140625, -8.925121307373047, -8.371177673339844, -7.817234516143799, -7.263291358947754, -6.709347724914551, -6.155404090881348, -5.601460933685303, -5.047517776489258, -4.493574142456055, -3.9396307468414307, -3.3856873512268066, -2.8317439556121826, -2.2778005599975586, -1.7238571643829346, -1.1699137687683105, -0.6159703731536865, -0.0620269775390625, 0.4919164180755615, 1.0458598136901855, 1.5998032093048096, 2.1537466049194336, 2.7076900005340576, 3.2616333961486816, 3.8155767917633057, 4.36952018737793, 4.923463821411133, 5.477406978607178, 6.031350135803223, 6.585293769836426, 7.139237403869629, 7.693180561065674, 8.247123718261719, 8.801067352294922, 9.355010986328125, 9.908954620361328, 10.462897300720215, 11.016840934753418, 11.570784568786621, 12.124727249145508, 12.678670883178711, 13.232614517211914, 13.786558151245117, 14.34050178527832, 14.894444465637207, 15.44838809967041, 16.002330780029297, 16.5562744140625, 17.110218048095703, 17.664161682128906]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 20.0, 21.0, 35.0, 41.0, 82.0, 139.0, 164.0, 237.0, 354.0, 595.0, 874.0, 1330.0, 2048.0, 3266.0, 5453.0, 8833.0, 14703.0, 25698.0, 48105.0, 96546.0, 220211.0, 557134.0, 1167312.0, 1130109.0, 513901.0, 201722.0, 89836.0, 44741.0, 24489.0, 14045.0, 8367.0, 5032.0, 3131.0, 1989.0, 1262.0, 807.0, 571.0, 366.0, 215.0, 159.0, 104.0, 74.0, 43.0, 32.0, 22.0, 18.0, 13.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-26.0625, -25.271728515625, -24.48095703125, -23.690185546875, -22.8994140625, -22.108642578125, -21.31787109375, -20.527099609375, -19.736328125, -18.945556640625, -18.15478515625, -17.364013671875, -16.5732421875, -15.782470703125, -14.99169921875, -14.200927734375, -13.41015625, -12.619384765625, -11.82861328125, -11.037841796875, -10.2470703125, -9.456298828125, -8.66552734375, -7.874755859375, -7.083984375, -6.293212890625, -5.50244140625, -4.711669921875, -3.9208984375, -3.130126953125, -2.33935546875, -1.548583984375, -0.7578125, 0.032958984375, 0.82373046875, 1.614501953125, 2.4052734375, 3.196044921875, 3.98681640625, 4.777587890625, 5.568359375, 6.359130859375, 7.14990234375, 7.940673828125, 8.7314453125, 9.522216796875, 10.31298828125, 11.103759765625, 11.89453125, 12.685302734375, 13.47607421875, 14.266845703125, 15.0576171875, 15.848388671875, 16.63916015625, 17.429931640625, 18.220703125, 19.011474609375, 19.80224609375, 20.593017578125, 21.3837890625, 22.174560546875, 22.96533203125, 23.756103515625, 24.546875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 9.0, 13.0, 16.0, 13.0, 25.0, 20.0, 24.0, 33.0, 32.0, 41.0, 38.0, 40.0, 50.0, 41.0, 54.0, 50.0, 39.0, 36.0, 30.0, 33.0, 34.0, 35.0, 26.0, 31.0, 34.0, 34.0, 20.0, 22.0, 19.0, 15.0, 12.0, 12.0, 5.0, 6.0, 8.0, 5.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5234375, -13.101318359375, -12.67919921875, -12.257080078125, -11.8349609375, -11.412841796875, -10.99072265625, -10.568603515625, -10.146484375, -9.724365234375, -9.30224609375, -8.880126953125, -8.4580078125, -8.035888671875, -7.61376953125, -7.191650390625, -6.76953125, -6.347412109375, -5.92529296875, -5.503173828125, -5.0810546875, -4.658935546875, -4.23681640625, -3.814697265625, -3.392578125, -2.970458984375, -2.54833984375, -2.126220703125, -1.7041015625, -1.281982421875, -0.85986328125, -0.437744140625, -0.015625, 0.406494140625, 0.82861328125, 1.250732421875, 1.6728515625, 2.094970703125, 2.51708984375, 2.939208984375, 3.361328125, 3.783447265625, 4.20556640625, 4.627685546875, 5.0498046875, 5.471923828125, 5.89404296875, 6.316162109375, 6.73828125, 7.160400390625, 7.58251953125, 8.004638671875, 8.4267578125, 8.848876953125, 9.27099609375, 9.693115234375, 10.115234375, 10.537353515625, 10.95947265625, 11.381591796875, 11.8037109375, 12.225830078125, 12.64794921875, 13.070068359375, 13.4921875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 4.0, 8.0, 9.0, 12.0, 16.0, 29.0, 52.0, 66.0, 115.0, 224.0, 351.0, 606.0, 1023.0, 1796.0, 3257.0, 5905.0, 11205.0, 21617.0, 44142.0, 94207.0, 216346.0, 521327.0, 1134760.0, 1168347.0, 548569.0, 227556.0, 98537.0, 46148.0, 22769.0, 11556.0, 6092.0, 3263.0, 1819.0, 985.0, 615.0, 352.0, 205.0, 130.0, 105.0, 53.0, 30.0, 26.0, 21.0, 16.0, 10.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.125, -23.232421875, -22.33984375, -21.447265625, -20.5546875, -19.662109375, -18.76953125, -17.876953125, -16.984375, -16.091796875, -15.19921875, -14.306640625, -13.4140625, -12.521484375, -11.62890625, -10.736328125, -9.84375, -8.951171875, -8.05859375, -7.166015625, -6.2734375, -5.380859375, -4.48828125, -3.595703125, -2.703125, -1.810546875, -0.91796875, -0.025390625, 0.8671875, 1.759765625, 2.65234375, 3.544921875, 4.4375, 5.330078125, 6.22265625, 7.115234375, 8.0078125, 8.900390625, 9.79296875, 10.685546875, 11.578125, 12.470703125, 13.36328125, 14.255859375, 15.1484375, 16.041015625, 16.93359375, 17.826171875, 18.71875, 19.611328125, 20.50390625, 21.396484375, 22.2890625, 23.181640625, 24.07421875, 24.966796875, 25.859375, 26.751953125, 27.64453125, 28.537109375, 29.4296875, 30.322265625, 31.21484375, 32.107421875, 33.0]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 12.0, 8.0, 9.0, 9.0, 16.0, 12.0, 22.0, 21.0, 30.0, 34.0, 52.0, 68.0, 70.0, 86.0, 117.0, 132.0, 173.0, 230.0, 288.0, 293.0, 329.0, 300.0, 268.0, 241.0, 255.0, 190.0, 160.0, 153.0, 109.0, 91.0, 70.0, 52.0, 37.0, 32.0, 23.0, 21.0, 18.0, 11.0, 10.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.15625, -8.902587890625, -8.64892578125, -8.395263671875, -8.1416015625, -7.887939453125, -7.63427734375, -7.380615234375, -7.126953125, -6.873291015625, -6.61962890625, -6.365966796875, -6.1123046875, -5.858642578125, -5.60498046875, -5.351318359375, -5.09765625, -4.843994140625, -4.59033203125, -4.336669921875, -4.0830078125, -3.829345703125, -3.57568359375, -3.322021484375, -3.068359375, -2.814697265625, -2.56103515625, -2.307373046875, -2.0537109375, -1.800048828125, -1.54638671875, -1.292724609375, -1.0390625, -0.785400390625, -0.53173828125, -0.278076171875, -0.0244140625, 0.229248046875, 0.48291015625, 0.736572265625, 0.990234375, 1.243896484375, 1.49755859375, 1.751220703125, 2.0048828125, 2.258544921875, 2.51220703125, 2.765869140625, 3.01953125, 3.273193359375, 3.52685546875, 3.780517578125, 4.0341796875, 4.287841796875, 4.54150390625, 4.795166015625, 5.048828125, 5.302490234375, 5.55615234375, 5.809814453125, 6.0634765625, 6.317138671875, 6.57080078125, 6.824462890625, 7.078125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 10.0, 6.0, 5.0, 14.0, 12.0, 18.0, 24.0, 26.0, 40.0, 41.0, 39.0, 59.0, 60.0, 87.0, 77.0, 60.0, 58.0, 72.0, 59.0, 54.0, 35.0, 36.0, 26.0, 16.0, 17.0, 12.0, 11.0, 6.0, 5.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.712608337402344, -28.87921142578125, -28.04581642150879, -27.212419509887695, -26.379024505615234, -25.54562759399414, -24.712230682373047, -23.878833770751953, -23.045438766479492, -22.2120418548584, -21.378646850585938, -20.545249938964844, -19.71185302734375, -18.87845802307129, -18.045061111450195, -17.211666107177734, -16.37826919555664, -15.544873237609863, -14.711477279663086, -13.878080368041992, -13.044684410095215, -12.211288452148438, -11.377891540527344, -10.544495582580566, -9.711099624633789, -8.877703666687012, -8.044307708740234, -7.210910797119141, -6.377514839172363, -5.544118881225586, -4.71072244644165, -3.877326011657715, -3.0439319610595703, -2.210535764694214, -1.3771395683288574, -0.543743371963501, 0.28965282440185547, 1.1230487823486328, 1.9564452171325684, 2.789841651916504, 3.6232376098632812, 4.456633567810059, 5.290030002593994, 6.12342643737793, 6.956822395324707, 7.790218353271484, 8.623615264892578, 9.457011222839355, 10.290407180786133, 11.12380313873291, 11.957199096679688, 12.790596008300781, 13.623991966247559, 14.457387924194336, 15.29078483581543, 16.12417984008789, 16.957576751708984, 17.790973663330078, 18.62436866760254, 19.457765579223633, 20.291160583496094, 21.124557495117188, 21.95795440673828, 22.791351318359375, 23.624746322631836]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 12.0, 10.0, 9.0, 21.0, 18.0, 24.0, 31.0, 28.0, 34.0, 34.0, 37.0, 33.0, 48.0, 35.0, 43.0, 34.0, 40.0, 39.0, 48.0, 37.0, 43.0, 38.0, 29.0, 36.0, 38.0, 20.0, 24.0, 22.0, 30.0, 8.0, 9.0, 9.0, 13.0, 9.0, 9.0, 6.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-20.108001708984375, -19.531063079833984, -18.954124450683594, -18.377185821533203, -17.800247192382812, -17.223308563232422, -16.64636993408203, -16.06943130493164, -15.49249267578125, -14.91555404663086, -14.338615417480469, -13.761676788330078, -13.184738159179688, -12.607799530029297, -12.030860900878906, -11.453922271728516, -10.876983642578125, -10.300045013427734, -9.723106384277344, -9.146167755126953, -8.569229125976562, -7.992290496826172, -7.415351867675781, -6.838413238525391, -6.261474609375, -5.684535980224609, -5.107597351074219, -4.530658721923828, -3.9537200927734375, -3.376781463623047, -2.7998428344726562, -2.2229042053222656, -1.6459636688232422, -1.0690250396728516, -0.49208641052246094, 0.08485221862792969, 0.6617908477783203, 1.238729476928711, 1.8156681060791016, 2.392606735229492, 2.969545364379883, 3.5464839935302734, 4.123422622680664, 4.700361251831055, 5.277299880981445, 5.854238510131836, 6.431177139282227, 7.008115768432617, 7.585054397583008, 8.161993026733398, 8.738931655883789, 9.31587028503418, 9.89280891418457, 10.469747543334961, 11.046686172485352, 11.623624801635742, 12.200563430786133, 12.777502059936523, 13.354440689086914, 13.931379318237305, 14.508317947387695, 15.085256576538086, 15.662195205688477, 16.239133834838867, 16.816072463989258]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 11.0, 7.0, 19.0, 20.0, 24.0, 37.0, 43.0, 92.0, 107.0, 189.0, 240.0, 373.0, 525.0, 824.0, 1223.0, 1852.0, 2842.0, 4515.0, 7333.0, 11935.0, 19965.0, 33961.0, 58546.0, 100311.0, 159969.0, 203569.0, 171763.0, 110043.0, 64046.0, 36835.0, 21892.0, 13018.0, 8066.0, 5043.0, 3268.0, 2022.0, 1358.0, 877.0, 570.0, 402.0, 263.0, 178.0, 121.0, 85.0, 56.0, 43.0, 22.0, 24.0, 16.0, 6.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.8125, -16.296630859375, -15.78076171875, -15.264892578125, -14.7490234375, -14.233154296875, -13.71728515625, -13.201416015625, -12.685546875, -12.169677734375, -11.65380859375, -11.137939453125, -10.6220703125, -10.106201171875, -9.59033203125, -9.074462890625, -8.55859375, -8.042724609375, -7.52685546875, -7.010986328125, -6.4951171875, -5.979248046875, -5.46337890625, -4.947509765625, -4.431640625, -3.915771484375, -3.39990234375, -2.884033203125, -2.3681640625, -1.852294921875, -1.33642578125, -0.820556640625, -0.3046875, 0.211181640625, 0.72705078125, 1.242919921875, 1.7587890625, 2.274658203125, 2.79052734375, 3.306396484375, 3.822265625, 4.338134765625, 4.85400390625, 5.369873046875, 5.8857421875, 6.401611328125, 6.91748046875, 7.433349609375, 7.94921875, 8.465087890625, 8.98095703125, 9.496826171875, 10.0126953125, 10.528564453125, 11.04443359375, 11.560302734375, 12.076171875, 12.592041015625, 13.10791015625, 13.623779296875, 14.1396484375, 14.655517578125, 15.17138671875, 15.687255859375, 16.203125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 8.0, 9.0, 15.0, 11.0, 17.0, 24.0, 25.0, 20.0, 25.0, 35.0, 24.0, 38.0, 31.0, 40.0, 45.0, 49.0, 37.0, 49.0, 45.0, 39.0, 40.0, 43.0, 26.0, 39.0, 36.0, 24.0, 30.0, 30.0, 20.0, 17.0, 21.0, 9.0, 8.0, 15.0, 4.0, 8.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-19.171875, -18.59033203125, -18.0087890625, -17.42724609375, -16.845703125, -16.26416015625, -15.6826171875, -15.10107421875, -14.51953125, -13.93798828125, -13.3564453125, -12.77490234375, -12.193359375, -11.61181640625, -11.0302734375, -10.44873046875, -9.8671875, -9.28564453125, -8.7041015625, -8.12255859375, -7.541015625, -6.95947265625, -6.3779296875, -5.79638671875, -5.21484375, -4.63330078125, -4.0517578125, -3.47021484375, -2.888671875, -2.30712890625, -1.7255859375, -1.14404296875, -0.5625, 0.01904296875, 0.6005859375, 1.18212890625, 1.763671875, 2.34521484375, 2.9267578125, 3.50830078125, 4.08984375, 4.67138671875, 5.2529296875, 5.83447265625, 6.416015625, 6.99755859375, 7.5791015625, 8.16064453125, 8.7421875, 9.32373046875, 9.9052734375, 10.48681640625, 11.068359375, 11.64990234375, 12.2314453125, 12.81298828125, 13.39453125, 13.97607421875, 14.5576171875, 15.13916015625, 15.720703125, 16.30224609375, 16.8837890625, 17.46533203125, 18.046875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 9.0, 12.0, 7.0, 20.0, 21.0, 33.0, 47.0, 59.0, 107.0, 148.0, 217.0, 313.0, 488.0, 825.0, 1360.0, 2410.0, 4568.0, 9438.0, 22417.0, 63936.0, 219168.0, 442618.0, 186738.0, 55408.0, 19963.0, 8310.0, 4167.0, 2220.0, 1309.0, 768.0, 474.0, 301.0, 195.0, 150.0, 95.0, 78.0, 42.0, 34.0, 24.0, 17.0, 10.0, 6.0, 9.0, 3.0, 0.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-39.65625, -38.47021484375, -37.2841796875, -36.09814453125, -34.912109375, -33.72607421875, -32.5400390625, -31.35400390625, -30.16796875, -28.98193359375, -27.7958984375, -26.60986328125, -25.423828125, -24.23779296875, -23.0517578125, -21.86572265625, -20.6796875, -19.49365234375, -18.3076171875, -17.12158203125, -15.935546875, -14.74951171875, -13.5634765625, -12.37744140625, -11.19140625, -10.00537109375, -8.8193359375, -7.63330078125, -6.447265625, -5.26123046875, -4.0751953125, -2.88916015625, -1.703125, -0.51708984375, 0.6689453125, 1.85498046875, 3.041015625, 4.22705078125, 5.4130859375, 6.59912109375, 7.78515625, 8.97119140625, 10.1572265625, 11.34326171875, 12.529296875, 13.71533203125, 14.9013671875, 16.08740234375, 17.2734375, 18.45947265625, 19.6455078125, 20.83154296875, 22.017578125, 23.20361328125, 24.3896484375, 25.57568359375, 26.76171875, 27.94775390625, 29.1337890625, 30.31982421875, 31.505859375, 32.69189453125, 33.8779296875, 35.06396484375, 36.25]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 5.0, 6.0, 7.0, 5.0, 12.0, 11.0, 13.0, 11.0, 25.0, 18.0, 22.0, 31.0, 41.0, 37.0, 49.0, 22.0, 38.0, 40.0, 38.0, 47.0, 29.0, 32.0, 41.0, 41.0, 48.0, 29.0, 33.0, 38.0, 42.0, 23.0, 21.0, 26.0, 16.0, 11.0, 11.0, 18.0, 13.0, 7.0, 10.0, 6.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.3565673828125, -9.033447265625, -8.7103271484375, -8.38720703125, -8.0640869140625, -7.740966796875, -7.4178466796875, -7.0947265625, -6.7716064453125, -6.448486328125, -6.1253662109375, -5.80224609375, -5.4791259765625, -5.156005859375, -4.8328857421875, -4.509765625, -4.1866455078125, -3.863525390625, -3.5404052734375, -3.21728515625, -2.8941650390625, -2.571044921875, -2.2479248046875, -1.9248046875, -1.6016845703125, -1.278564453125, -0.9554443359375, -0.63232421875, -0.3092041015625, 0.013916015625, 0.3370361328125, 0.66015625, 0.9832763671875, 1.306396484375, 1.6295166015625, 1.95263671875, 2.2757568359375, 2.598876953125, 2.9219970703125, 3.2451171875, 3.5682373046875, 3.891357421875, 4.2144775390625, 4.53759765625, 4.8607177734375, 5.183837890625, 5.5069580078125, 5.830078125, 6.1531982421875, 6.476318359375, 6.7994384765625, 7.12255859375, 7.4456787109375, 7.768798828125, 8.0919189453125, 8.4150390625, 8.7381591796875, 9.061279296875, 9.3843994140625, 9.70751953125, 10.0306396484375, 10.353759765625, 10.6768798828125, 11.0]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 8.0, 13.0, 25.0, 19.0, 25.0, 32.0, 56.0, 102.0, 110.0, 173.0, 245.0, 413.0, 606.0, 881.0, 1402.0, 2286.0, 3919.0, 6778.0, 12521.0, 24454.0, 50371.0, 114225.0, 259136.0, 303518.0, 141652.0, 62036.0, 29047.0, 14668.0, 8052.0, 4460.0, 2674.0, 1664.0, 986.0, 646.0, 443.0, 242.0, 174.0, 141.0, 102.0, 66.0, 58.0, 41.0, 21.0, 21.0, 9.0, 8.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.3916015625, -8.103515625, -7.8154296875, -7.52734375, -7.2392578125, -6.951171875, -6.6630859375, -6.375, -6.0869140625, -5.798828125, -5.5107421875, -5.22265625, -4.9345703125, -4.646484375, -4.3583984375, -4.0703125, -3.7822265625, -3.494140625, -3.2060546875, -2.91796875, -2.6298828125, -2.341796875, -2.0537109375, -1.765625, -1.4775390625, -1.189453125, -0.9013671875, -0.61328125, -0.3251953125, -0.037109375, 0.2509765625, 0.5390625, 0.8271484375, 1.115234375, 1.4033203125, 1.69140625, 1.9794921875, 2.267578125, 2.5556640625, 2.84375, 3.1318359375, 3.419921875, 3.7080078125, 3.99609375, 4.2841796875, 4.572265625, 4.8603515625, 5.1484375, 5.4365234375, 5.724609375, 6.0126953125, 6.30078125, 6.5888671875, 6.876953125, 7.1650390625, 7.453125, 7.7412109375, 8.029296875, 8.3173828125, 8.60546875, 8.8935546875, 9.181640625, 9.4697265625, 9.7578125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 10.0, 9.0, 18.0, 20.0, 24.0, 42.0, 79.0, 85.0, 151.0, 131.0, 106.0, 94.0, 69.0, 35.0, 30.0, 19.0, 15.0, 17.0, 12.0, 5.0, 5.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006551742553710938, -0.0006259679794311523, -0.0005967617034912109, -0.0005675554275512695, -0.0005383491516113281, -0.0005091428756713867, -0.0004799365997314453, -0.0004507303237915039, -0.0004215240478515625, -0.0003923177719116211, -0.0003631114959716797, -0.0003339052200317383, -0.0003046989440917969, -0.00027549266815185547, -0.00024628639221191406, -0.00021708011627197266, -0.00018787384033203125, -0.00015866756439208984, -0.00012946128845214844, -0.00010025501251220703, -7.104873657226562e-05, -4.184246063232422e-05, -1.2636184692382812e-05, 1.6570091247558594e-05, 4.57763671875e-05, 7.49826431274414e-05, 0.00010418891906738281, 0.00013339519500732422, 0.00016260147094726562, 0.00019180774688720703, 0.00022101402282714844, 0.00025022029876708984, 0.00027942657470703125, 0.00030863285064697266, 0.00033783912658691406, 0.00036704540252685547, 0.0003962516784667969, 0.0004254579544067383, 0.0004546642303466797, 0.0004838705062866211, 0.0005130767822265625, 0.0005422830581665039, 0.0005714893341064453, 0.0006006956100463867, 0.0006299018859863281, 0.0006591081619262695, 0.0006883144378662109, 0.0007175207138061523, 0.0007467269897460938, 0.0007759332656860352, 0.0008051395416259766, 0.000834345817565918, 0.0008635520935058594, 0.0008927583694458008, 0.0009219646453857422, 0.0009511709213256836, 0.000980377197265625, 0.0010095834732055664, 0.0010387897491455078, 0.0010679960250854492, 0.0010972023010253906, 0.001126408576965332, 0.0011556148529052734, 0.0011848211288452148, 0.0012140274047851562]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 15.0, 19.0, 26.0, 34.0, 56.0, 78.0, 114.0, 162.0, 213.0, 361.0, 478.0, 823.0, 1137.0, 1852.0, 2746.0, 4379.0, 7063.0, 11846.0, 20061.0, 33961.0, 59112.0, 101993.0, 164642.0, 206599.0, 171051.0, 107260.0, 62331.0, 36050.0, 21049.0, 12593.0, 7561.0, 4554.0, 2903.0, 1830.0, 1156.0, 796.0, 534.0, 359.0, 235.0, 176.0, 101.0, 85.0, 47.0, 44.0, 26.0, 13.0, 11.0, 4.0, 6.0, 1.0, 6.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4296875, -6.22589111328125, -6.0220947265625, -5.81829833984375, -5.614501953125, -5.41070556640625, -5.2069091796875, -5.00311279296875, -4.79931640625, -4.59552001953125, -4.3917236328125, -4.18792724609375, -3.984130859375, -3.78033447265625, -3.5765380859375, -3.37274169921875, -3.1689453125, -2.96514892578125, -2.7613525390625, -2.55755615234375, -2.353759765625, -2.14996337890625, -1.9461669921875, -1.74237060546875, -1.53857421875, -1.33477783203125, -1.1309814453125, -0.92718505859375, -0.723388671875, -0.51959228515625, -0.3157958984375, -0.11199951171875, 0.091796875, 0.29559326171875, 0.4993896484375, 0.70318603515625, 0.906982421875, 1.11077880859375, 1.3145751953125, 1.51837158203125, 1.72216796875, 1.92596435546875, 2.1297607421875, 2.33355712890625, 2.537353515625, 2.74114990234375, 2.9449462890625, 3.14874267578125, 3.3525390625, 3.55633544921875, 3.7601318359375, 3.96392822265625, 4.167724609375, 4.37152099609375, 4.5753173828125, 4.77911376953125, 4.98291015625, 5.18670654296875, 5.3905029296875, 5.59429931640625, 5.798095703125, 6.00189208984375, 6.2056884765625, 6.40948486328125, 6.61328125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 9.0, 9.0, 7.0, 6.0, 10.0, 19.0, 12.0, 14.0, 24.0, 34.0, 31.0, 35.0, 55.0, 60.0, 67.0, 50.0, 58.0, 77.0, 57.0, 50.0, 49.0, 39.0, 48.0, 32.0, 22.0, 25.0, 19.0, 6.0, 18.0, 12.0, 6.0, 7.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.443359375, -2.373291015625, -2.30322265625, -2.233154296875, -2.1630859375, -2.093017578125, -2.02294921875, -1.952880859375, -1.8828125, -1.812744140625, -1.74267578125, -1.672607421875, -1.6025390625, -1.532470703125, -1.46240234375, -1.392333984375, -1.322265625, -1.252197265625, -1.18212890625, -1.112060546875, -1.0419921875, -0.971923828125, -0.90185546875, -0.831787109375, -0.76171875, -0.691650390625, -0.62158203125, -0.551513671875, -0.4814453125, -0.411376953125, -0.34130859375, -0.271240234375, -0.201171875, -0.131103515625, -0.06103515625, 0.009033203125, 0.0791015625, 0.149169921875, 0.21923828125, 0.289306640625, 0.359375, 0.429443359375, 0.49951171875, 0.569580078125, 0.6396484375, 0.709716796875, 0.77978515625, 0.849853515625, 0.919921875, 0.989990234375, 1.06005859375, 1.130126953125, 1.2001953125, 1.270263671875, 1.34033203125, 1.410400390625, 1.48046875, 1.550537109375, 1.62060546875, 1.690673828125, 1.7607421875, 1.830810546875, 1.90087890625, 1.970947265625, 2.041015625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 14.0, 9.0, 10.0, 17.0, 20.0, 24.0, 29.0, 34.0, 43.0, 37.0, 57.0, 78.0, 82.0, 77.0, 62.0, 68.0, 67.0, 58.0, 41.0, 33.0, 35.0, 20.0, 21.0, 14.0, 14.0, 6.0, 4.0, 8.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.31219482421875, -30.474313735961914, -29.636432647705078, -28.798551559448242, -27.960670471191406, -27.122787475585938, -26.284908294677734, -25.447025299072266, -24.60914421081543, -23.771263122558594, -22.933382034301758, -22.095500946044922, -21.257619857788086, -20.41973876953125, -19.58185577392578, -18.743974685668945, -17.90609359741211, -17.068212509155273, -16.230331420898438, -15.392450332641602, -14.55456829071045, -13.716687202453613, -12.878806114196777, -12.040924072265625, -11.203044891357422, -10.365163803100586, -9.52728271484375, -8.689401626586914, -7.851519584655762, -7.013638496398926, -6.17575740814209, -5.337875843048096, -4.499994277954102, -3.6621129512786865, -2.8242316246032715, -1.9863505363464355, -1.1484692096710205, -0.31058788299560547, 0.5272932052612305, 1.3651747703552246, 2.2030558586120605, 3.0409371852874756, 3.8788185119628906, 4.716699600219727, 5.5545806884765625, 6.392462253570557, 7.230343341827393, 8.068224906921387, 8.906105995178223, 9.743987083435059, 10.581868171691895, 11.419750213623047, 12.257631301879883, 13.095512390136719, 13.933393478393555, 14.77127456665039, 15.609155654907227, 16.447036743164062, 17.2849178314209, 18.122798919677734, 18.96068000793457, 19.798561096191406, 20.636444091796875, 21.47432518005371, 22.312206268310547]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 10.0, 10.0, 6.0, 17.0, 21.0, 19.0, 19.0, 33.0, 35.0, 33.0, 29.0, 34.0, 43.0, 39.0, 38.0, 38.0, 32.0, 41.0, 45.0, 40.0, 38.0, 34.0, 41.0, 34.0, 31.0, 38.0, 24.0, 22.0, 26.0, 16.0, 16.0, 10.0, 10.0, 10.0, 12.0, 9.0, 8.0, 2.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-19.04004669189453, -18.49024772644043, -17.940448760986328, -17.390649795532227, -16.840850830078125, -16.291051864624023, -15.741252899169922, -15.19145393371582, -14.641654968261719, -14.091856002807617, -13.542057037353516, -12.992258071899414, -12.442459106445312, -11.892660140991211, -11.34286117553711, -10.793062210083008, -10.243263244628906, -9.693464279174805, -9.143665313720703, -8.593866348266602, -8.0440673828125, -7.494268417358398, -6.944469451904297, -6.394670486450195, -5.844871520996094, -5.295072555541992, -4.745273590087891, -4.195474624633789, -3.6456756591796875, -3.095876693725586, -2.5460777282714844, -1.9962787628173828, -1.4464797973632812, -0.8966808319091797, -0.3468818664550781, 0.20291709899902344, 0.752716064453125, 1.3025150299072266, 1.8523139953613281, 2.4021129608154297, 2.9519119262695312, 3.501710891723633, 4.051509857177734, 4.601308822631836, 5.1511077880859375, 5.700906753540039, 6.250705718994141, 6.800504684448242, 7.350303649902344, 7.900102615356445, 8.449901580810547, 8.999700546264648, 9.54949951171875, 10.099298477172852, 10.649097442626953, 11.198896408081055, 11.748695373535156, 12.298494338989258, 12.84829330444336, 13.398092269897461, 13.947891235351562, 14.497690200805664, 15.047489166259766, 15.597288131713867, 16.14708709716797]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 7.0, 19.0, 24.0, 24.0, 30.0, 50.0, 57.0, 114.0, 149.0, 216.0, 299.0, 407.0, 652.0, 978.0, 1435.0, 2196.0, 3322.0, 5129.0, 7661.0, 11773.0, 18715.0, 29101.0, 45634.0, 71640.0, 105930.0, 144135.0, 160938.0, 141295.0, 103211.0, 68965.0, 44404.0, 28644.0, 17820.0, 11575.0, 7467.0, 4962.0, 3189.0, 2072.0, 1387.0, 909.0, 610.0, 446.0, 313.0, 215.0, 144.0, 90.0, 63.0, 56.0, 27.0, 21.0, 12.0, 13.0, 1.0, 6.0, 3.0, 7.0, 0.0, 1.0], "bins": [-22.46875, -21.776611328125, -21.08447265625, -20.392333984375, -19.7001953125, -19.008056640625, -18.31591796875, -17.623779296875, -16.931640625, -16.239501953125, -15.54736328125, -14.855224609375, -14.1630859375, -13.470947265625, -12.77880859375, -12.086669921875, -11.39453125, -10.702392578125, -10.01025390625, -9.318115234375, -8.6259765625, -7.933837890625, -7.24169921875, -6.549560546875, -5.857421875, -5.165283203125, -4.47314453125, -3.781005859375, -3.0888671875, -2.396728515625, -1.70458984375, -1.012451171875, -0.3203125, 0.371826171875, 1.06396484375, 1.756103515625, 2.4482421875, 3.140380859375, 3.83251953125, 4.524658203125, 5.216796875, 5.908935546875, 6.60107421875, 7.293212890625, 7.9853515625, 8.677490234375, 9.36962890625, 10.061767578125, 10.75390625, 11.446044921875, 12.13818359375, 12.830322265625, 13.5224609375, 14.214599609375, 14.90673828125, 15.598876953125, 16.291015625, 16.983154296875, 17.67529296875, 18.367431640625, 19.0595703125, 19.751708984375, 20.44384765625, 21.135986328125, 21.828125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 8.0, 7.0, 12.0, 11.0, 10.0, 18.0, 22.0, 26.0, 33.0, 39.0, 32.0, 49.0, 43.0, 28.0, 52.0, 50.0, 38.0, 49.0, 43.0, 46.0, 40.0, 44.0, 41.0, 34.0, 42.0, 29.0, 19.0, 20.0, 20.0, 12.0, 14.0, 11.0, 11.0, 13.0, 5.0, 8.0, 5.0, 2.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.015625, -18.430419921875, -17.84521484375, -17.260009765625, -16.6748046875, -16.089599609375, -15.50439453125, -14.919189453125, -14.333984375, -13.748779296875, -13.16357421875, -12.578369140625, -11.9931640625, -11.407958984375, -10.82275390625, -10.237548828125, -9.65234375, -9.067138671875, -8.48193359375, -7.896728515625, -7.3115234375, -6.726318359375, -6.14111328125, -5.555908203125, -4.970703125, -4.385498046875, -3.80029296875, -3.215087890625, -2.6298828125, -2.044677734375, -1.45947265625, -0.874267578125, -0.2890625, 0.296142578125, 0.88134765625, 1.466552734375, 2.0517578125, 2.636962890625, 3.22216796875, 3.807373046875, 4.392578125, 4.977783203125, 5.56298828125, 6.148193359375, 6.7333984375, 7.318603515625, 7.90380859375, 8.489013671875, 9.07421875, 9.659423828125, 10.24462890625, 10.829833984375, 11.4150390625, 12.000244140625, 12.58544921875, 13.170654296875, 13.755859375, 14.341064453125, 14.92626953125, 15.511474609375, 16.0966796875, 16.681884765625, 17.26708984375, 17.852294921875, 18.4375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 16.0, 28.0, 37.0, 57.0, 87.0, 122.0, 182.0, 276.0, 403.0, 651.0, 1071.0, 1687.0, 2801.0, 4524.0, 7607.0, 13049.0, 22323.0, 37500.0, 63435.0, 102307.0, 150740.0, 181062.0, 162660.0, 115452.0, 72844.0, 43708.0, 25903.0, 15196.0, 9097.0, 5212.0, 3212.0, 1952.0, 1137.0, 777.0, 480.0, 305.0, 224.0, 130.0, 98.0, 65.0, 41.0, 25.0, 22.0, 12.0, 10.0, 5.0, 1.0, 5.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.71875, -20.06396484375, -19.4091796875, -18.75439453125, -18.099609375, -17.44482421875, -16.7900390625, -16.13525390625, -15.48046875, -14.82568359375, -14.1708984375, -13.51611328125, -12.861328125, -12.20654296875, -11.5517578125, -10.89697265625, -10.2421875, -9.58740234375, -8.9326171875, -8.27783203125, -7.623046875, -6.96826171875, -6.3134765625, -5.65869140625, -5.00390625, -4.34912109375, -3.6943359375, -3.03955078125, -2.384765625, -1.72998046875, -1.0751953125, -0.42041015625, 0.234375, 0.88916015625, 1.5439453125, 2.19873046875, 2.853515625, 3.50830078125, 4.1630859375, 4.81787109375, 5.47265625, 6.12744140625, 6.7822265625, 7.43701171875, 8.091796875, 8.74658203125, 9.4013671875, 10.05615234375, 10.7109375, 11.36572265625, 12.0205078125, 12.67529296875, 13.330078125, 13.98486328125, 14.6396484375, 15.29443359375, 15.94921875, 16.60400390625, 17.2587890625, 17.91357421875, 18.568359375, 19.22314453125, 19.8779296875, 20.53271484375, 21.1875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 12.0, 8.0, 5.0, 15.0, 11.0, 19.0, 28.0, 25.0, 30.0, 32.0, 28.0, 33.0, 42.0, 27.0, 48.0, 32.0, 44.0, 44.0, 44.0, 33.0, 43.0, 41.0, 38.0, 37.0, 42.0, 28.0, 28.0, 25.0, 13.0, 28.0, 12.0, 21.0, 12.0, 12.0, 11.0, 11.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.90625, -9.587890625, -9.26953125, -8.951171875, -8.6328125, -8.314453125, -7.99609375, -7.677734375, -7.359375, -7.041015625, -6.72265625, -6.404296875, -6.0859375, -5.767578125, -5.44921875, -5.130859375, -4.8125, -4.494140625, -4.17578125, -3.857421875, -3.5390625, -3.220703125, -2.90234375, -2.583984375, -2.265625, -1.947265625, -1.62890625, -1.310546875, -0.9921875, -0.673828125, -0.35546875, -0.037109375, 0.28125, 0.599609375, 0.91796875, 1.236328125, 1.5546875, 1.873046875, 2.19140625, 2.509765625, 2.828125, 3.146484375, 3.46484375, 3.783203125, 4.1015625, 4.419921875, 4.73828125, 5.056640625, 5.375, 5.693359375, 6.01171875, 6.330078125, 6.6484375, 6.966796875, 7.28515625, 7.603515625, 7.921875, 8.240234375, 8.55859375, 8.876953125, 9.1953125, 9.513671875, 9.83203125, 10.150390625, 10.46875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 9.0, 11.0, 24.0, 41.0, 48.0, 82.0, 107.0, 165.0, 267.0, 408.0, 608.0, 1001.0, 1475.0, 2485.0, 3898.0, 6459.0, 10733.0, 18947.0, 33194.0, 59089.0, 102710.0, 161691.0, 202082.0, 172867.0, 114166.0, 66848.0, 37428.0, 20968.0, 11834.0, 7078.0, 4367.0, 2764.0, 1644.0, 1090.0, 664.0, 437.0, 283.0, 210.0, 123.0, 95.0, 46.0, 36.0, 29.0, 19.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.3857421875, -11.013671875, -10.6416015625, -10.26953125, -9.8974609375, -9.525390625, -9.1533203125, -8.78125, -8.4091796875, -8.037109375, -7.6650390625, -7.29296875, -6.9208984375, -6.548828125, -6.1767578125, -5.8046875, -5.4326171875, -5.060546875, -4.6884765625, -4.31640625, -3.9443359375, -3.572265625, -3.2001953125, -2.828125, -2.4560546875, -2.083984375, -1.7119140625, -1.33984375, -0.9677734375, -0.595703125, -0.2236328125, 0.1484375, 0.5205078125, 0.892578125, 1.2646484375, 1.63671875, 2.0087890625, 2.380859375, 2.7529296875, 3.125, 3.4970703125, 3.869140625, 4.2412109375, 4.61328125, 4.9853515625, 5.357421875, 5.7294921875, 6.1015625, 6.4736328125, 6.845703125, 7.2177734375, 7.58984375, 7.9619140625, 8.333984375, 8.7060546875, 9.078125, 9.4501953125, 9.822265625, 10.1943359375, 10.56640625, 10.9384765625, 11.310546875, 11.6826171875, 12.0546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 8.0, 10.0, 16.0, 13.0, 26.0, 18.0, 39.0, 46.0, 52.0, 74.0, 80.0, 89.0, 93.0, 71.0, 83.0, 64.0, 57.0, 38.0, 32.0, 29.0, 25.0, 12.0, 6.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0019311904907226562, -0.0018766522407531738, -0.0018221139907836914, -0.001767575740814209, -0.0017130374908447266, -0.0016584992408752441, -0.0016039609909057617, -0.0015494227409362793, -0.0014948844909667969, -0.0014403462409973145, -0.001385807991027832, -0.0013312697410583496, -0.0012767314910888672, -0.0012221932411193848, -0.0011676549911499023, -0.00111311674118042, -0.0010585784912109375, -0.001004040241241455, -0.0009495019912719727, -0.0008949637413024902, -0.0008404254913330078, -0.0007858872413635254, -0.000731348991394043, -0.0006768107414245605, -0.0006222724914550781, -0.0005677342414855957, -0.0005131959915161133, -0.00045865774154663086, -0.00040411949157714844, -0.000349581241607666, -0.0002950429916381836, -0.00024050474166870117, -0.00018596649169921875, -0.00013142824172973633, -7.68899917602539e-05, -2.2351741790771484e-05, 3.218650817871094e-05, 8.672475814819336e-05, 0.00014126300811767578, 0.0001958012580871582, 0.0002503395080566406, 0.00030487775802612305, 0.00035941600799560547, 0.0004139542579650879, 0.0004684925079345703, 0.0005230307579040527, 0.0005775690078735352, 0.0006321072578430176, 0.0006866455078125, 0.0007411837577819824, 0.0007957220077514648, 0.0008502602577209473, 0.0009047985076904297, 0.0009593367576599121, 0.0010138750076293945, 0.001068413257598877, 0.0011229515075683594, 0.0011774897575378418, 0.0012320280075073242, 0.0012865662574768066, 0.001341104507446289, 0.0013956427574157715, 0.001450181007385254, 0.0015047192573547363, 0.0015592575073242188]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 10.0, 9.0, 9.0, 18.0, 27.0, 42.0, 65.0, 77.0, 137.0, 201.0, 295.0, 435.0, 645.0, 1036.0, 1506.0, 2400.0, 3754.0, 5830.0, 9492.0, 15142.0, 24695.0, 40865.0, 66320.0, 104411.0, 149860.0, 172866.0, 154493.0, 110623.0, 70318.0, 43157.0, 26446.0, 15993.0, 10050.0, 6215.0, 3997.0, 2434.0, 1615.0, 1009.0, 679.0, 447.0, 307.0, 214.0, 132.0, 86.0, 63.0, 39.0, 31.0, 26.0, 19.0, 8.0, 9.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.1953125, -9.8822021484375, -9.569091796875, -9.2559814453125, -8.94287109375, -8.6297607421875, -8.316650390625, -8.0035400390625, -7.6904296875, -7.3773193359375, -7.064208984375, -6.7510986328125, -6.43798828125, -6.1248779296875, -5.811767578125, -5.4986572265625, -5.185546875, -4.8724365234375, -4.559326171875, -4.2462158203125, -3.93310546875, -3.6199951171875, -3.306884765625, -2.9937744140625, -2.6806640625, -2.3675537109375, -2.054443359375, -1.7413330078125, -1.42822265625, -1.1151123046875, -0.802001953125, -0.4888916015625, -0.17578125, 0.1373291015625, 0.450439453125, 0.7635498046875, 1.07666015625, 1.3897705078125, 1.702880859375, 2.0159912109375, 2.3291015625, 2.6422119140625, 2.955322265625, 3.2684326171875, 3.58154296875, 3.8946533203125, 4.207763671875, 4.5208740234375, 4.833984375, 5.1470947265625, 5.460205078125, 5.7733154296875, 6.08642578125, 6.3995361328125, 6.712646484375, 7.0257568359375, 7.3388671875, 7.6519775390625, 7.965087890625, 8.2781982421875, 8.59130859375, 8.9044189453125, 9.217529296875, 9.5306396484375, 9.84375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 5.0, 4.0, 3.0, 18.0, 19.0, 24.0, 20.0, 33.0, 34.0, 34.0, 70.0, 51.0, 76.0, 77.0, 66.0, 65.0, 67.0, 57.0, 55.0, 38.0, 43.0, 26.0, 23.0, 18.0, 12.0, 14.0, 12.0, 6.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9765625, -4.82794189453125, -4.6793212890625, -4.53070068359375, -4.382080078125, -4.23345947265625, -4.0848388671875, -3.93621826171875, -3.78759765625, -3.63897705078125, -3.4903564453125, -3.34173583984375, -3.193115234375, -3.04449462890625, -2.8958740234375, -2.74725341796875, -2.5986328125, -2.45001220703125, -2.3013916015625, -2.15277099609375, -2.004150390625, -1.85552978515625, -1.7069091796875, -1.55828857421875, -1.40966796875, -1.26104736328125, -1.1124267578125, -0.96380615234375, -0.815185546875, -0.66656494140625, -0.5179443359375, -0.36932373046875, -0.220703125, -0.07208251953125, 0.0765380859375, 0.22515869140625, 0.373779296875, 0.52239990234375, 0.6710205078125, 0.81964111328125, 0.96826171875, 1.11688232421875, 1.2655029296875, 1.41412353515625, 1.562744140625, 1.71136474609375, 1.8599853515625, 2.00860595703125, 2.1572265625, 2.30584716796875, 2.4544677734375, 2.60308837890625, 2.751708984375, 2.90032958984375, 3.0489501953125, 3.19757080078125, 3.34619140625, 3.49481201171875, 3.6434326171875, 3.79205322265625, 3.940673828125, 4.08929443359375, 4.2379150390625, 4.38653564453125, 4.53515625]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 5.0, 9.0, 13.0, 13.0, 10.0, 27.0, 29.0, 34.0, 34.0, 38.0, 58.0, 53.0, 58.0, 61.0, 66.0, 63.0, 63.0, 53.0, 37.0, 46.0, 51.0, 30.0, 25.0, 18.0, 15.0, 11.0, 17.0, 14.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40544891357422, -21.735342025756836, -21.065237045288086, -20.395130157470703, -19.72502326965332, -19.054916381835938, -18.384811401367188, -17.714704513549805, -17.044597625732422, -16.37449073791504, -15.704384803771973, -15.034278869628906, -14.364171981811523, -13.694066047668457, -13.02396011352539, -12.353853225708008, -11.683747291564941, -11.013641357421875, -10.343534469604492, -9.673428535461426, -9.003321647644043, -8.333215713500977, -7.663109302520752, -6.993002891540527, -6.322896480560303, -5.652790069580078, -4.9826836585998535, -4.312577247619629, -3.6424710750579834, -2.972364664077759, -2.3022584915161133, -1.6321520805358887, -0.9620456695556641, -0.29193931818008423, 0.3781670331954956, 1.0482733249664307, 1.7183797359466553, 2.38848614692688, 3.0585923194885254, 3.72869873046875, 4.398805141448975, 5.068911552429199, 5.739017963409424, 6.409124374389648, 7.079230308532715, 7.749337196350098, 8.419443130493164, 9.089550018310547, 9.759655952453613, 10.42976188659668, 11.099868774414062, 11.769974708557129, 12.440081596374512, 13.110187530517578, 13.780294418334961, 14.450400352478027, 15.120506286621094, 15.79061222076416, 16.460718154907227, 17.13082504272461, 17.800931930541992, 18.471038818359375, 19.141143798828125, 19.811250686645508, 20.48135757446289]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 7.0, 5.0, 8.0, 5.0, 14.0, 16.0, 16.0, 23.0, 35.0, 35.0, 38.0, 36.0, 41.0, 46.0, 37.0, 48.0, 45.0, 52.0, 52.0, 46.0, 39.0, 48.0, 49.0, 32.0, 33.0, 31.0, 28.0, 24.0, 20.0, 11.0, 20.0, 13.0, 8.0, 7.0, 9.0, 4.0, 7.0, 5.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.724685668945312, -19.14139747619629, -18.558109283447266, -17.97481918334961, -17.391530990600586, -16.808242797851562, -16.22495460510254, -15.641666412353516, -15.058377265930176, -14.475089073181152, -13.891799926757812, -13.308511734008789, -12.725223541259766, -12.141934394836426, -11.558646202087402, -10.975357055664062, -10.392068862915039, -9.808780670166016, -9.225491523742676, -8.642203330993652, -8.058914184570312, -7.475625991821289, -6.892337799072266, -6.309049129486084, -5.725760459899902, -5.142471790313721, -4.559183120727539, -3.9758949279785156, -3.392606258392334, -2.8093175888061523, -2.22602915763855, -1.6427407264709473, -1.0594520568847656, -0.47616350650787354, 0.10712504386901855, 0.6904135942459106, 1.2737021446228027, 1.8569908142089844, 2.440279245376587, 3.0235676765441895, 3.606856346130371, 4.190145015716553, 4.773433685302734, 5.356721878051758, 5.9400105476379395, 6.523299217224121, 7.1065874099731445, 7.689876079559326, 8.273164749145508, 8.856452941894531, 9.439742088317871, 10.023030281066895, 10.606319427490234, 11.189607620239258, 11.772895812988281, 12.356184005737305, 12.939473152160645, 13.522761344909668, 14.106050491333008, 14.689338684082031, 15.272626876831055, 15.855916023254395, 16.439205169677734, 17.022493362426758, 17.60578155517578]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 6.0, 6.0, 11.0, 18.0, 33.0, 40.0, 59.0, 94.0, 159.0, 243.0, 394.0, 588.0, 909.0, 1346.0, 2140.0, 3396.0, 5352.0, 8612.0, 14132.0, 23755.0, 42142.0, 78269.0, 158158.0, 347349.0, 743516.0, 1122446.0, 847643.0, 404780.0, 182341.0, 89386.0, 47133.0, 26602.0, 16160.0, 9643.0, 6051.0, 3905.0, 2535.0, 1701.0, 1073.0, 726.0, 469.0, 337.0, 211.0, 140.0, 95.0, 51.0, 49.0, 37.0, 15.0, 7.0, 6.0, 12.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.8125, -18.217041015625, -17.62158203125, -17.026123046875, -16.4306640625, -15.835205078125, -15.23974609375, -14.644287109375, -14.048828125, -13.453369140625, -12.85791015625, -12.262451171875, -11.6669921875, -11.071533203125, -10.47607421875, -9.880615234375, -9.28515625, -8.689697265625, -8.09423828125, -7.498779296875, -6.9033203125, -6.307861328125, -5.71240234375, -5.116943359375, -4.521484375, -3.926025390625, -3.33056640625, -2.735107421875, -2.1396484375, -1.544189453125, -0.94873046875, -0.353271484375, 0.2421875, 0.837646484375, 1.43310546875, 2.028564453125, 2.6240234375, 3.219482421875, 3.81494140625, 4.410400390625, 5.005859375, 5.601318359375, 6.19677734375, 6.792236328125, 7.3876953125, 7.983154296875, 8.57861328125, 9.174072265625, 9.76953125, 10.364990234375, 10.96044921875, 11.555908203125, 12.1513671875, 12.746826171875, 13.34228515625, 13.937744140625, 14.533203125, 15.128662109375, 15.72412109375, 16.319580078125, 16.9150390625, 17.510498046875, 18.10595703125, 18.701416015625, 19.296875]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 9.0, 6.0, 10.0, 10.0, 15.0, 15.0, 14.0, 21.0, 24.0, 29.0, 24.0, 38.0, 57.0, 48.0, 36.0, 34.0, 52.0, 53.0, 44.0, 31.0, 44.0, 43.0, 48.0, 47.0, 36.0, 32.0, 36.0, 18.0, 27.0, 15.0, 13.0, 13.0, 16.0, 11.0, 5.0, 5.0, 6.0, 3.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.9765625, -12.5977783203125, -12.218994140625, -11.8402099609375, -11.46142578125, -11.0826416015625, -10.703857421875, -10.3250732421875, -9.9462890625, -9.5675048828125, -9.188720703125, -8.8099365234375, -8.43115234375, -8.0523681640625, -7.673583984375, -7.2947998046875, -6.916015625, -6.5372314453125, -6.158447265625, -5.7796630859375, -5.40087890625, -5.0220947265625, -4.643310546875, -4.2645263671875, -3.8857421875, -3.5069580078125, -3.128173828125, -2.7493896484375, -2.37060546875, -1.9918212890625, -1.613037109375, -1.2342529296875, -0.85546875, -0.4766845703125, -0.097900390625, 0.2808837890625, 0.65966796875, 1.0384521484375, 1.417236328125, 1.7960205078125, 2.1748046875, 2.5535888671875, 2.932373046875, 3.3111572265625, 3.68994140625, 4.0687255859375, 4.447509765625, 4.8262939453125, 5.205078125, 5.5838623046875, 5.962646484375, 6.3414306640625, 6.72021484375, 7.0989990234375, 7.477783203125, 7.8565673828125, 8.2353515625, 8.6141357421875, 8.992919921875, 9.3717041015625, 9.75048828125, 10.1292724609375, 10.508056640625, 10.8868408203125, 11.265625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 7.0, 9.0, 13.0, 26.0, 34.0, 56.0, 75.0, 112.0, 176.0, 234.0, 341.0, 646.0, 1087.0, 1762.0, 3138.0, 5444.0, 10057.0, 19801.0, 40228.0, 86528.0, 197452.0, 470914.0, 1030642.0, 1210334.0, 629962.0, 266463.0, 114236.0, 51497.0, 24489.0, 12694.0, 6688.0, 3691.0, 2197.0, 1211.0, 759.0, 465.0, 265.0, 180.0, 125.0, 85.0, 49.0, 33.0, 26.0, 21.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-25.21875, -24.480712890625, -23.74267578125, -23.004638671875, -22.2666015625, -21.528564453125, -20.79052734375, -20.052490234375, -19.314453125, -18.576416015625, -17.83837890625, -17.100341796875, -16.3623046875, -15.624267578125, -14.88623046875, -14.148193359375, -13.41015625, -12.672119140625, -11.93408203125, -11.196044921875, -10.4580078125, -9.719970703125, -8.98193359375, -8.243896484375, -7.505859375, -6.767822265625, -6.02978515625, -5.291748046875, -4.5537109375, -3.815673828125, -3.07763671875, -2.339599609375, -1.6015625, -0.863525390625, -0.12548828125, 0.612548828125, 1.3505859375, 2.088623046875, 2.82666015625, 3.564697265625, 4.302734375, 5.040771484375, 5.77880859375, 6.516845703125, 7.2548828125, 7.992919921875, 8.73095703125, 9.468994140625, 10.20703125, 10.945068359375, 11.68310546875, 12.421142578125, 13.1591796875, 13.897216796875, 14.63525390625, 15.373291015625, 16.111328125, 16.849365234375, 17.58740234375, 18.325439453125, 19.0634765625, 19.801513671875, 20.53955078125, 21.277587890625, 22.015625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 3.0, 7.0, 7.0, 5.0, 8.0, 16.0, 17.0, 24.0, 20.0, 32.0, 51.0, 63.0, 76.0, 113.0, 135.0, 189.0, 216.0, 252.0, 291.0, 316.0, 362.0, 352.0, 289.0, 265.0, 217.0, 176.0, 150.0, 99.0, 94.0, 72.0, 49.0, 35.0, 23.0, 24.0, 8.0, 8.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.9296875, -8.69171142578125, -8.4537353515625, -8.21575927734375, -7.977783203125, -7.73980712890625, -7.5018310546875, -7.26385498046875, -7.02587890625, -6.78790283203125, -6.5499267578125, -6.31195068359375, -6.073974609375, -5.83599853515625, -5.5980224609375, -5.36004638671875, -5.1220703125, -4.88409423828125, -4.6461181640625, -4.40814208984375, -4.170166015625, -3.93218994140625, -3.6942138671875, -3.45623779296875, -3.21826171875, -2.98028564453125, -2.7423095703125, -2.50433349609375, -2.266357421875, -2.02838134765625, -1.7904052734375, -1.55242919921875, -1.314453125, -1.07647705078125, -0.8385009765625, -0.60052490234375, -0.362548828125, -0.12457275390625, 0.1134033203125, 0.35137939453125, 0.58935546875, 0.82733154296875, 1.0653076171875, 1.30328369140625, 1.541259765625, 1.77923583984375, 2.0172119140625, 2.25518798828125, 2.4931640625, 2.73114013671875, 2.9691162109375, 3.20709228515625, 3.445068359375, 3.68304443359375, 3.9210205078125, 4.15899658203125, 4.39697265625, 4.63494873046875, 4.8729248046875, 5.11090087890625, 5.348876953125, 5.58685302734375, 5.8248291015625, 6.06280517578125, 6.30078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 9.0, 3.0, 11.0, 3.0, 11.0, 12.0, 18.0, 17.0, 19.0, 36.0, 41.0, 54.0, 63.0, 66.0, 65.0, 69.0, 67.0, 68.0, 53.0, 59.0, 53.0, 43.0, 36.0, 32.0, 23.0, 18.0, 12.0, 9.0, 5.0, 8.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.6554012298584, -23.96820831298828, -23.281017303466797, -22.593826293945312, -21.906633377075195, -21.219440460205078, -20.532249450683594, -19.84505844116211, -19.157865524291992, -18.470672607421875, -17.78348159790039, -17.096290588378906, -16.40909767150879, -15.721905708312988, -15.034713745117188, -14.347521781921387, -13.660329818725586, -12.973137855529785, -12.285945892333984, -11.598753929138184, -10.911561965942383, -10.224370002746582, -9.537178039550781, -8.84998607635498, -8.16279411315918, -7.475602149963379, -6.788410186767578, -6.101218223571777, -5.414026260375977, -4.726834297180176, -4.039642333984375, -3.352450370788574, -2.6652603149414062, -1.9780683517456055, -1.2908763885498047, -0.6036844253540039, 0.08350753784179688, 0.7706995010375977, 1.4578914642333984, 2.145083427429199, 2.832275390625, 3.519467353820801, 4.206659317016602, 4.893851280212402, 5.581043243408203, 6.268235206604004, 6.955427169799805, 7.6426191329956055, 8.329811096191406, 9.017003059387207, 9.704195022583008, 10.391386985778809, 11.07857894897461, 11.76577091217041, 12.452962875366211, 13.140154838562012, 13.827346801757812, 14.514538764953613, 15.201730728149414, 15.888922691345215, 16.576114654541016, 17.2633056640625, 17.950498580932617, 18.637691497802734, 19.32488250732422]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 8.0, 8.0, 14.0, 11.0, 21.0, 13.0, 30.0, 24.0, 30.0, 27.0, 33.0, 33.0, 35.0, 34.0, 37.0, 41.0, 22.0, 37.0, 39.0, 45.0, 42.0, 51.0, 31.0, 31.0, 38.0, 26.0, 36.0, 19.0, 15.0, 20.0, 18.0, 15.0, 17.0, 14.0, 8.0, 13.0, 7.0, 10.0, 4.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.058521270751953, -13.622529983520508, -13.186539649963379, -12.750548362731934, -12.314558029174805, -11.87856674194336, -11.442575454711914, -11.006584167480469, -10.57059383392334, -10.134602546691895, -9.698612213134766, -9.26262092590332, -8.826629638671875, -8.390639305114746, -7.954648017883301, -7.518657207489014, -7.082666397094727, -6.6466755867004395, -6.210684776306152, -5.774693489074707, -5.33870267868042, -4.902711868286133, -4.4667205810546875, -4.0307297706604, -3.5947389602661133, -3.158748149871826, -2.72275710105896, -2.2867660522460938, -1.8507752418518066, -1.4147844314575195, -0.9787933826446533, -0.5428023338317871, -0.1068124771118164, 0.32917845249176025, 0.7651693820953369, 1.2011603116989136, 1.6371512413024902, 2.0731420516967773, 2.5091331005096436, 2.9451241493225098, 3.381114959716797, 3.817105770111084, 4.253096580505371, 4.689087867736816, 5.1250786781311035, 5.561069488525391, 5.997060775756836, 6.433051586151123, 6.86904239654541, 7.305033206939697, 7.741024017333984, 8.17701530456543, 8.613006591796875, 9.048996925354004, 9.48498821258545, 9.920978546142578, 10.356969833374023, 10.792961120605469, 11.228951454162598, 11.664942741394043, 12.100933074951172, 12.536924362182617, 12.972915649414062, 13.408906936645508, 13.844897270202637]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 10.0, 6.0, 16.0, 23.0, 35.0, 49.0, 81.0, 127.0, 204.0, 339.0, 587.0, 825.0, 1495.0, 2558.0, 4520.0, 7584.0, 14333.0, 26688.0, 52698.0, 104643.0, 190646.0, 247384.0, 185086.0, 100653.0, 50492.0, 25778.0, 13604.0, 7540.0, 4315.0, 2440.0, 1437.0, 915.0, 519.0, 355.0, 230.0, 113.0, 95.0, 47.0, 33.0, 23.0, 11.0, 11.0, 9.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-16.15625, -15.7132568359375, -15.270263671875, -14.8272705078125, -14.38427734375, -13.9412841796875, -13.498291015625, -13.0552978515625, -12.6123046875, -12.1693115234375, -11.726318359375, -11.2833251953125, -10.84033203125, -10.3973388671875, -9.954345703125, -9.5113525390625, -9.068359375, -8.6253662109375, -8.182373046875, -7.7393798828125, -7.29638671875, -6.8533935546875, -6.410400390625, -5.9674072265625, -5.5244140625, -5.0814208984375, -4.638427734375, -4.1954345703125, -3.75244140625, -3.3094482421875, -2.866455078125, -2.4234619140625, -1.98046875, -1.5374755859375, -1.094482421875, -0.6514892578125, -0.20849609375, 0.2344970703125, 0.677490234375, 1.1204833984375, 1.5634765625, 2.0064697265625, 2.449462890625, 2.8924560546875, 3.33544921875, 3.7784423828125, 4.221435546875, 4.6644287109375, 5.107421875, 5.5504150390625, 5.993408203125, 6.4364013671875, 6.87939453125, 7.3223876953125, 7.765380859375, 8.2083740234375, 8.6513671875, 9.0943603515625, 9.537353515625, 9.9803466796875, 10.42333984375, 10.8663330078125, 11.309326171875, 11.7523193359375, 12.1953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 5.0, 2.0, 7.0, 10.0, 13.0, 13.0, 17.0, 21.0, 19.0, 36.0, 27.0, 26.0, 34.0, 36.0, 37.0, 36.0, 33.0, 34.0, 46.0, 40.0, 35.0, 46.0, 51.0, 34.0, 36.0, 36.0, 32.0, 30.0, 36.0, 17.0, 19.0, 16.0, 11.0, 19.0, 14.0, 14.0, 12.0, 9.0, 9.0, 7.0, 3.0, 1.0, 1.0, 9.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.7578125, -14.2823486328125, -13.806884765625, -13.3314208984375, -12.85595703125, -12.3804931640625, -11.905029296875, -11.4295654296875, -10.9541015625, -10.4786376953125, -10.003173828125, -9.5277099609375, -9.05224609375, -8.5767822265625, -8.101318359375, -7.6258544921875, -7.150390625, -6.6749267578125, -6.199462890625, -5.7239990234375, -5.24853515625, -4.7730712890625, -4.297607421875, -3.8221435546875, -3.3466796875, -2.8712158203125, -2.395751953125, -1.9202880859375, -1.44482421875, -0.9693603515625, -0.493896484375, -0.0184326171875, 0.45703125, 0.9324951171875, 1.407958984375, 1.8834228515625, 2.35888671875, 2.8343505859375, 3.309814453125, 3.7852783203125, 4.2607421875, 4.7362060546875, 5.211669921875, 5.6871337890625, 6.16259765625, 6.6380615234375, 7.113525390625, 7.5889892578125, 8.064453125, 8.5399169921875, 9.015380859375, 9.4908447265625, 9.96630859375, 10.4417724609375, 10.917236328125, 11.3927001953125, 11.8681640625, 12.3436279296875, 12.819091796875, 13.2945556640625, 13.77001953125, 14.2454833984375, 14.720947265625, 15.1964111328125, 15.671875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 15.0, 11.0, 15.0, 26.0, 27.0, 35.0, 38.0, 71.0, 99.0, 123.0, 210.0, 339.0, 541.0, 828.0, 1374.0, 2215.0, 3796.0, 6884.0, 14047.0, 30600.0, 73998.0, 186090.0, 344090.0, 222220.0, 89602.0, 36524.0, 16248.0, 7875.0, 4122.0, 2400.0, 1442.0, 910.0, 597.0, 351.0, 253.0, 150.0, 106.0, 71.0, 53.0, 38.0, 17.0, 30.0, 20.0, 12.0, 6.0, 11.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.580322265625, -17.97314453125, -17.365966796875, -16.7587890625, -16.151611328125, -15.54443359375, -14.937255859375, -14.330078125, -13.722900390625, -13.11572265625, -12.508544921875, -11.9013671875, -11.294189453125, -10.68701171875, -10.079833984375, -9.47265625, -8.865478515625, -8.25830078125, -7.651123046875, -7.0439453125, -6.436767578125, -5.82958984375, -5.222412109375, -4.615234375, -4.008056640625, -3.40087890625, -2.793701171875, -2.1865234375, -1.579345703125, -0.97216796875, -0.364990234375, 0.2421875, 0.849365234375, 1.45654296875, 2.063720703125, 2.6708984375, 3.278076171875, 3.88525390625, 4.492431640625, 5.099609375, 5.706787109375, 6.31396484375, 6.921142578125, 7.5283203125, 8.135498046875, 8.74267578125, 9.349853515625, 9.95703125, 10.564208984375, 11.17138671875, 11.778564453125, 12.3857421875, 12.992919921875, 13.60009765625, 14.207275390625, 14.814453125, 15.421630859375, 16.02880859375, 16.635986328125, 17.2431640625, 17.850341796875, 18.45751953125, 19.064697265625, 19.671875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 8.0, 3.0, 7.0, 2.0, 8.0, 12.0, 12.0, 19.0, 20.0, 22.0, 24.0, 28.0, 35.0, 29.0, 28.0, 25.0, 28.0, 24.0, 46.0, 46.0, 56.0, 43.0, 38.0, 41.0, 42.0, 34.0, 40.0, 31.0, 28.0, 32.0, 20.0, 22.0, 19.0, 30.0, 15.0, 13.0, 15.0, 6.0, 8.0, 5.0, 7.0, 5.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.296875, -8.03662109375, -7.7763671875, -7.51611328125, -7.255859375, -6.99560546875, -6.7353515625, -6.47509765625, -6.21484375, -5.95458984375, -5.6943359375, -5.43408203125, -5.173828125, -4.91357421875, -4.6533203125, -4.39306640625, -4.1328125, -3.87255859375, -3.6123046875, -3.35205078125, -3.091796875, -2.83154296875, -2.5712890625, -2.31103515625, -2.05078125, -1.79052734375, -1.5302734375, -1.27001953125, -1.009765625, -0.74951171875, -0.4892578125, -0.22900390625, 0.03125, 0.29150390625, 0.5517578125, 0.81201171875, 1.072265625, 1.33251953125, 1.5927734375, 1.85302734375, 2.11328125, 2.37353515625, 2.6337890625, 2.89404296875, 3.154296875, 3.41455078125, 3.6748046875, 3.93505859375, 4.1953125, 4.45556640625, 4.7158203125, 4.97607421875, 5.236328125, 5.49658203125, 5.7568359375, 6.01708984375, 6.27734375, 6.53759765625, 6.7978515625, 7.05810546875, 7.318359375, 7.57861328125, 7.8388671875, 8.09912109375, 8.359375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 9.0, 11.0, 11.0, 13.0, 22.0, 31.0, 33.0, 82.0, 111.0, 177.0, 256.0, 369.0, 608.0, 868.0, 1471.0, 2578.0, 4161.0, 7060.0, 12674.0, 23010.0, 43531.0, 86027.0, 171233.0, 273485.0, 202614.0, 103694.0, 52188.0, 27026.0, 14573.0, 8278.0, 4727.0, 2832.0, 1744.0, 1118.0, 676.0, 446.0, 273.0, 178.0, 119.0, 64.0, 65.0, 31.0, 30.0, 10.0, 16.0, 11.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.4375, -5.2708740234375, -5.104248046875, -4.9376220703125, -4.77099609375, -4.6043701171875, -4.437744140625, -4.2711181640625, -4.1044921875, -3.9378662109375, -3.771240234375, -3.6046142578125, -3.43798828125, -3.2713623046875, -3.104736328125, -2.9381103515625, -2.771484375, -2.6048583984375, -2.438232421875, -2.2716064453125, -2.10498046875, -1.9383544921875, -1.771728515625, -1.6051025390625, -1.4384765625, -1.2718505859375, -1.105224609375, -0.9385986328125, -0.77197265625, -0.6053466796875, -0.438720703125, -0.2720947265625, -0.10546875, 0.0611572265625, 0.227783203125, 0.3944091796875, 0.56103515625, 0.7276611328125, 0.894287109375, 1.0609130859375, 1.2275390625, 1.3941650390625, 1.560791015625, 1.7274169921875, 1.89404296875, 2.0606689453125, 2.227294921875, 2.3939208984375, 2.560546875, 2.7271728515625, 2.893798828125, 3.0604248046875, 3.22705078125, 3.3936767578125, 3.560302734375, 3.7269287109375, 3.8935546875, 4.0601806640625, 4.226806640625, 4.3934326171875, 4.56005859375, 4.7266845703125, 4.893310546875, 5.0599365234375, 5.2265625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 12.0, 6.0, 13.0, 11.0, 10.0, 18.0, 26.0, 30.0, 26.0, 48.0, 46.0, 40.0, 46.0, 54.0, 71.0, 65.0, 57.0, 72.0, 48.0, 52.0, 36.0, 38.0, 30.0, 25.0, 21.0, 16.0, 14.0, 16.0, 7.0, 10.0, 4.0, 5.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00027680397033691406, -0.0002676956355571747, -0.0002585873007774353, -0.0002494789659976959, -0.00024037063121795654, -0.00023126229643821716, -0.00022215396165847778, -0.0002130456268787384, -0.00020393729209899902, -0.00019482895731925964, -0.00018572062253952026, -0.00017661228775978088, -0.0001675039529800415, -0.00015839561820030212, -0.00014928728342056274, -0.00014017894864082336, -0.00013107061386108398, -0.0001219622790813446, -0.00011285394430160522, -0.00010374560952186584, -9.463727474212646e-05, -8.552893996238708e-05, -7.64206051826477e-05, -6.731227040290833e-05, -5.8203935623168945e-05, -4.9095600843429565e-05, -3.9987266063690186e-05, -3.0878931283950806e-05, -2.1770596504211426e-05, -1.2662261724472046e-05, -3.553926944732666e-06, 5.554407835006714e-06, 1.4662742614746094e-05, 2.3771077394485474e-05, 3.2879412174224854e-05, 4.1987746953964233e-05, 5.109608173370361e-05, 6.020441651344299e-05, 6.931275129318237e-05, 7.842108607292175e-05, 8.752942085266113e-05, 9.663775563240051e-05, 0.00010574609041213989, 0.00011485442519187927, 0.00012396275997161865, 0.00013307109475135803, 0.0001421794295310974, 0.0001512877643108368, 0.00016039609909057617, 0.00016950443387031555, 0.00017861276865005493, 0.0001877211034297943, 0.0001968294382095337, 0.00020593777298927307, 0.00021504610776901245, 0.00022415444254875183, 0.0002332627773284912, 0.0002423711121082306, 0.00025147944688796997, 0.00026058778166770935, 0.00026969611644744873, 0.0002788044512271881, 0.0002879127860069275, 0.00029702112078666687, 0.00030612945556640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 1.0, 9.0, 24.0, 16.0, 44.0, 80.0, 126.0, 236.0, 412.0, 808.0, 1670.0, 3316.0, 7120.0, 15501.0, 34388.0, 78449.0, 167563.0, 273607.0, 237387.0, 125439.0, 55956.0, 24580.0, 11373.0, 5334.0, 2571.0, 1233.0, 575.0, 320.0, 165.0, 96.0, 46.0, 31.0, 19.0, 11.0, 13.0, 8.0, 2.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.41015625, -6.20855712890625, -6.0069580078125, -5.80535888671875, -5.603759765625, -5.40216064453125, -5.2005615234375, -4.99896240234375, -4.79736328125, -4.59576416015625, -4.3941650390625, -4.19256591796875, -3.990966796875, -3.78936767578125, -3.5877685546875, -3.38616943359375, -3.1845703125, -2.98297119140625, -2.7813720703125, -2.57977294921875, -2.378173828125, -2.17657470703125, -1.9749755859375, -1.77337646484375, -1.57177734375, -1.37017822265625, -1.1685791015625, -0.96697998046875, -0.765380859375, -0.56378173828125, -0.3621826171875, -0.16058349609375, 0.041015625, 0.24261474609375, 0.4442138671875, 0.64581298828125, 0.847412109375, 1.04901123046875, 1.2506103515625, 1.45220947265625, 1.65380859375, 1.85540771484375, 2.0570068359375, 2.25860595703125, 2.460205078125, 2.66180419921875, 2.8634033203125, 3.06500244140625, 3.2666015625, 3.46820068359375, 3.6697998046875, 3.87139892578125, 4.072998046875, 4.27459716796875, 4.4761962890625, 4.67779541015625, 4.87939453125, 5.08099365234375, 5.2825927734375, 5.48419189453125, 5.685791015625, 5.88739013671875, 6.0889892578125, 6.29058837890625, 6.4921875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 14.0, 2.0, 17.0, 13.0, 18.0, 23.0, 28.0, 31.0, 48.0, 47.0, 68.0, 62.0, 87.0, 76.0, 76.0, 65.0, 64.0, 67.0, 37.0, 33.0, 36.0, 25.0, 18.0, 19.0, 12.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2099609375, -1.1562957763671875, -1.102630615234375, -1.0489654541015625, -0.99530029296875, -0.9416351318359375, -0.887969970703125, -0.8343048095703125, -0.7806396484375, -0.7269744873046875, -0.673309326171875, -0.6196441650390625, -0.56597900390625, -0.5123138427734375, -0.458648681640625, -0.4049835205078125, -0.351318359375, -0.2976531982421875, -0.243988037109375, -0.1903228759765625, -0.13665771484375, -0.0829925537109375, -0.029327392578125, 0.0243377685546875, 0.0780029296875, 0.1316680908203125, 0.185333251953125, 0.2389984130859375, 0.29266357421875, 0.3463287353515625, 0.399993896484375, 0.4536590576171875, 0.50732421875, 0.5609893798828125, 0.614654541015625, 0.6683197021484375, 0.72198486328125, 0.7756500244140625, 0.829315185546875, 0.8829803466796875, 0.9366455078125, 0.9903106689453125, 1.043975830078125, 1.0976409912109375, 1.15130615234375, 1.2049713134765625, 1.258636474609375, 1.3123016357421875, 1.365966796875, 1.4196319580078125, 1.473297119140625, 1.5269622802734375, 1.58062744140625, 1.6342926025390625, 1.687957763671875, 1.7416229248046875, 1.7952880859375, 1.8489532470703125, 1.902618408203125, 1.9562835693359375, 2.00994873046875, 2.0636138916015625, 2.117279052734375, 2.1709442138671875, 2.224609375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 7.0, 9.0, 5.0, 9.0, 8.0, 24.0, 18.0, 26.0, 37.0, 40.0, 64.0, 52.0, 76.0, 60.0, 79.0, 69.0, 74.0, 59.0, 50.0, 42.0, 45.0, 36.0, 30.0, 15.0, 20.0, 13.0, 10.0, 2.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.163774490356445, -24.45777702331543, -23.75177764892578, -23.045780181884766, -22.33978271484375, -21.633785247802734, -20.92778778076172, -20.22178840637207, -19.515790939331055, -18.80979347229004, -18.10379409790039, -17.397796630859375, -16.69179916381836, -15.985801696777344, -15.279803276062012, -14.57380485534668, -13.867807388305664, -13.161809921264648, -12.455811500549316, -11.749813079833984, -11.043815612792969, -10.337818145751953, -9.631819725036621, -8.925821304321289, -8.219823837280273, -7.5138258934021, -6.807827949523926, -6.101830005645752, -5.395832061767578, -4.689834117889404, -3.9838361740112305, -3.2778382301330566, -2.571840286254883, -1.865842342376709, -1.1598443984985352, -0.45384645462036133, 0.2521514892578125, 0.9581494331359863, 1.6641473770141602, 2.370145320892334, 3.076143264770508, 3.7821412086486816, 4.4881391525268555, 5.194137096405029, 5.900135040283203, 6.606132984161377, 7.312130928039551, 8.018129348754883, 8.724126815795898, 9.430124282836914, 10.136122703552246, 10.842121124267578, 11.548118591308594, 12.25411605834961, 12.960114479064941, 13.666112899780273, 14.372110366821289, 15.078107833862305, 15.784106254577637, 16.49010467529297, 17.196102142333984, 17.902099609375, 18.608097076416016, 19.314096450805664, 20.02009391784668]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 1.0, 8.0, 10.0, 5.0, 11.0, 13.0, 18.0, 18.0, 18.0, 23.0, 27.0, 39.0, 38.0, 23.0, 37.0, 43.0, 34.0, 29.0, 36.0, 23.0, 53.0, 29.0, 47.0, 50.0, 33.0, 31.0, 32.0, 36.0, 32.0, 28.0, 19.0, 15.0, 17.0, 13.0, 17.0, 16.0, 15.0, 5.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.621931076049805, -13.190160751342773, -12.758390426635742, -12.326620101928711, -11.89484977722168, -11.463079452514648, -11.031309127807617, -10.599538803100586, -10.167768478393555, -9.735998153686523, -9.304227828979492, -8.872457504272461, -8.44068717956543, -8.008916854858398, -7.577147006988525, -7.145376682281494, -6.713606834411621, -6.28183650970459, -5.850066184997559, -5.418295860290527, -4.986525535583496, -4.554755210876465, -4.122985363006592, -3.6912150382995605, -3.2594447135925293, -2.827674388885498, -2.395904064178467, -1.9641339778900146, -1.5323636531829834, -1.1005933284759521, -0.6688232421875, -0.23705291748046875, 0.1947164535522461, 0.6264867186546326, 1.058256983757019, 1.4900271892547607, 1.921797513961792, 2.3535678386688232, 2.7853379249572754, 3.2171082496643066, 3.648878574371338, 4.080648899078369, 4.5124192237854, 4.944189071655273, 5.375959396362305, 5.807729721069336, 6.239500045776367, 6.671270370483398, 7.10304069519043, 7.534811019897461, 7.966581344604492, 8.398351669311523, 8.830121994018555, 9.261892318725586, 9.693662643432617, 10.125432968139648, 10.55720329284668, 10.988973617553711, 11.420743942260742, 11.852514266967773, 12.284284591674805, 12.716054916381836, 13.147825241088867, 13.579595565795898, 14.011364936828613]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 11.0, 15.0, 28.0, 38.0, 69.0, 102.0, 134.0, 249.0, 398.0, 612.0, 1052.0, 1662.0, 2864.0, 4796.0, 7838.0, 13628.0, 24020.0, 42188.0, 74492.0, 124950.0, 181463.0, 195827.0, 151193.0, 93339.0, 54378.0, 30750.0, 17430.0, 10080.0, 5987.0, 3579.0, 2042.0, 1277.0, 746.0, 461.0, 316.0, 190.0, 117.0, 84.0, 49.0, 37.0, 23.0, 16.0, 7.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.625, -17.987548828125, -17.35009765625, -16.712646484375, -16.0751953125, -15.437744140625, -14.80029296875, -14.162841796875, -13.525390625, -12.887939453125, -12.25048828125, -11.613037109375, -10.9755859375, -10.338134765625, -9.70068359375, -9.063232421875, -8.42578125, -7.788330078125, -7.15087890625, -6.513427734375, -5.8759765625, -5.238525390625, -4.60107421875, -3.963623046875, -3.326171875, -2.688720703125, -2.05126953125, -1.413818359375, -0.7763671875, -0.138916015625, 0.49853515625, 1.135986328125, 1.7734375, 2.410888671875, 3.04833984375, 3.685791015625, 4.3232421875, 4.960693359375, 5.59814453125, 6.235595703125, 6.873046875, 7.510498046875, 8.14794921875, 8.785400390625, 9.4228515625, 10.060302734375, 10.69775390625, 11.335205078125, 11.97265625, 12.610107421875, 13.24755859375, 13.885009765625, 14.5224609375, 15.159912109375, 15.79736328125, 16.434814453125, 17.072265625, 17.709716796875, 18.34716796875, 18.984619140625, 19.6220703125, 20.259521484375, 20.89697265625, 21.534423828125, 22.171875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 6.0, 3.0, 12.0, 9.0, 9.0, 19.0, 20.0, 26.0, 16.0, 33.0, 34.0, 38.0, 36.0, 36.0, 37.0, 35.0, 37.0, 45.0, 39.0, 46.0, 58.0, 30.0, 40.0, 31.0, 36.0, 34.0, 22.0, 29.0, 28.0, 22.0, 17.0, 16.0, 16.0, 15.0, 16.0, 7.0, 9.0, 9.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.5546875, -14.083984375, -13.61328125, -13.142578125, -12.671875, -12.201171875, -11.73046875, -11.259765625, -10.7890625, -10.318359375, -9.84765625, -9.376953125, -8.90625, -8.435546875, -7.96484375, -7.494140625, -7.0234375, -6.552734375, -6.08203125, -5.611328125, -5.140625, -4.669921875, -4.19921875, -3.728515625, -3.2578125, -2.787109375, -2.31640625, -1.845703125, -1.375, -0.904296875, -0.43359375, 0.037109375, 0.5078125, 0.978515625, 1.44921875, 1.919921875, 2.390625, 2.861328125, 3.33203125, 3.802734375, 4.2734375, 4.744140625, 5.21484375, 5.685546875, 6.15625, 6.626953125, 7.09765625, 7.568359375, 8.0390625, 8.509765625, 8.98046875, 9.451171875, 9.921875, 10.392578125, 10.86328125, 11.333984375, 11.8046875, 12.275390625, 12.74609375, 13.216796875, 13.6875, 14.158203125, 14.62890625, 15.099609375, 15.5703125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 14.0, 18.0, 28.0, 58.0, 63.0, 87.0, 156.0, 224.0, 287.0, 492.0, 725.0, 998.0, 1591.0, 2453.0, 3868.0, 5961.0, 9448.0, 15193.0, 24339.0, 38675.0, 60967.0, 91595.0, 126402.0, 150982.0, 149699.0, 122074.0, 86751.0, 56850.0, 36261.0, 23166.0, 14225.0, 8953.0, 5636.0, 3586.0, 2346.0, 1450.0, 941.0, 652.0, 426.0, 326.0, 197.0, 110.0, 84.0, 55.0, 33.0, 29.0, 24.0, 12.0, 11.0, 10.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-14.2265625, -13.7666015625, -13.306640625, -12.8466796875, -12.38671875, -11.9267578125, -11.466796875, -11.0068359375, -10.546875, -10.0869140625, -9.626953125, -9.1669921875, -8.70703125, -8.2470703125, -7.787109375, -7.3271484375, -6.8671875, -6.4072265625, -5.947265625, -5.4873046875, -5.02734375, -4.5673828125, -4.107421875, -3.6474609375, -3.1875, -2.7275390625, -2.267578125, -1.8076171875, -1.34765625, -0.8876953125, -0.427734375, 0.0322265625, 0.4921875, 0.9521484375, 1.412109375, 1.8720703125, 2.33203125, 2.7919921875, 3.251953125, 3.7119140625, 4.171875, 4.6318359375, 5.091796875, 5.5517578125, 6.01171875, 6.4716796875, 6.931640625, 7.3916015625, 7.8515625, 8.3115234375, 8.771484375, 9.2314453125, 9.69140625, 10.1513671875, 10.611328125, 11.0712890625, 11.53125, 11.9912109375, 12.451171875, 12.9111328125, 13.37109375, 13.8310546875, 14.291015625, 14.7509765625, 15.2109375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 6.0, 3.0, 5.0, 5.0, 7.0, 11.0, 12.0, 15.0, 22.0, 19.0, 19.0, 23.0, 38.0, 29.0, 25.0, 25.0, 31.0, 39.0, 44.0, 39.0, 39.0, 42.0, 45.0, 39.0, 34.0, 39.0, 35.0, 36.0, 32.0, 23.0, 32.0, 19.0, 13.0, 30.0, 23.0, 13.0, 16.0, 11.0, 15.0, 8.0, 7.0, 7.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.2578125, -7.9957275390625, -7.733642578125, -7.4715576171875, -7.20947265625, -6.9473876953125, -6.685302734375, -6.4232177734375, -6.1611328125, -5.8990478515625, -5.636962890625, -5.3748779296875, -5.11279296875, -4.8507080078125, -4.588623046875, -4.3265380859375, -4.064453125, -3.8023681640625, -3.540283203125, -3.2781982421875, -3.01611328125, -2.7540283203125, -2.491943359375, -2.2298583984375, -1.9677734375, -1.7056884765625, -1.443603515625, -1.1815185546875, -0.91943359375, -0.6573486328125, -0.395263671875, -0.1331787109375, 0.12890625, 0.3909912109375, 0.653076171875, 0.9151611328125, 1.17724609375, 1.4393310546875, 1.701416015625, 1.9635009765625, 2.2255859375, 2.4876708984375, 2.749755859375, 3.0118408203125, 3.27392578125, 3.5360107421875, 3.798095703125, 4.0601806640625, 4.322265625, 4.5843505859375, 4.846435546875, 5.1085205078125, 5.37060546875, 5.6326904296875, 5.894775390625, 6.1568603515625, 6.4189453125, 6.6810302734375, 6.943115234375, 7.2052001953125, 7.46728515625, 7.7293701171875, 7.991455078125, 8.2535400390625, 8.515625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 11.0, 14.0, 15.0, 15.0, 29.0, 46.0, 62.0, 83.0, 129.0, 166.0, 241.0, 343.0, 521.0, 802.0, 1304.0, 1992.0, 3377.0, 5511.0, 9448.0, 18005.0, 35975.0, 76022.0, 163394.0, 274350.0, 229353.0, 115912.0, 53044.0, 25814.0, 13461.0, 7388.0, 4330.0, 2559.0, 1626.0, 1073.0, 737.0, 455.0, 291.0, 192.0, 128.0, 108.0, 73.0, 49.0, 23.0, 28.0, 17.0, 8.0, 11.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-14.8203125, -14.3680419921875, -13.915771484375, -13.4635009765625, -13.01123046875, -12.5589599609375, -12.106689453125, -11.6544189453125, -11.2021484375, -10.7498779296875, -10.297607421875, -9.8453369140625, -9.39306640625, -8.9407958984375, -8.488525390625, -8.0362548828125, -7.583984375, -7.1317138671875, -6.679443359375, -6.2271728515625, -5.77490234375, -5.3226318359375, -4.870361328125, -4.4180908203125, -3.9658203125, -3.5135498046875, -3.061279296875, -2.6090087890625, -2.15673828125, -1.7044677734375, -1.252197265625, -0.7999267578125, -0.34765625, 0.1046142578125, 0.556884765625, 1.0091552734375, 1.46142578125, 1.9136962890625, 2.365966796875, 2.8182373046875, 3.2705078125, 3.7227783203125, 4.175048828125, 4.6273193359375, 5.07958984375, 5.5318603515625, 5.984130859375, 6.4364013671875, 6.888671875, 7.3409423828125, 7.793212890625, 8.2454833984375, 8.69775390625, 9.1500244140625, 9.602294921875, 10.0545654296875, 10.5068359375, 10.9591064453125, 11.411376953125, 11.8636474609375, 12.31591796875, 12.7681884765625, 13.220458984375, 13.6727294921875, 14.125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 5.0, 1.0, 1.0, 5.0, 5.0, 16.0, 8.0, 16.0, 13.0, 44.0, 40.0, 71.0, 71.0, 80.0, 86.0, 108.0, 93.0, 78.0, 59.0, 53.0, 27.0, 27.0, 33.0, 15.0, 10.0, 7.0, 11.0, 0.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013074874877929688, -0.0012574195861816406, -0.0012073516845703125, -0.0011572837829589844, -0.0011072158813476562, -0.0010571479797363281, -0.001007080078125, -0.0009570121765136719, -0.0009069442749023438, -0.0008568763732910156, -0.0008068084716796875, -0.0007567405700683594, -0.0007066726684570312, -0.0006566047668457031, -0.000606536865234375, -0.0005564689636230469, -0.0005064010620117188, -0.0004563331604003906, -0.0004062652587890625, -0.0003561973571777344, -0.00030612945556640625, -0.0002560615539550781, -0.00020599365234375, -0.00015592575073242188, -0.00010585784912109375, -5.5789947509765625e-05, -5.7220458984375e-06, 4.4345855712890625e-05, 9.441375732421875e-05, 0.00014448165893554688, 0.000194549560546875, 0.0002446174621582031, 0.00029468536376953125, 0.0003447532653808594, 0.0003948211669921875, 0.0004448890686035156, 0.0004949569702148438, 0.0005450248718261719, 0.0005950927734375, 0.0006451606750488281, 0.0006952285766601562, 0.0007452964782714844, 0.0007953643798828125, 0.0008454322814941406, 0.0008955001831054688, 0.0009455680847167969, 0.000995635986328125, 0.0010457038879394531, 0.0010957717895507812, 0.0011458396911621094, 0.0011959075927734375, 0.0012459754943847656, 0.0012960433959960938, 0.0013461112976074219, 0.00139617919921875, 0.0014462471008300781, 0.0014963150024414062, 0.0015463829040527344, 0.0015964508056640625, 0.0016465187072753906, 0.0016965866088867188, 0.0017466545104980469, 0.001796722412109375, 0.0018467903137207031, 0.0018968582153320312]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 5.0, 5.0, 7.0, 9.0, 21.0, 27.0, 17.0, 35.0, 46.0, 74.0, 82.0, 95.0, 144.0, 223.0, 290.0, 427.0, 580.0, 951.0, 1438.0, 2405.0, 4330.0, 8064.0, 16655.0, 37467.0, 94818.0, 240690.0, 336052.0, 178423.0, 68487.0, 28148.0, 12760.0, 6398.0, 3497.0, 2058.0, 1188.0, 807.0, 530.0, 334.0, 268.0, 199.0, 138.0, 99.0, 75.0, 55.0, 22.0, 30.0, 16.0, 22.0, 15.0, 11.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.140625, -16.575439453125, -16.01025390625, -15.445068359375, -14.8798828125, -14.314697265625, -13.74951171875, -13.184326171875, -12.619140625, -12.053955078125, -11.48876953125, -10.923583984375, -10.3583984375, -9.793212890625, -9.22802734375, -8.662841796875, -8.09765625, -7.532470703125, -6.96728515625, -6.402099609375, -5.8369140625, -5.271728515625, -4.70654296875, -4.141357421875, -3.576171875, -3.010986328125, -2.44580078125, -1.880615234375, -1.3154296875, -0.750244140625, -0.18505859375, 0.380126953125, 0.9453125, 1.510498046875, 2.07568359375, 2.640869140625, 3.2060546875, 3.771240234375, 4.33642578125, 4.901611328125, 5.466796875, 6.031982421875, 6.59716796875, 7.162353515625, 7.7275390625, 8.292724609375, 8.85791015625, 9.423095703125, 9.98828125, 10.553466796875, 11.11865234375, 11.683837890625, 12.2490234375, 12.814208984375, 13.37939453125, 13.944580078125, 14.509765625, 15.074951171875, 15.64013671875, 16.205322265625, 16.7705078125, 17.335693359375, 17.90087890625, 18.466064453125, 19.03125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 6.0, 9.0, 5.0, 16.0, 20.0, 29.0, 26.0, 39.0, 22.0, 39.0, 59.0, 63.0, 73.0, 72.0, 93.0, 71.0, 69.0, 63.0, 54.0, 37.0, 33.0, 20.0, 16.0, 16.0, 11.0, 8.0, 9.0, 8.0, 5.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -4.00274658203125, -3.8648681640625, -3.72698974609375, -3.589111328125, -3.45123291015625, -3.3133544921875, -3.17547607421875, -3.03759765625, -2.89971923828125, -2.7618408203125, -2.62396240234375, -2.486083984375, -2.34820556640625, -2.2103271484375, -2.07244873046875, -1.9345703125, -1.79669189453125, -1.6588134765625, -1.52093505859375, -1.383056640625, -1.24517822265625, -1.1072998046875, -0.96942138671875, -0.83154296875, -0.69366455078125, -0.5557861328125, -0.41790771484375, -0.280029296875, -0.14215087890625, -0.0042724609375, 0.13360595703125, 0.271484375, 0.40936279296875, 0.5472412109375, 0.68511962890625, 0.822998046875, 0.96087646484375, 1.0987548828125, 1.23663330078125, 1.37451171875, 1.51239013671875, 1.6502685546875, 1.78814697265625, 1.926025390625, 2.06390380859375, 2.2017822265625, 2.33966064453125, 2.4775390625, 2.61541748046875, 2.7532958984375, 2.89117431640625, 3.029052734375, 3.16693115234375, 3.3048095703125, 3.44268798828125, 3.58056640625, 3.71844482421875, 3.8563232421875, 3.99420166015625, 4.132080078125, 4.26995849609375, 4.4078369140625, 4.54571533203125, 4.68359375]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 7.0, 12.0, 10.0, 20.0, 25.0, 32.0, 34.0, 41.0, 45.0, 46.0, 64.0, 73.0, 90.0, 60.0, 72.0, 58.0, 58.0, 61.0, 39.0, 33.0, 25.0, 21.0, 19.0, 9.0, 9.0, 5.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.214067459106445, -25.52163314819336, -24.82919692993164, -24.136760711669922, -23.444326400756836, -22.75189208984375, -22.05945587158203, -21.367019653320312, -20.674585342407227, -19.98215103149414, -19.289714813232422, -18.597278594970703, -17.904844284057617, -17.21240997314453, -16.519973754882812, -15.82753849029541, -15.135103225708008, -14.442667961120605, -13.750232696533203, -13.0577974319458, -12.365362167358398, -11.672926902770996, -10.980491638183594, -10.288056373596191, -9.595621109008789, -8.903185844421387, -8.210750579833984, -7.518315315246582, -6.82588005065918, -6.133444786071777, -5.441009521484375, -4.748574256896973, -4.05613899230957, -3.363703727722168, -2.6712684631347656, -1.9788331985473633, -1.286397933959961, -0.5939626693725586, 0.09847259521484375, 0.7909078598022461, 1.4833431243896484, 2.175778388977051, 2.868213653564453, 3.5606489181518555, 4.253084182739258, 4.94551944732666, 5.6379547119140625, 6.330389976501465, 7.022825241088867, 7.7152605056762695, 8.407695770263672, 9.100131034851074, 9.792566299438477, 10.485001564025879, 11.177436828613281, 11.869872093200684, 12.562307357788086, 13.254742622375488, 13.94717788696289, 14.639613151550293, 15.332048416137695, 16.02448272705078, 16.7169189453125, 17.40935516357422, 18.101789474487305]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 7.0, 10.0, 7.0, 13.0, 9.0, 9.0, 17.0, 29.0, 16.0, 11.0, 27.0, 33.0, 27.0, 30.0, 30.0, 28.0, 35.0, 39.0, 38.0, 29.0, 37.0, 30.0, 38.0, 39.0, 38.0, 34.0, 36.0, 32.0, 24.0, 27.0, 28.0, 28.0, 14.0, 13.0, 17.0, 13.0, 7.0, 12.0, 10.0, 17.0, 12.0, 7.0, 9.0, 7.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.033554077148438, -11.64134407043457, -11.249134063720703, -10.856924057006836, -10.464715003967285, -10.072504997253418, -9.68029499053955, -9.288084983825684, -8.895875930786133, -8.503665924072266, -8.111455917358398, -7.7192463874816895, -7.3270368576049805, -6.934826850891113, -6.542616844177246, -6.150406837463379, -5.758196830749512, -5.3659868240356445, -4.9737772941589355, -4.581567287445068, -4.189357757568359, -3.797147750854492, -3.404937744140625, -3.012727975845337, -2.620518207550049, -2.2283084392547607, -1.836098551750183, -1.4438886642456055, -1.0516788959503174, -0.6594691276550293, -0.2672591209411621, 0.12495064735412598, 0.5171594619750977, 0.9093692898750305, 1.3015791177749634, 1.693789005279541, 2.085998773574829, 2.478208541870117, 2.8704185485839844, 3.2626283168792725, 3.6548380851745605, 4.047048091888428, 4.439257621765137, 4.831467628479004, 5.223677635192871, 5.61588716506958, 6.008097171783447, 6.400306701660156, 6.792516708374023, 7.184726715087891, 7.5769362449646, 7.969146251678467, 8.361355781555176, 8.753565788269043, 9.14577579498291, 9.537985801696777, 9.930194854736328, 10.322404861450195, 10.714614868164062, 11.10682487487793, 11.49903392791748, 11.891243934631348, 12.283453941345215, 12.675663948059082, 13.06787395477295]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 12.0, 11.0, 14.0, 22.0, 32.0, 49.0, 57.0, 83.0, 125.0, 151.0, 234.0, 329.0, 519.0, 772.0, 1212.0, 1940.0, 3078.0, 5179.0, 8514.0, 15172.0, 28021.0, 55532.0, 119509.0, 288329.0, 731860.0, 1286022.0, 953670.0, 389978.0, 153838.0, 69258.0, 34394.0, 18656.0, 10480.0, 6281.0, 3786.0, 2383.0, 1505.0, 1082.0, 665.0, 450.0, 315.0, 209.0, 153.0, 114.0, 80.0, 49.0, 38.0, 32.0, 26.0, 19.0, 14.0, 14.0, 5.0, 2.0, 3.0, 3.0, 3.0], "bins": [-20.84375, -20.20556640625, -19.5673828125, -18.92919921875, -18.291015625, -17.65283203125, -17.0146484375, -16.37646484375, -15.73828125, -15.10009765625, -14.4619140625, -13.82373046875, -13.185546875, -12.54736328125, -11.9091796875, -11.27099609375, -10.6328125, -9.99462890625, -9.3564453125, -8.71826171875, -8.080078125, -7.44189453125, -6.8037109375, -6.16552734375, -5.52734375, -4.88916015625, -4.2509765625, -3.61279296875, -2.974609375, -2.33642578125, -1.6982421875, -1.06005859375, -0.421875, 0.21630859375, 0.8544921875, 1.49267578125, 2.130859375, 2.76904296875, 3.4072265625, 4.04541015625, 4.68359375, 5.32177734375, 5.9599609375, 6.59814453125, 7.236328125, 7.87451171875, 8.5126953125, 9.15087890625, 9.7890625, 10.42724609375, 11.0654296875, 11.70361328125, 12.341796875, 12.97998046875, 13.6181640625, 14.25634765625, 14.89453125, 15.53271484375, 16.1708984375, 16.80908203125, 17.447265625, 18.08544921875, 18.7236328125, 19.36181640625, 20.0]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 6.0, 5.0, 5.0, 12.0, 11.0, 14.0, 14.0, 21.0, 17.0, 23.0, 30.0, 34.0, 27.0, 27.0, 35.0, 39.0, 35.0, 27.0, 35.0, 35.0, 47.0, 31.0, 40.0, 38.0, 40.0, 26.0, 39.0, 39.0, 29.0, 29.0, 26.0, 15.0, 15.0, 17.0, 16.0, 12.0, 13.0, 10.0, 16.0, 11.0, 2.0, 6.0, 6.0, 4.0, 9.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7734375, -8.4896240234375, -8.205810546875, -7.9219970703125, -7.63818359375, -7.3543701171875, -7.070556640625, -6.7867431640625, -6.5029296875, -6.2191162109375, -5.935302734375, -5.6514892578125, -5.36767578125, -5.0838623046875, -4.800048828125, -4.5162353515625, -4.232421875, -3.9486083984375, -3.664794921875, -3.3809814453125, -3.09716796875, -2.8133544921875, -2.529541015625, -2.2457275390625, -1.9619140625, -1.6781005859375, -1.394287109375, -1.1104736328125, -0.82666015625, -0.5428466796875, -0.259033203125, 0.0247802734375, 0.30859375, 0.5924072265625, 0.876220703125, 1.1600341796875, 1.44384765625, 1.7276611328125, 2.011474609375, 2.2952880859375, 2.5791015625, 2.8629150390625, 3.146728515625, 3.4305419921875, 3.71435546875, 3.9981689453125, 4.281982421875, 4.5657958984375, 4.849609375, 5.1334228515625, 5.417236328125, 5.7010498046875, 5.98486328125, 6.2686767578125, 6.552490234375, 6.8363037109375, 7.1201171875, 7.4039306640625, 7.687744140625, 7.9715576171875, 8.25537109375, 8.5391845703125, 8.822998046875, 9.1068115234375, 9.390625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 12.0, 22.0, 27.0, 29.0, 49.0, 75.0, 85.0, 135.0, 204.0, 334.0, 489.0, 739.0, 1194.0, 1783.0, 3094.0, 5148.0, 9200.0, 16625.0, 31681.0, 63107.0, 135113.0, 303634.0, 692123.0, 1201549.0, 930093.0, 430343.0, 188741.0, 86506.0, 42134.0, 21741.0, 11851.0, 6508.0, 3752.0, 2309.0, 1383.0, 862.0, 545.0, 373.0, 248.0, 146.0, 106.0, 55.0, 52.0, 31.0, 25.0, 17.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.74755859375, -19.1044921875, -18.46142578125, -17.818359375, -17.17529296875, -16.5322265625, -15.88916015625, -15.24609375, -14.60302734375, -13.9599609375, -13.31689453125, -12.673828125, -12.03076171875, -11.3876953125, -10.74462890625, -10.1015625, -9.45849609375, -8.8154296875, -8.17236328125, -7.529296875, -6.88623046875, -6.2431640625, -5.60009765625, -4.95703125, -4.31396484375, -3.6708984375, -3.02783203125, -2.384765625, -1.74169921875, -1.0986328125, -0.45556640625, 0.1875, 0.83056640625, 1.4736328125, 2.11669921875, 2.759765625, 3.40283203125, 4.0458984375, 4.68896484375, 5.33203125, 5.97509765625, 6.6181640625, 7.26123046875, 7.904296875, 8.54736328125, 9.1904296875, 9.83349609375, 10.4765625, 11.11962890625, 11.7626953125, 12.40576171875, 13.048828125, 13.69189453125, 14.3349609375, 14.97802734375, 15.62109375, 16.26416015625, 16.9072265625, 17.55029296875, 18.193359375, 18.83642578125, 19.4794921875, 20.12255859375, 20.765625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 6.0, 3.0, 5.0, 5.0, 4.0, 10.0, 2.0, 10.0, 12.0, 20.0, 17.0, 20.0, 33.0, 54.0, 54.0, 72.0, 89.0, 128.0, 132.0, 173.0, 215.0, 270.0, 301.0, 337.0, 309.0, 316.0, 238.0, 222.0, 193.0, 194.0, 131.0, 106.0, 98.0, 79.0, 50.0, 38.0, 31.0, 22.0, 25.0, 16.0, 11.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.390625, -6.1982421875, -6.005859375, -5.8134765625, -5.62109375, -5.4287109375, -5.236328125, -5.0439453125, -4.8515625, -4.6591796875, -4.466796875, -4.2744140625, -4.08203125, -3.8896484375, -3.697265625, -3.5048828125, -3.3125, -3.1201171875, -2.927734375, -2.7353515625, -2.54296875, -2.3505859375, -2.158203125, -1.9658203125, -1.7734375, -1.5810546875, -1.388671875, -1.1962890625, -1.00390625, -0.8115234375, -0.619140625, -0.4267578125, -0.234375, -0.0419921875, 0.150390625, 0.3427734375, 0.53515625, 0.7275390625, 0.919921875, 1.1123046875, 1.3046875, 1.4970703125, 1.689453125, 1.8818359375, 2.07421875, 2.2666015625, 2.458984375, 2.6513671875, 2.84375, 3.0361328125, 3.228515625, 3.4208984375, 3.61328125, 3.8056640625, 3.998046875, 4.1904296875, 4.3828125, 4.5751953125, 4.767578125, 4.9599609375, 5.15234375, 5.3447265625, 5.537109375, 5.7294921875, 5.921875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 13.0, 14.0, 8.0, 20.0, 26.0, 33.0, 36.0, 42.0, 51.0, 62.0, 79.0, 89.0, 78.0, 70.0, 73.0, 55.0, 43.0, 42.0, 35.0, 18.0, 15.0, 22.0, 18.0, 9.0, 14.0, 6.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.06292724609375, -26.371339797973633, -25.679750442504883, -24.988162994384766, -24.29657554626465, -23.60498809814453, -22.91339874267578, -22.221811294555664, -21.530223846435547, -20.83863639831543, -20.14704704284668, -19.455459594726562, -18.763872146606445, -18.072284698486328, -17.380695343017578, -16.68910789489746, -15.997518539428711, -15.305930137634277, -14.61434268951416, -13.922754287719727, -13.23116683959961, -12.539578437805176, -11.847990036010742, -11.156402587890625, -10.464814186096191, -9.773225784301758, -9.08163833618164, -8.390049934387207, -7.698462009429932, -7.006874084472656, -6.315285682678223, -5.623697757720947, -4.932111740112305, -4.240523815155029, -3.548935651779175, -2.8573474884033203, -2.165759563446045, -1.4741716384887695, -0.7825832366943359, -0.09099531173706055, 0.6005926132202148, 1.2921806573867798, 1.9837687015533447, 2.675356864929199, 3.3669447898864746, 4.05853271484375, 4.750121116638184, 5.441709041595459, 6.133296966552734, 6.82488489151001, 7.516472816467285, 8.208061218261719, 8.899648666381836, 9.59123706817627, 10.282825469970703, 10.97441291809082, 11.666001319885254, 12.357589721679688, 13.049177169799805, 13.740765571594238, 14.432353973388672, 15.123941421508789, 15.815529823303223, 16.507118225097656, 17.198705673217773]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 5.0, 6.0, 5.0, 16.0, 11.0, 17.0, 18.0, 17.0, 17.0, 19.0, 15.0, 30.0, 31.0, 36.0, 38.0, 32.0, 33.0, 48.0, 36.0, 43.0, 42.0, 47.0, 36.0, 43.0, 39.0, 31.0, 32.0, 39.0, 17.0, 22.0, 32.0, 22.0, 21.0, 21.0, 13.0, 7.0, 14.0, 12.0, 9.0, 6.0, 6.0, 7.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.914490699768066, -12.507570266723633, -12.100648880004883, -11.69372844696045, -11.286808013916016, -10.879887580871582, -10.472967147827148, -10.066045761108398, -9.659125328063965, -9.252204895019531, -8.845283508300781, -8.438363075256348, -8.031442642211914, -7.6245222091674805, -7.217601299285889, -6.810680389404297, -6.403759956359863, -5.99683952331543, -5.589918613433838, -5.182997703552246, -4.7760772705078125, -4.369156837463379, -3.962235927581787, -3.5553152561187744, -3.1483945846557617, -2.741473913192749, -2.3345532417297363, -1.9276325702667236, -1.520711898803711, -1.1137912273406982, -0.7068705558776855, -0.29994988441467285, 0.10697174072265625, 0.513892412185669, 0.9208130836486816, 1.3277337551116943, 1.734654426574707, 2.1415750980377197, 2.5484957695007324, 2.955416440963745, 3.362337112426758, 3.7692577838897705, 4.176178455352783, 4.583099365234375, 4.990019798278809, 5.396940231323242, 5.803861141204834, 6.210782051086426, 6.617702484130859, 7.024622917175293, 7.431543827056885, 7.838464736938477, 8.24538516998291, 8.652305603027344, 9.059226989746094, 9.466147422790527, 9.873067855834961, 10.279988288879395, 10.686908721923828, 11.093830108642578, 11.500750541687012, 11.907670974731445, 12.314592361450195, 12.721512794494629, 13.128433227539062]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 4.0, 16.0, 20.0, 29.0, 41.0, 74.0, 117.0, 189.0, 279.0, 419.0, 658.0, 1146.0, 1761.0, 2840.0, 4968.0, 8361.0, 14657.0, 27010.0, 51107.0, 99314.0, 180780.0, 242880.0, 187837.0, 104539.0, 53690.0, 28316.0, 15758.0, 8735.0, 4976.0, 2994.0, 1848.0, 1168.0, 745.0, 457.0, 279.0, 178.0, 130.0, 85.0, 46.0, 33.0, 19.0, 15.0, 10.0, 7.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7734375, -11.400146484375, -11.02685546875, -10.653564453125, -10.2802734375, -9.906982421875, -9.53369140625, -9.160400390625, -8.787109375, -8.413818359375, -8.04052734375, -7.667236328125, -7.2939453125, -6.920654296875, -6.54736328125, -6.174072265625, -5.80078125, -5.427490234375, -5.05419921875, -4.680908203125, -4.3076171875, -3.934326171875, -3.56103515625, -3.187744140625, -2.814453125, -2.441162109375, -2.06787109375, -1.694580078125, -1.3212890625, -0.947998046875, -0.57470703125, -0.201416015625, 0.171875, 0.545166015625, 0.91845703125, 1.291748046875, 1.6650390625, 2.038330078125, 2.41162109375, 2.784912109375, 3.158203125, 3.531494140625, 3.90478515625, 4.278076171875, 4.6513671875, 5.024658203125, 5.39794921875, 5.771240234375, 6.14453125, 6.517822265625, 6.89111328125, 7.264404296875, 7.6376953125, 8.010986328125, 8.38427734375, 8.757568359375, 9.130859375, 9.504150390625, 9.87744140625, 10.250732421875, 10.6240234375, 10.997314453125, 11.37060546875, 11.743896484375, 12.1171875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 12.0, 8.0, 6.0, 13.0, 13.0, 14.0, 17.0, 27.0, 27.0, 23.0, 33.0, 23.0, 27.0, 38.0, 31.0, 42.0, 36.0, 44.0, 41.0, 41.0, 46.0, 48.0, 39.0, 35.0, 36.0, 30.0, 32.0, 24.0, 35.0, 21.0, 19.0, 14.0, 17.0, 12.0, 10.0, 6.0, 13.0, 10.0, 7.0, 3.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-13.3671875, -12.9522705078125, -12.537353515625, -12.1224365234375, -11.70751953125, -11.2926025390625, -10.877685546875, -10.4627685546875, -10.0478515625, -9.6329345703125, -9.218017578125, -8.8031005859375, -8.38818359375, -7.9732666015625, -7.558349609375, -7.1434326171875, -6.728515625, -6.3135986328125, -5.898681640625, -5.4837646484375, -5.06884765625, -4.6539306640625, -4.239013671875, -3.8240966796875, -3.4091796875, -2.9942626953125, -2.579345703125, -2.1644287109375, -1.74951171875, -1.3345947265625, -0.919677734375, -0.5047607421875, -0.08984375, 0.3250732421875, 0.739990234375, 1.1549072265625, 1.56982421875, 1.9847412109375, 2.399658203125, 2.8145751953125, 3.2294921875, 3.6444091796875, 4.059326171875, 4.4742431640625, 4.88916015625, 5.3040771484375, 5.718994140625, 6.1339111328125, 6.548828125, 6.9637451171875, 7.378662109375, 7.7935791015625, 8.20849609375, 8.6234130859375, 9.038330078125, 9.4532470703125, 9.8681640625, 10.2830810546875, 10.697998046875, 11.1129150390625, 11.52783203125, 11.9427490234375, 12.357666015625, 12.7725830078125, 13.1875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 9.0, 3.0, 9.0, 11.0, 15.0, 33.0, 25.0, 42.0, 62.0, 68.0, 120.0, 172.0, 242.0, 414.0, 593.0, 949.0, 1614.0, 2685.0, 4832.0, 9167.0, 19461.0, 45274.0, 117015.0, 288423.0, 320044.0, 138169.0, 52995.0, 22313.0, 10560.0, 5404.0, 3086.0, 1763.0, 1031.0, 680.0, 400.0, 269.0, 168.0, 136.0, 88.0, 60.0, 48.0, 32.0, 23.0, 20.0, 7.0, 10.0, 5.0, 4.0, 8.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-19.015625, -18.457763671875, -17.89990234375, -17.342041015625, -16.7841796875, -16.226318359375, -15.66845703125, -15.110595703125, -14.552734375, -13.994873046875, -13.43701171875, -12.879150390625, -12.3212890625, -11.763427734375, -11.20556640625, -10.647705078125, -10.08984375, -9.531982421875, -8.97412109375, -8.416259765625, -7.8583984375, -7.300537109375, -6.74267578125, -6.184814453125, -5.626953125, -5.069091796875, -4.51123046875, -3.953369140625, -3.3955078125, -2.837646484375, -2.27978515625, -1.721923828125, -1.1640625, -0.606201171875, -0.04833984375, 0.509521484375, 1.0673828125, 1.625244140625, 2.18310546875, 2.740966796875, 3.298828125, 3.856689453125, 4.41455078125, 4.972412109375, 5.5302734375, 6.088134765625, 6.64599609375, 7.203857421875, 7.76171875, 8.319580078125, 8.87744140625, 9.435302734375, 9.9931640625, 10.551025390625, 11.10888671875, 11.666748046875, 12.224609375, 12.782470703125, 13.34033203125, 13.898193359375, 14.4560546875, 15.013916015625, 15.57177734375, 16.129638671875, 16.6875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 17.0, 15.0, 18.0, 12.0, 30.0, 22.0, 28.0, 31.0, 28.0, 31.0, 40.0, 39.0, 33.0, 31.0, 49.0, 33.0, 36.0, 52.0, 42.0, 38.0, 43.0, 41.0, 33.0, 34.0, 30.0, 34.0, 23.0, 20.0, 16.0, 13.0, 15.0, 12.0, 14.0, 8.0, 6.0, 2.0, 2.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.375, -8.12347412109375, -7.8719482421875, -7.62042236328125, -7.368896484375, -7.11737060546875, -6.8658447265625, -6.61431884765625, -6.36279296875, -6.11126708984375, -5.8597412109375, -5.60821533203125, -5.356689453125, -5.10516357421875, -4.8536376953125, -4.60211181640625, -4.3505859375, -4.09906005859375, -3.8475341796875, -3.59600830078125, -3.344482421875, -3.09295654296875, -2.8414306640625, -2.58990478515625, -2.33837890625, -2.08685302734375, -1.8353271484375, -1.58380126953125, -1.332275390625, -1.08074951171875, -0.8292236328125, -0.57769775390625, -0.326171875, -0.07464599609375, 0.1768798828125, 0.42840576171875, 0.679931640625, 0.93145751953125, 1.1829833984375, 1.43450927734375, 1.68603515625, 1.93756103515625, 2.1890869140625, 2.44061279296875, 2.692138671875, 2.94366455078125, 3.1951904296875, 3.44671630859375, 3.6982421875, 3.94976806640625, 4.2012939453125, 4.45281982421875, 4.704345703125, 4.95587158203125, 5.2073974609375, 5.45892333984375, 5.71044921875, 5.96197509765625, 6.2135009765625, 6.46502685546875, 6.716552734375, 6.96807861328125, 7.2196044921875, 7.47113037109375, 7.72265625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 14.0, 14.0, 15.0, 25.0, 35.0, 45.0, 75.0, 106.0, 171.0, 171.0, 281.0, 419.0, 646.0, 892.0, 1468.0, 2383.0, 3917.0, 6672.0, 12352.0, 24419.0, 52547.0, 121028.0, 269068.0, 294144.0, 137742.0, 59960.0, 27469.0, 13890.0, 7412.0, 4114.0, 2524.0, 1545.0, 1002.0, 609.0, 394.0, 304.0, 202.0, 143.0, 115.0, 70.0, 52.0, 27.0, 25.0, 17.0, 12.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.473876953125, -5.30322265625, -5.132568359375, -4.9619140625, -4.791259765625, -4.62060546875, -4.449951171875, -4.279296875, -4.108642578125, -3.93798828125, -3.767333984375, -3.5966796875, -3.426025390625, -3.25537109375, -3.084716796875, -2.9140625, -2.743408203125, -2.57275390625, -2.402099609375, -2.2314453125, -2.060791015625, -1.89013671875, -1.719482421875, -1.548828125, -1.378173828125, -1.20751953125, -1.036865234375, -0.8662109375, -0.695556640625, -0.52490234375, -0.354248046875, -0.18359375, -0.012939453125, 0.15771484375, 0.328369140625, 0.4990234375, 0.669677734375, 0.84033203125, 1.010986328125, 1.181640625, 1.352294921875, 1.52294921875, 1.693603515625, 1.8642578125, 2.034912109375, 2.20556640625, 2.376220703125, 2.546875, 2.717529296875, 2.88818359375, 3.058837890625, 3.2294921875, 3.400146484375, 3.57080078125, 3.741455078125, 3.912109375, 4.082763671875, 4.25341796875, 4.424072265625, 4.5947265625, 4.765380859375, 4.93603515625, 5.106689453125, 5.27734375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 14.0, 27.0, 21.0, 34.0, 43.0, 69.0, 82.0, 94.0, 108.0, 91.0, 89.0, 71.0, 75.0, 38.0, 34.0, 20.0, 23.0, 11.0, 12.0, 13.0, 2.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003936290740966797, -0.0003808923065662384, -0.0003681555390357971, -0.00035541877150535583, -0.00034268200397491455, -0.00032994523644447327, -0.000317208468914032, -0.0003044717013835907, -0.0002917349338531494, -0.00027899816632270813, -0.00026626139879226685, -0.00025352463126182556, -0.00024078786373138428, -0.000228051096200943, -0.0002153143286705017, -0.00020257756114006042, -0.00018984079360961914, -0.00017710402607917786, -0.00016436725854873657, -0.0001516304910182953, -0.000138893723487854, -0.00012615695595741272, -0.00011342018842697144, -0.00010068342089653015, -8.794665336608887e-05, -7.520988583564758e-05, -6.24731183052063e-05, -4.9736350774765015e-05, -3.699958324432373e-05, -2.4262815713882446e-05, -1.1526048183441162e-05, 1.210719347000122e-06, 1.3947486877441406e-05, 2.668425440788269e-05, 3.9421021938323975e-05, 5.215778946876526e-05, 6.489455699920654e-05, 7.763132452964783e-05, 9.036809206008911e-05, 0.0001031048595905304, 0.00011584162712097168, 0.00012857839465141296, 0.00014131516218185425, 0.00015405192971229553, 0.00016678869724273682, 0.0001795254647731781, 0.00019226223230361938, 0.00020499899983406067, 0.00021773576736450195, 0.00023047253489494324, 0.00024320930242538452, 0.0002559460699558258, 0.0002686828374862671, 0.0002814196050167084, 0.00029415637254714966, 0.00030689314007759094, 0.0003196299076080322, 0.0003323666751384735, 0.0003451034426689148, 0.0003578402101993561, 0.00037057697772979736, 0.00038331374526023865, 0.00039605051279067993, 0.0004087872803211212, 0.0004215240478515625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 5.0, 5.0, 11.0, 14.0, 19.0, 31.0, 45.0, 72.0, 119.0, 171.0, 260.0, 485.0, 789.0, 1373.0, 2513.0, 4865.0, 9458.0, 19912.0, 44906.0, 105377.0, 223977.0, 295773.0, 186757.0, 82907.0, 35827.0, 15989.0, 7640.0, 4002.0, 2132.0, 1265.0, 716.0, 416.0, 258.0, 157.0, 91.0, 64.0, 51.0, 34.0, 30.0, 13.0, 13.0, 9.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.76171875, -5.5780029296875, -5.394287109375, -5.2105712890625, -5.02685546875, -4.8431396484375, -4.659423828125, -4.4757080078125, -4.2919921875, -4.1082763671875, -3.924560546875, -3.7408447265625, -3.55712890625, -3.3734130859375, -3.189697265625, -3.0059814453125, -2.822265625, -2.6385498046875, -2.454833984375, -2.2711181640625, -2.08740234375, -1.9036865234375, -1.719970703125, -1.5362548828125, -1.3525390625, -1.1688232421875, -0.985107421875, -0.8013916015625, -0.61767578125, -0.4339599609375, -0.250244140625, -0.0665283203125, 0.1171875, 0.3009033203125, 0.484619140625, 0.6683349609375, 0.85205078125, 1.0357666015625, 1.219482421875, 1.4031982421875, 1.5869140625, 1.7706298828125, 1.954345703125, 2.1380615234375, 2.32177734375, 2.5054931640625, 2.689208984375, 2.8729248046875, 3.056640625, 3.2403564453125, 3.424072265625, 3.6077880859375, 3.79150390625, 3.9752197265625, 4.158935546875, 4.3426513671875, 4.5263671875, 4.7100830078125, 4.893798828125, 5.0775146484375, 5.26123046875, 5.4449462890625, 5.628662109375, 5.8123779296875, 5.99609375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 6.0, 12.0, 8.0, 15.0, 20.0, 22.0, 22.0, 26.0, 38.0, 51.0, 51.0, 49.0, 33.0, 52.0, 63.0, 52.0, 44.0, 45.0, 50.0, 48.0, 39.0, 31.0, 38.0, 18.0, 32.0, 21.0, 18.0, 14.0, 14.0, 10.0, 11.0, 4.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0475006103515625, -1.010040283203125, -0.9725799560546875, -0.93511962890625, -0.8976593017578125, -0.860198974609375, -0.8227386474609375, -0.7852783203125, -0.7478179931640625, -0.710357666015625, -0.6728973388671875, -0.63543701171875, -0.5979766845703125, -0.560516357421875, -0.5230560302734375, -0.485595703125, -0.4481353759765625, -0.410675048828125, -0.3732147216796875, -0.33575439453125, -0.2982940673828125, -0.260833740234375, -0.2233734130859375, -0.1859130859375, -0.1484527587890625, -0.110992431640625, -0.0735321044921875, -0.03607177734375, 0.0013885498046875, 0.038848876953125, 0.0763092041015625, 0.11376953125, 0.1512298583984375, 0.188690185546875, 0.2261505126953125, 0.26361083984375, 0.3010711669921875, 0.338531494140625, 0.3759918212890625, 0.4134521484375, 0.4509124755859375, 0.488372802734375, 0.5258331298828125, 0.56329345703125, 0.6007537841796875, 0.638214111328125, 0.6756744384765625, 0.713134765625, 0.7505950927734375, 0.788055419921875, 0.8255157470703125, 0.86297607421875, 0.9004364013671875, 0.937896728515625, 0.9753570556640625, 1.0128173828125, 1.0502777099609375, 1.087738037109375, 1.1251983642578125, 1.16265869140625, 1.2001190185546875, 1.237579345703125, 1.2750396728515625, 1.3125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 7.0, 9.0, 12.0, 5.0, 20.0, 21.0, 25.0, 31.0, 35.0, 45.0, 51.0, 62.0, 81.0, 79.0, 90.0, 76.0, 67.0, 52.0, 47.0, 44.0, 21.0, 25.0, 18.0, 22.0, 11.0, 15.0, 9.0, 10.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.460037231445312, -25.76615333557129, -25.072269439697266, -24.37838363647461, -23.684499740600586, -22.990615844726562, -22.296730041503906, -21.602846145629883, -20.90896224975586, -20.215078353881836, -19.521194458007812, -18.827308654785156, -18.133424758911133, -17.43954086303711, -16.745655059814453, -16.05177116394043, -15.357887268066406, -14.664003372192383, -13.970118522644043, -13.276233673095703, -12.58234977722168, -11.888465881347656, -11.194581031799316, -10.500696182250977, -9.806812286376953, -9.11292839050293, -8.41904354095459, -7.725159168243408, -7.031274795532227, -6.337390422821045, -5.643506050109863, -4.949621677398682, -4.2557373046875, -3.5618529319763184, -2.8679685592651367, -2.174084186553955, -1.4801998138427734, -0.7863154411315918, -0.09243106842041016, 0.6014533042907715, 1.2953376770019531, 1.9892220497131348, 2.6831064224243164, 3.376990795135498, 4.07087516784668, 4.764759540557861, 5.458643913269043, 6.152528285980225, 6.846412658691406, 7.540297031402588, 8.23418140411377, 8.92806625366211, 9.621950149536133, 10.315834045410156, 11.009718894958496, 11.703603744506836, 12.39748764038086, 13.091371536254883, 13.785256385803223, 14.479141235351562, 15.173025131225586, 15.86690902709961, 16.560794830322266, 17.25467872619629, 17.948562622070312]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 16.0, 9.0, 20.0, 20.0, 11.0, 23.0, 16.0, 24.0, 29.0, 33.0, 38.0, 39.0, 29.0, 40.0, 41.0, 51.0, 40.0, 40.0, 43.0, 35.0, 32.0, 41.0, 39.0, 32.0, 27.0, 19.0, 21.0, 29.0, 26.0, 16.0, 17.0, 14.0, 13.0, 11.0, 12.0, 6.0, 3.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.408023834228516, -12.008654594421387, -11.609285354614258, -11.209916114807129, -10.810546875, -10.411177635192871, -10.011808395385742, -9.612439155578613, -9.213069915771484, -8.813700675964355, -8.414331436157227, -8.014962196350098, -7.615592956542969, -7.21622371673584, -6.816854476928711, -6.417485237121582, -6.018115997314453, -5.618746757507324, -5.219377517700195, -4.820008277893066, -4.4206390380859375, -4.021269798278809, -3.6219005584716797, -3.222531318664551, -2.823162078857422, -2.423792839050293, -2.024423599243164, -1.6250543594360352, -1.2256851196289062, -0.8263158798217773, -0.42694664001464844, -0.02757740020751953, 0.3717927932739258, 0.7711620330810547, 1.1705312728881836, 1.5699005126953125, 1.9692697525024414, 2.3686389923095703, 2.768008232116699, 3.167377471923828, 3.566746711730957, 3.966115951538086, 4.365485191345215, 4.764854431152344, 5.164223670959473, 5.563592910766602, 5.9629621505737305, 6.362331390380859, 6.761700630187988, 7.161069869995117, 7.560439109802246, 7.959808349609375, 8.359177589416504, 8.758546829223633, 9.157916069030762, 9.55728530883789, 9.95665454864502, 10.356023788452148, 10.755393028259277, 11.154762268066406, 11.554131507873535, 11.953500747680664, 12.352869987487793, 12.752239227294922, 13.15160846710205]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 11.0, 18.0, 23.0, 41.0, 52.0, 67.0, 124.0, 190.0, 269.0, 455.0, 689.0, 1051.0, 1638.0, 2480.0, 3908.0, 6227.0, 9860.0, 15924.0, 25303.0, 40843.0, 64446.0, 98445.0, 137632.0, 162482.0, 151210.0, 115400.0, 77591.0, 49462.0, 30747.0, 18970.0, 12093.0, 7626.0, 4660.0, 3075.0, 1977.0, 1221.0, 784.0, 574.0, 353.0, 215.0, 140.0, 102.0, 51.0, 39.0, 33.0, 17.0, 9.0, 8.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7578125, -14.2772216796875, -13.796630859375, -13.3160400390625, -12.83544921875, -12.3548583984375, -11.874267578125, -11.3936767578125, -10.9130859375, -10.4324951171875, -9.951904296875, -9.4713134765625, -8.99072265625, -8.5101318359375, -8.029541015625, -7.5489501953125, -7.068359375, -6.5877685546875, -6.107177734375, -5.6265869140625, -5.14599609375, -4.6654052734375, -4.184814453125, -3.7042236328125, -3.2236328125, -2.7430419921875, -2.262451171875, -1.7818603515625, -1.30126953125, -0.8206787109375, -0.340087890625, 0.1405029296875, 0.62109375, 1.1016845703125, 1.582275390625, 2.0628662109375, 2.54345703125, 3.0240478515625, 3.504638671875, 3.9852294921875, 4.4658203125, 4.9464111328125, 5.427001953125, 5.9075927734375, 6.38818359375, 6.8687744140625, 7.349365234375, 7.8299560546875, 8.310546875, 8.7911376953125, 9.271728515625, 9.7523193359375, 10.23291015625, 10.7135009765625, 11.194091796875, 11.6746826171875, 12.1552734375, 12.6358642578125, 13.116455078125, 13.5970458984375, 14.07763671875, 14.5582275390625, 15.038818359375, 15.5194091796875, 16.0]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 8.0, 16.0, 12.0, 9.0, 18.0, 19.0, 15.0, 25.0, 23.0, 27.0, 36.0, 36.0, 42.0, 33.0, 43.0, 38.0, 47.0, 50.0, 49.0, 37.0, 47.0, 49.0, 38.0, 32.0, 32.0, 24.0, 29.0, 22.0, 15.0, 23.0, 17.0, 20.0, 13.0, 8.0, 5.0, 6.0, 6.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.796875, -12.3651123046875, -11.933349609375, -11.5015869140625, -11.06982421875, -10.6380615234375, -10.206298828125, -9.7745361328125, -9.3427734375, -8.9110107421875, -8.479248046875, -8.0474853515625, -7.61572265625, -7.1839599609375, -6.752197265625, -6.3204345703125, -5.888671875, -5.4569091796875, -5.025146484375, -4.5933837890625, -4.16162109375, -3.7298583984375, -3.298095703125, -2.8663330078125, -2.4345703125, -2.0028076171875, -1.571044921875, -1.1392822265625, -0.70751953125, -0.2757568359375, 0.156005859375, 0.5877685546875, 1.01953125, 1.4512939453125, 1.883056640625, 2.3148193359375, 2.74658203125, 3.1783447265625, 3.610107421875, 4.0418701171875, 4.4736328125, 4.9053955078125, 5.337158203125, 5.7689208984375, 6.20068359375, 6.6324462890625, 7.064208984375, 7.4959716796875, 7.927734375, 8.3594970703125, 8.791259765625, 9.2230224609375, 9.65478515625, 10.0865478515625, 10.518310546875, 10.9500732421875, 11.3818359375, 11.8135986328125, 12.245361328125, 12.6771240234375, 13.10888671875, 13.5406494140625, 13.972412109375, 14.4041748046875, 14.8359375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 10.0, 30.0, 20.0, 35.0, 70.0, 117.0, 173.0, 237.0, 419.0, 674.0, 1095.0, 1861.0, 2930.0, 4911.0, 8127.0, 14233.0, 23805.0, 40531.0, 67755.0, 106475.0, 151632.0, 175907.0, 156613.0, 112700.0, 71548.0, 43756.0, 25606.0, 14986.0, 8875.0, 5266.0, 3215.0, 1925.0, 1112.0, 694.0, 430.0, 265.0, 177.0, 127.0, 64.0, 48.0, 25.0, 22.0, 13.0, 13.0, 8.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.3214111328125, -12.838134765625, -12.3548583984375, -11.87158203125, -11.3883056640625, -10.905029296875, -10.4217529296875, -9.9384765625, -9.4552001953125, -8.971923828125, -8.4886474609375, -8.00537109375, -7.5220947265625, -7.038818359375, -6.5555419921875, -6.072265625, -5.5889892578125, -5.105712890625, -4.6224365234375, -4.13916015625, -3.6558837890625, -3.172607421875, -2.6893310546875, -2.2060546875, -1.7227783203125, -1.239501953125, -0.7562255859375, -0.27294921875, 0.2103271484375, 0.693603515625, 1.1768798828125, 1.66015625, 2.1434326171875, 2.626708984375, 3.1099853515625, 3.59326171875, 4.0765380859375, 4.559814453125, 5.0430908203125, 5.5263671875, 6.0096435546875, 6.492919921875, 6.9761962890625, 7.45947265625, 7.9427490234375, 8.426025390625, 8.9093017578125, 9.392578125, 9.8758544921875, 10.359130859375, 10.8424072265625, 11.32568359375, 11.8089599609375, 12.292236328125, 12.7755126953125, 13.2587890625, 13.7420654296875, 14.225341796875, 14.7086181640625, 15.19189453125, 15.6751708984375, 16.158447265625, 16.6417236328125, 17.125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 10.0, 5.0, 6.0, 4.0, 9.0, 7.0, 15.0, 11.0, 17.0, 23.0, 13.0, 23.0, 26.0, 19.0, 38.0, 42.0, 37.0, 30.0, 42.0, 38.0, 52.0, 58.0, 47.0, 29.0, 41.0, 42.0, 31.0, 36.0, 35.0, 31.0, 31.0, 23.0, 14.0, 13.0, 13.0, 20.0, 13.0, 14.0, 9.0, 14.0, 4.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.4609375, -8.19677734375, -7.9326171875, -7.66845703125, -7.404296875, -7.14013671875, -6.8759765625, -6.61181640625, -6.34765625, -6.08349609375, -5.8193359375, -5.55517578125, -5.291015625, -5.02685546875, -4.7626953125, -4.49853515625, -4.234375, -3.97021484375, -3.7060546875, -3.44189453125, -3.177734375, -2.91357421875, -2.6494140625, -2.38525390625, -2.12109375, -1.85693359375, -1.5927734375, -1.32861328125, -1.064453125, -0.80029296875, -0.5361328125, -0.27197265625, -0.0078125, 0.25634765625, 0.5205078125, 0.78466796875, 1.048828125, 1.31298828125, 1.5771484375, 1.84130859375, 2.10546875, 2.36962890625, 2.6337890625, 2.89794921875, 3.162109375, 3.42626953125, 3.6904296875, 3.95458984375, 4.21875, 4.48291015625, 4.7470703125, 5.01123046875, 5.275390625, 5.53955078125, 5.8037109375, 6.06787109375, 6.33203125, 6.59619140625, 6.8603515625, 7.12451171875, 7.388671875, 7.65283203125, 7.9169921875, 8.18115234375, 8.4453125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 5.0, 10.0, 6.0, 16.0, 23.0, 33.0, 43.0, 57.0, 76.0, 160.0, 200.0, 294.0, 521.0, 725.0, 1205.0, 1775.0, 2723.0, 4381.0, 7053.0, 11272.0, 18948.0, 31850.0, 53823.0, 91066.0, 143956.0, 189116.0, 177215.0, 123474.0, 75784.0, 44759.0, 26392.0, 15725.0, 9532.0, 5851.0, 3655.0, 2405.0, 1468.0, 1010.0, 655.0, 411.0, 280.0, 187.0, 129.0, 87.0, 66.0, 37.0, 32.0, 23.0, 11.0, 14.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0], "bins": [-9.140625, -8.870361328125, -8.60009765625, -8.329833984375, -8.0595703125, -7.789306640625, -7.51904296875, -7.248779296875, -6.978515625, -6.708251953125, -6.43798828125, -6.167724609375, -5.8974609375, -5.627197265625, -5.35693359375, -5.086669921875, -4.81640625, -4.546142578125, -4.27587890625, -4.005615234375, -3.7353515625, -3.465087890625, -3.19482421875, -2.924560546875, -2.654296875, -2.384033203125, -2.11376953125, -1.843505859375, -1.5732421875, -1.302978515625, -1.03271484375, -0.762451171875, -0.4921875, -0.221923828125, 0.04833984375, 0.318603515625, 0.5888671875, 0.859130859375, 1.12939453125, 1.399658203125, 1.669921875, 1.940185546875, 2.21044921875, 2.480712890625, 2.7509765625, 3.021240234375, 3.29150390625, 3.561767578125, 3.83203125, 4.102294921875, 4.37255859375, 4.642822265625, 4.9130859375, 5.183349609375, 5.45361328125, 5.723876953125, 5.994140625, 6.264404296875, 6.53466796875, 6.804931640625, 7.0751953125, 7.345458984375, 7.61572265625, 7.885986328125, 8.15625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 4.0, 7.0, 15.0, 18.0, 18.0, 16.0, 28.0, 33.0, 43.0, 56.0, 76.0, 78.0, 88.0, 85.0, 84.0, 72.0, 60.0, 51.0, 51.0, 27.0, 23.0, 23.0, 12.0, 10.0, 4.0, 2.0, 4.0, 2.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010280609130859375, -0.000990539789199829, -0.0009530186653137207, -0.0009154975414276123, -0.0008779764175415039, -0.0008404552936553955, -0.0008029341697692871, -0.0007654130458831787, -0.0007278919219970703, -0.0006903707981109619, -0.0006528496742248535, -0.0006153285503387451, -0.0005778074264526367, -0.0005402863025665283, -0.0005027651786804199, -0.0004652440547943115, -0.0004277229309082031, -0.0003902018070220947, -0.00035268068313598633, -0.00031515955924987793, -0.00027763843536376953, -0.00024011731147766113, -0.00020259618759155273, -0.00016507506370544434, -0.00012755393981933594, -9.003281593322754e-05, -5.251169204711914e-05, -1.4990568161010742e-05, 2.2530555725097656e-05, 6.0051679611206055e-05, 9.757280349731445e-05, 0.00013509392738342285, 0.00017261505126953125, 0.00021013617515563965, 0.00024765729904174805, 0.00028517842292785645, 0.00032269954681396484, 0.00036022067070007324, 0.00039774179458618164, 0.00043526291847229004, 0.00047278404235839844, 0.0005103051662445068, 0.0005478262901306152, 0.0005853474140167236, 0.000622868537902832, 0.0006603896617889404, 0.0006979107856750488, 0.0007354319095611572, 0.0007729530334472656, 0.000810474157333374, 0.0008479952812194824, 0.0008855164051055908, 0.0009230375289916992, 0.0009605586528778076, 0.000998079776763916, 0.0010356009006500244, 0.0010731220245361328, 0.0011106431484222412, 0.0011481642723083496, 0.001185685396194458, 0.0012232065200805664, 0.0012607276439666748, 0.0012982487678527832, 0.0013357698917388916, 0.001373291015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 15.0, 21.0, 32.0, 39.0, 74.0, 89.0, 135.0, 221.0, 336.0, 437.0, 807.0, 1118.0, 1807.0, 2908.0, 4482.0, 7443.0, 12463.0, 21323.0, 36632.0, 62582.0, 104572.0, 158518.0, 190212.0, 165288.0, 112148.0, 67472.0, 39713.0, 22809.0, 13501.0, 8026.0, 4842.0, 2995.0, 1927.0, 1268.0, 736.0, 485.0, 362.0, 236.0, 160.0, 97.0, 78.0, 37.0, 34.0, 19.0, 19.0, 11.0, 4.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.07958984375, -8.7919921875, -8.50439453125, -8.216796875, -7.92919921875, -7.6416015625, -7.35400390625, -7.06640625, -6.77880859375, -6.4912109375, -6.20361328125, -5.916015625, -5.62841796875, -5.3408203125, -5.05322265625, -4.765625, -4.47802734375, -4.1904296875, -3.90283203125, -3.615234375, -3.32763671875, -3.0400390625, -2.75244140625, -2.46484375, -2.17724609375, -1.8896484375, -1.60205078125, -1.314453125, -1.02685546875, -0.7392578125, -0.45166015625, -0.1640625, 0.12353515625, 0.4111328125, 0.69873046875, 0.986328125, 1.27392578125, 1.5615234375, 1.84912109375, 2.13671875, 2.42431640625, 2.7119140625, 2.99951171875, 3.287109375, 3.57470703125, 3.8623046875, 4.14990234375, 4.4375, 4.72509765625, 5.0126953125, 5.30029296875, 5.587890625, 5.87548828125, 6.1630859375, 6.45068359375, 6.73828125, 7.02587890625, 7.3134765625, 7.60107421875, 7.888671875, 8.17626953125, 8.4638671875, 8.75146484375, 9.0390625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 4.0, 4.0, 12.0, 7.0, 9.0, 14.0, 15.0, 20.0, 36.0, 36.0, 27.0, 40.0, 39.0, 53.0, 45.0, 61.0, 63.0, 69.0, 54.0, 49.0, 68.0, 47.0, 51.0, 41.0, 25.0, 26.0, 15.0, 11.0, 18.0, 17.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-4.01953125, -3.89483642578125, -3.7701416015625, -3.64544677734375, -3.520751953125, -3.39605712890625, -3.2713623046875, -3.14666748046875, -3.02197265625, -2.89727783203125, -2.7725830078125, -2.64788818359375, -2.523193359375, -2.39849853515625, -2.2738037109375, -2.14910888671875, -2.0244140625, -1.89971923828125, -1.7750244140625, -1.65032958984375, -1.525634765625, -1.40093994140625, -1.2762451171875, -1.15155029296875, -1.02685546875, -0.90216064453125, -0.7774658203125, -0.65277099609375, -0.528076171875, -0.40338134765625, -0.2786865234375, -0.15399169921875, -0.029296875, 0.09539794921875, 0.2200927734375, 0.34478759765625, 0.469482421875, 0.59417724609375, 0.7188720703125, 0.84356689453125, 0.96826171875, 1.09295654296875, 1.2176513671875, 1.34234619140625, 1.467041015625, 1.59173583984375, 1.7164306640625, 1.84112548828125, 1.9658203125, 2.09051513671875, 2.2152099609375, 2.33990478515625, 2.464599609375, 2.58929443359375, 2.7139892578125, 2.83868408203125, 2.96337890625, 3.08807373046875, 3.2127685546875, 3.33746337890625, 3.462158203125, 3.58685302734375, 3.7115478515625, 3.83624267578125, 3.9609375]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 4.0, 8.0, 11.0, 13.0, 12.0, 25.0, 23.0, 28.0, 28.0, 45.0, 60.0, 66.0, 65.0, 74.0, 76.0, 85.0, 59.0, 65.0, 39.0, 51.0, 32.0, 22.0, 17.0, 18.0, 15.0, 8.0, 14.0, 11.0, 8.0, 0.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.177438735961914, -22.52055549621582, -21.863672256469727, -21.206790924072266, -20.549907684326172, -19.893024444580078, -19.236141204833984, -18.57925796508789, -17.922374725341797, -17.265491485595703, -16.60860824584961, -15.951725959777832, -15.294842720031738, -14.637960433959961, -13.981077194213867, -13.324193954467773, -12.667311668395996, -12.010428428649902, -11.353546142578125, -10.696662902832031, -10.039779663085938, -9.382896423339844, -8.726014137268066, -8.069130897521973, -7.412248134613037, -6.755365371704102, -6.098482131958008, -5.441599369049072, -4.784716606140137, -4.127833366394043, -3.4709506034851074, -2.8140673637390137, -2.157184600830078, -1.5003015995025635, -0.8434187173843384, -0.18653583526611328, 0.47034716606140137, 1.127230167388916, 1.7841129302978516, 2.4409961700439453, 3.097878932952881, 3.7547619342803955, 4.41164493560791, 5.068527698516846, 5.725410461425781, 6.382293701171875, 7.0391764640808105, 7.696059703826904, 8.35294246673584, 9.009825706481934, 9.666707992553711, 10.323591232299805, 10.980474472045898, 11.637357711791992, 12.29423999786377, 12.951123237609863, 13.60800552368164, 14.264888763427734, 14.921771049499512, 15.578654289245605, 16.235536575317383, 16.892419815063477, 17.54930305480957, 18.206186294555664, 18.863069534301758]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 7.0, 14.0, 11.0, 11.0, 15.0, 14.0, 14.0, 11.0, 19.0, 23.0, 22.0, 43.0, 33.0, 41.0, 38.0, 38.0, 37.0, 41.0, 40.0, 42.0, 39.0, 35.0, 33.0, 38.0, 44.0, 29.0, 37.0, 39.0, 25.0, 18.0, 26.0, 19.0, 17.0, 11.0, 10.0, 12.0, 8.0, 12.0, 5.0, 4.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.626763343811035, -11.233745574951172, -10.840727806091309, -10.447710037231445, -10.054691314697266, -9.661673545837402, -9.268655776977539, -8.875638008117676, -8.482620239257812, -8.08960247039795, -7.696584701538086, -7.3035664558410645, -6.910548686981201, -6.517530918121338, -6.124512672424316, -5.731494903564453, -5.33847713470459, -4.945459365844727, -4.552441596984863, -4.159423351287842, -3.7664055824279785, -3.3733878135681152, -2.980369806289673, -2.5873517990112305, -2.194334030151367, -1.8013161420822144, -1.4082982540130615, -1.0152803659439087, -0.6222624778747559, -0.22924458980560303, 0.1637732982635498, 0.5567913055419922, 0.9498081207275391, 1.342826008796692, 1.7358438968658447, 2.128861904144287, 2.5218796730041504, 2.9148974418640137, 3.307915449142456, 3.7009334564208984, 4.093951225280762, 4.486968994140625, 4.879986763000488, 5.27300500869751, 5.666022777557373, 6.059040546417236, 6.452058792114258, 6.845076560974121, 7.238094329833984, 7.631112098693848, 8.024129867553711, 8.417147636413574, 8.810165405273438, 9.203184127807617, 9.59620189666748, 9.989219665527344, 10.382237434387207, 10.77525520324707, 11.168272972106934, 11.561290740966797, 11.954309463500977, 12.34732723236084, 12.740345001220703, 13.133362770080566, 13.52638053894043]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 10.0, 13.0, 15.0, 32.0, 38.0, 67.0, 78.0, 104.0, 159.0, 236.0, 344.0, 477.0, 718.0, 1095.0, 1613.0, 2428.0, 3619.0, 6020.0, 9777.0, 15722.0, 27352.0, 48729.0, 94502.0, 203960.0, 484002.0, 1011179.0, 1145831.0, 620035.0, 260060.0, 116265.0, 58559.0, 31850.0, 18314.0, 10887.0, 7082.0, 4294.0, 2892.0, 1833.0, 1235.0, 799.0, 594.0, 410.0, 299.0, 231.0, 139.0, 105.0, 75.0, 52.0, 36.0, 28.0, 27.0, 23.0, 11.0, 11.0, 9.0, 6.0, 6.0, 0.0, 4.0], "bins": [-16.296875, -15.773681640625, -15.25048828125, -14.727294921875, -14.2041015625, -13.680908203125, -13.15771484375, -12.634521484375, -12.111328125, -11.588134765625, -11.06494140625, -10.541748046875, -10.0185546875, -9.495361328125, -8.97216796875, -8.448974609375, -7.92578125, -7.402587890625, -6.87939453125, -6.356201171875, -5.8330078125, -5.309814453125, -4.78662109375, -4.263427734375, -3.740234375, -3.217041015625, -2.69384765625, -2.170654296875, -1.6474609375, -1.124267578125, -0.60107421875, -0.077880859375, 0.4453125, 0.968505859375, 1.49169921875, 2.014892578125, 2.5380859375, 3.061279296875, 3.58447265625, 4.107666015625, 4.630859375, 5.154052734375, 5.67724609375, 6.200439453125, 6.7236328125, 7.246826171875, 7.77001953125, 8.293212890625, 8.81640625, 9.339599609375, 9.86279296875, 10.385986328125, 10.9091796875, 11.432373046875, 11.95556640625, 12.478759765625, 13.001953125, 13.525146484375, 14.04833984375, 14.571533203125, 15.0947265625, 15.617919921875, 16.14111328125, 16.664306640625, 17.1875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 11.0, 8.0, 11.0, 10.0, 19.0, 10.0, 15.0, 16.0, 20.0, 32.0, 30.0, 38.0, 45.0, 33.0, 45.0, 31.0, 46.0, 48.0, 40.0, 44.0, 36.0, 36.0, 38.0, 42.0, 35.0, 40.0, 29.0, 22.0, 23.0, 13.0, 27.0, 20.0, 14.0, 9.0, 12.0, 12.0, 8.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.265625, -7.9888916015625, -7.712158203125, -7.4354248046875, -7.15869140625, -6.8819580078125, -6.605224609375, -6.3284912109375, -6.0517578125, -5.7750244140625, -5.498291015625, -5.2215576171875, -4.94482421875, -4.6680908203125, -4.391357421875, -4.1146240234375, -3.837890625, -3.5611572265625, -3.284423828125, -3.0076904296875, -2.73095703125, -2.4542236328125, -2.177490234375, -1.9007568359375, -1.6240234375, -1.3472900390625, -1.070556640625, -0.7938232421875, -0.51708984375, -0.2403564453125, 0.036376953125, 0.3131103515625, 0.58984375, 0.8665771484375, 1.143310546875, 1.4200439453125, 1.69677734375, 1.9735107421875, 2.250244140625, 2.5269775390625, 2.8037109375, 3.0804443359375, 3.357177734375, 3.6339111328125, 3.91064453125, 4.1873779296875, 4.464111328125, 4.7408447265625, 5.017578125, 5.2943115234375, 5.571044921875, 5.8477783203125, 6.12451171875, 6.4012451171875, 6.677978515625, 6.9547119140625, 7.2314453125, 7.5081787109375, 7.784912109375, 8.0616455078125, 8.33837890625, 8.6151123046875, 8.891845703125, 9.1685791015625, 9.4453125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 8.0, 12.0, 18.0, 36.0, 46.0, 66.0, 103.0, 168.0, 227.0, 384.0, 600.0, 980.0, 1558.0, 2540.0, 4250.0, 7326.0, 12946.0, 24027.0, 46681.0, 97005.0, 213969.0, 506140.0, 1087981.0, 1161542.0, 568179.0, 240219.0, 106023.0, 51121.0, 26216.0, 14023.0, 7990.0, 4672.0, 2757.0, 1730.0, 1052.0, 639.0, 376.0, 225.0, 141.0, 115.0, 64.0, 37.0, 25.0, 16.0, 14.0, 12.0, 8.0, 2.0, 7.0, 3.0, 1.0, 0.0, 1.0], "bins": [-20.734375, -20.125732421875, -19.51708984375, -18.908447265625, -18.2998046875, -17.691162109375, -17.08251953125, -16.473876953125, -15.865234375, -15.256591796875, -14.64794921875, -14.039306640625, -13.4306640625, -12.822021484375, -12.21337890625, -11.604736328125, -10.99609375, -10.387451171875, -9.77880859375, -9.170166015625, -8.5615234375, -7.952880859375, -7.34423828125, -6.735595703125, -6.126953125, -5.518310546875, -4.90966796875, -4.301025390625, -3.6923828125, -3.083740234375, -2.47509765625, -1.866455078125, -1.2578125, -0.649169921875, -0.04052734375, 0.568115234375, 1.1767578125, 1.785400390625, 2.39404296875, 3.002685546875, 3.611328125, 4.219970703125, 4.82861328125, 5.437255859375, 6.0458984375, 6.654541015625, 7.26318359375, 7.871826171875, 8.48046875, 9.089111328125, 9.69775390625, 10.306396484375, 10.9150390625, 11.523681640625, 12.13232421875, 12.740966796875, 13.349609375, 13.958251953125, 14.56689453125, 15.175537109375, 15.7841796875, 16.392822265625, 17.00146484375, 17.610107421875, 18.21875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 13.0, 9.0, 23.0, 19.0, 29.0, 50.0, 57.0, 69.0, 112.0, 135.0, 168.0, 192.0, 265.0, 285.0, 391.0, 385.0, 375.0, 304.0, 256.0, 206.0, 168.0, 163.0, 97.0, 70.0, 54.0, 40.0, 17.0, 38.0, 16.0, 10.0, 16.0, 8.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.37139892578125, -5.1685791015625, -4.96575927734375, -4.762939453125, -4.56011962890625, -4.3572998046875, -4.15447998046875, -3.95166015625, -3.74884033203125, -3.5460205078125, -3.34320068359375, -3.140380859375, -2.93756103515625, -2.7347412109375, -2.53192138671875, -2.3291015625, -2.12628173828125, -1.9234619140625, -1.72064208984375, -1.517822265625, -1.31500244140625, -1.1121826171875, -0.90936279296875, -0.70654296875, -0.50372314453125, -0.3009033203125, -0.09808349609375, 0.104736328125, 0.30755615234375, 0.5103759765625, 0.71319580078125, 0.916015625, 1.11883544921875, 1.3216552734375, 1.52447509765625, 1.727294921875, 1.93011474609375, 2.1329345703125, 2.33575439453125, 2.53857421875, 2.74139404296875, 2.9442138671875, 3.14703369140625, 3.349853515625, 3.55267333984375, 3.7554931640625, 3.95831298828125, 4.1611328125, 4.36395263671875, 4.5667724609375, 4.76959228515625, 4.972412109375, 5.17523193359375, 5.3780517578125, 5.58087158203125, 5.78369140625, 5.98651123046875, 6.1893310546875, 6.39215087890625, 6.594970703125, 6.79779052734375, 7.0006103515625, 7.20343017578125, 7.40625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 11.0, 13.0, 22.0, 30.0, 23.0, 37.0, 40.0, 48.0, 73.0, 91.0, 89.0, 89.0, 89.0, 59.0, 61.0, 47.0, 42.0, 27.0, 15.0, 15.0, 14.0, 12.0, 9.0, 7.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.39463233947754, -26.70754051208496, -26.020448684692383, -25.333356857299805, -24.646265029907227, -23.95917320251465, -23.27208137512207, -22.584989547729492, -21.897897720336914, -21.210805892944336, -20.523714065551758, -19.83662223815918, -19.1495304107666, -18.462438583374023, -17.775346755981445, -17.088254928588867, -16.401165008544922, -15.714073181152344, -15.026981353759766, -14.339889526367188, -13.65279769897461, -12.965705871582031, -12.278614044189453, -11.591522216796875, -10.904430389404297, -10.217338562011719, -9.53024673461914, -8.843154907226562, -8.156063079833984, -7.468971252441406, -6.781879901885986, -6.094788074493408, -5.407695770263672, -4.720603942871094, -4.033512115478516, -3.3464205265045166, -2.6593286991119385, -1.9722368717193604, -1.2851452827453613, -0.5980534553527832, 0.08903837203979492, 0.7761301398277283, 1.4632219076156616, 2.15031361579895, 2.8374054431915283, 3.5244972705841064, 4.2115888595581055, 4.898680686950684, 5.585772514343262, 6.27286434173584, 6.959956169128418, 7.647047996520996, 8.334139823913574, 9.021231651306152, 9.708322525024414, 10.395414352416992, 11.08250617980957, 11.769598007202148, 12.456689834594727, 13.143781661987305, 13.830873489379883, 14.517965316772461, 15.205057144165039, 15.892148971557617, 16.579240798950195]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 9.0, 8.0, 12.0, 14.0, 8.0, 13.0, 12.0, 18.0, 21.0, 24.0, 33.0, 52.0, 44.0, 36.0, 44.0, 34.0, 41.0, 68.0, 48.0, 51.0, 41.0, 54.0, 55.0, 33.0, 36.0, 39.0, 21.0, 14.0, 26.0, 23.0, 8.0, 17.0, 13.0, 9.0, 7.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.019588470458984, -14.589088439941406, -14.158588409423828, -13.72808837890625, -13.297589302062988, -12.86708927154541, -12.436589241027832, -12.006089210510254, -11.575590133666992, -11.145090103149414, -10.714590072631836, -10.284090042114258, -9.853590965270996, -9.423090934753418, -8.99259090423584, -8.562090873718262, -8.131590843200684, -7.7010908126831055, -7.2705912590026855, -6.840091228485107, -6.4095916748046875, -5.979091644287109, -5.548591613769531, -5.118091583251953, -4.687592029571533, -4.257091999053955, -3.826592445373535, -3.396092414855957, -2.965592622756958, -2.535092830657959, -2.104592800140381, -1.6740930080413818, -1.2435941696166992, -0.8130943179130554, -0.3825944662094116, 0.04790544509887695, 0.478405237197876, 0.908905029296875, 1.3394050598144531, 1.7699048519134521, 2.200404644012451, 2.63090443611145, 3.061404228210449, 3.4919042587280273, 3.9224040508270264, 4.352903842926025, 4.7834038734436035, 5.213903427124023, 5.644403457641602, 6.07490348815918, 6.5054030418396, 6.935903072357178, 7.366402626037598, 7.796902656555176, 8.227402687072754, 8.657902717590332, 9.088401794433594, 9.518901824951172, 9.94940185546875, 10.379901885986328, 10.81040096282959, 11.240900993347168, 11.671401023864746, 12.101901054382324, 12.532401084899902]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 9.0, 11.0, 18.0, 24.0, 33.0, 46.0, 91.0, 112.0, 184.0, 279.0, 520.0, 833.0, 1400.0, 2313.0, 3849.0, 6718.0, 11599.0, 20910.0, 38046.0, 69745.0, 125040.0, 199411.0, 218239.0, 153313.0, 87348.0, 47860.0, 26132.0, 14446.0, 8212.0, 4768.0, 2803.0, 1660.0, 959.0, 604.0, 392.0, 224.0, 158.0, 95.0, 57.0, 33.0, 22.0, 10.0, 13.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.90625, -9.63250732421875, -9.3587646484375, -9.08502197265625, -8.811279296875, -8.53753662109375, -8.2637939453125, -7.99005126953125, -7.71630859375, -7.44256591796875, -7.1688232421875, -6.89508056640625, -6.621337890625, -6.34759521484375, -6.0738525390625, -5.80010986328125, -5.5263671875, -5.25262451171875, -4.9788818359375, -4.70513916015625, -4.431396484375, -4.15765380859375, -3.8839111328125, -3.61016845703125, -3.33642578125, -3.06268310546875, -2.7889404296875, -2.51519775390625, -2.241455078125, -1.96771240234375, -1.6939697265625, -1.42022705078125, -1.146484375, -0.87274169921875, -0.5989990234375, -0.32525634765625, -0.051513671875, 0.22222900390625, 0.4959716796875, 0.76971435546875, 1.04345703125, 1.31719970703125, 1.5909423828125, 1.86468505859375, 2.138427734375, 2.41217041015625, 2.6859130859375, 2.95965576171875, 3.2333984375, 3.50714111328125, 3.7808837890625, 4.05462646484375, 4.328369140625, 4.60211181640625, 4.8758544921875, 5.14959716796875, 5.42333984375, 5.69708251953125, 5.9708251953125, 6.24456787109375, 6.518310546875, 6.79205322265625, 7.0657958984375, 7.33953857421875, 7.61328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 5.0, 1.0, 9.0, 8.0, 13.0, 10.0, 12.0, 12.0, 17.0, 22.0, 17.0, 24.0, 27.0, 35.0, 40.0, 37.0, 36.0, 42.0, 46.0, 47.0, 43.0, 52.0, 57.0, 36.0, 44.0, 38.0, 37.0, 40.0, 35.0, 22.0, 25.0, 25.0, 18.0, 10.0, 17.0, 7.0, 11.0, 7.0, 5.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.5582275390625, -11.124267578125, -10.6903076171875, -10.25634765625, -9.8223876953125, -9.388427734375, -8.9544677734375, -8.5205078125, -8.0865478515625, -7.652587890625, -7.2186279296875, -6.78466796875, -6.3507080078125, -5.916748046875, -5.4827880859375, -5.048828125, -4.6148681640625, -4.180908203125, -3.7469482421875, -3.31298828125, -2.8790283203125, -2.445068359375, -2.0111083984375, -1.5771484375, -1.1431884765625, -0.709228515625, -0.2752685546875, 0.15869140625, 0.5926513671875, 1.026611328125, 1.4605712890625, 1.89453125, 2.3284912109375, 2.762451171875, 3.1964111328125, 3.63037109375, 4.0643310546875, 4.498291015625, 4.9322509765625, 5.3662109375, 5.8001708984375, 6.234130859375, 6.6680908203125, 7.10205078125, 7.5360107421875, 7.969970703125, 8.4039306640625, 8.837890625, 9.2718505859375, 9.705810546875, 10.1397705078125, 10.57373046875, 11.0076904296875, 11.441650390625, 11.8756103515625, 12.3095703125, 12.7435302734375, 13.177490234375, 13.6114501953125, 14.04541015625, 14.4793701171875, 14.913330078125, 15.3472900390625, 15.78125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 10.0, 17.0, 21.0, 25.0, 29.0, 62.0, 76.0, 106.0, 175.0, 211.0, 321.0, 482.0, 742.0, 1073.0, 1905.0, 3377.0, 5842.0, 10586.0, 21308.0, 45321.0, 103494.0, 225616.0, 303445.0, 175850.0, 76763.0, 34464.0, 16505.0, 8638.0, 4729.0, 2785.0, 1711.0, 998.0, 590.0, 388.0, 290.0, 185.0, 123.0, 82.0, 62.0, 40.0, 28.0, 25.0, 13.0, 9.0, 12.0, 3.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.53125, -12.1312255859375, -11.731201171875, -11.3311767578125, -10.93115234375, -10.5311279296875, -10.131103515625, -9.7310791015625, -9.3310546875, -8.9310302734375, -8.531005859375, -8.1309814453125, -7.73095703125, -7.3309326171875, -6.930908203125, -6.5308837890625, -6.130859375, -5.7308349609375, -5.330810546875, -4.9307861328125, -4.53076171875, -4.1307373046875, -3.730712890625, -3.3306884765625, -2.9306640625, -2.5306396484375, -2.130615234375, -1.7305908203125, -1.33056640625, -0.9305419921875, -0.530517578125, -0.1304931640625, 0.26953125, 0.6695556640625, 1.069580078125, 1.4696044921875, 1.86962890625, 2.2696533203125, 2.669677734375, 3.0697021484375, 3.4697265625, 3.8697509765625, 4.269775390625, 4.6697998046875, 5.06982421875, 5.4698486328125, 5.869873046875, 6.2698974609375, 6.669921875, 7.0699462890625, 7.469970703125, 7.8699951171875, 8.27001953125, 8.6700439453125, 9.070068359375, 9.4700927734375, 9.8701171875, 10.2701416015625, 10.670166015625, 11.0701904296875, 11.47021484375, 11.8702392578125, 12.270263671875, 12.6702880859375, 13.0703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 7.0, 7.0, 7.0, 7.0, 8.0, 8.0, 16.0, 20.0, 21.0, 21.0, 23.0, 25.0, 28.0, 34.0, 24.0, 37.0, 46.0, 45.0, 39.0, 46.0, 45.0, 33.0, 41.0, 37.0, 32.0, 33.0, 38.0, 31.0, 29.0, 30.0, 38.0, 22.0, 23.0, 19.0, 12.0, 11.0, 8.0, 12.0, 7.0, 7.0, 3.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.67578125, -6.45330810546875, -6.2308349609375, -6.00836181640625, -5.785888671875, -5.56341552734375, -5.3409423828125, -5.11846923828125, -4.89599609375, -4.67352294921875, -4.4510498046875, -4.22857666015625, -4.006103515625, -3.78363037109375, -3.5611572265625, -3.33868408203125, -3.1162109375, -2.89373779296875, -2.6712646484375, -2.44879150390625, -2.226318359375, -2.00384521484375, -1.7813720703125, -1.55889892578125, -1.33642578125, -1.11395263671875, -0.8914794921875, -0.66900634765625, -0.446533203125, -0.22406005859375, -0.0015869140625, 0.22088623046875, 0.443359375, 0.66583251953125, 0.8883056640625, 1.11077880859375, 1.333251953125, 1.55572509765625, 1.7781982421875, 2.00067138671875, 2.22314453125, 2.44561767578125, 2.6680908203125, 2.89056396484375, 3.113037109375, 3.33551025390625, 3.5579833984375, 3.78045654296875, 4.0029296875, 4.22540283203125, 4.4478759765625, 4.67034912109375, 4.892822265625, 5.11529541015625, 5.3377685546875, 5.56024169921875, 5.78271484375, 6.00518798828125, 6.2276611328125, 6.45013427734375, 6.672607421875, 6.89508056640625, 7.1175537109375, 7.34002685546875, 7.5625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 19.0, 15.0, 32.0, 45.0, 49.0, 75.0, 120.0, 170.0, 219.0, 373.0, 617.0, 1000.0, 1904.0, 3539.0, 8567.0, 22213.0, 69292.0, 246418.0, 448925.0, 166677.0, 48547.0, 16441.0, 6357.0, 2880.0, 1541.0, 893.0, 554.0, 321.0, 226.0, 153.0, 96.0, 66.0, 67.0, 24.0, 31.0, 16.0, 12.0, 9.0, 9.0, 5.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-6.3828125, -6.19140625, -6.0, -5.80859375, -5.6171875, -5.42578125, -5.234375, -5.04296875, -4.8515625, -4.66015625, -4.46875, -4.27734375, -4.0859375, -3.89453125, -3.703125, -3.51171875, -3.3203125, -3.12890625, -2.9375, -2.74609375, -2.5546875, -2.36328125, -2.171875, -1.98046875, -1.7890625, -1.59765625, -1.40625, -1.21484375, -1.0234375, -0.83203125, -0.640625, -0.44921875, -0.2578125, -0.06640625, 0.125, 0.31640625, 0.5078125, 0.69921875, 0.890625, 1.08203125, 1.2734375, 1.46484375, 1.65625, 1.84765625, 2.0390625, 2.23046875, 2.421875, 2.61328125, 2.8046875, 2.99609375, 3.1875, 3.37890625, 3.5703125, 3.76171875, 3.953125, 4.14453125, 4.3359375, 4.52734375, 4.71875, 4.91015625, 5.1015625, 5.29296875, 5.484375, 5.67578125, 5.8671875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 4.0, 6.0, 13.0, 12.0, 16.0, 31.0, 45.0, 72.0, 102.0, 126.0, 107.0, 138.0, 85.0, 78.0, 45.0, 51.0, 24.0, 16.0, 12.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004858970642089844, -0.0004732981324195862, -0.000460699200630188, -0.0004481002688407898, -0.0004355013370513916, -0.0004229024052619934, -0.0004103034734725952, -0.000397704541683197, -0.00038510560989379883, -0.00037250667810440063, -0.00035990774631500244, -0.00034730881452560425, -0.00033470988273620605, -0.00032211095094680786, -0.00030951201915740967, -0.0002969130873680115, -0.0002843141555786133, -0.0002717152237892151, -0.0002591162919998169, -0.0002465173602104187, -0.0002339184284210205, -0.00022131949663162231, -0.00020872056484222412, -0.00019612163305282593, -0.00018352270126342773, -0.00017092376947402954, -0.00015832483768463135, -0.00014572590589523315, -0.00013312697410583496, -0.00012052804231643677, -0.00010792911052703857, -9.533017873764038e-05, -8.273124694824219e-05, -7.0132315158844e-05, -5.75333833694458e-05, -4.493445158004761e-05, -3.2335519790649414e-05, -1.973658800125122e-05, -7.137656211853027e-06, 5.461275577545166e-06, 1.806020736694336e-05, 3.065913915634155e-05, 4.3258070945739746e-05, 5.585700273513794e-05, 6.845593452453613e-05, 8.105486631393433e-05, 9.365379810333252e-05, 0.00010625272989273071, 0.0001188516616821289, 0.0001314505934715271, 0.0001440495252609253, 0.00015664845705032349, 0.00016924738883972168, 0.00018184632062911987, 0.00019444525241851807, 0.00020704418420791626, 0.00021964311599731445, 0.00023224204778671265, 0.00024484097957611084, 0.00025743991136550903, 0.0002700388431549072, 0.0002826377749443054, 0.0002952367067337036, 0.0003078356385231018, 0.0003204345703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 12.0, 13.0, 21.0, 24.0, 31.0, 42.0, 61.0, 95.0, 117.0, 203.0, 286.0, 461.0, 790.0, 1625.0, 3693.0, 9966.0, 32080.0, 116019.0, 353109.0, 359816.0, 119348.0, 32871.0, 10228.0, 3797.0, 1633.0, 853.0, 449.0, 310.0, 181.0, 114.0, 80.0, 59.0, 58.0, 32.0, 19.0, 20.0, 13.0, 8.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.6953125, -6.49249267578125, -6.2896728515625, -6.08685302734375, -5.884033203125, -5.68121337890625, -5.4783935546875, -5.27557373046875, -5.07275390625, -4.86993408203125, -4.6671142578125, -4.46429443359375, -4.261474609375, -4.05865478515625, -3.8558349609375, -3.65301513671875, -3.4501953125, -3.24737548828125, -3.0445556640625, -2.84173583984375, -2.638916015625, -2.43609619140625, -2.2332763671875, -2.03045654296875, -1.82763671875, -1.62481689453125, -1.4219970703125, -1.21917724609375, -1.016357421875, -0.81353759765625, -0.6107177734375, -0.40789794921875, -0.205078125, -0.00225830078125, 0.2005615234375, 0.40338134765625, 0.606201171875, 0.80902099609375, 1.0118408203125, 1.21466064453125, 1.41748046875, 1.62030029296875, 1.8231201171875, 2.02593994140625, 2.228759765625, 2.43157958984375, 2.6343994140625, 2.83721923828125, 3.0400390625, 3.24285888671875, 3.4456787109375, 3.64849853515625, 3.851318359375, 4.05413818359375, 4.2569580078125, 4.45977783203125, 4.66259765625, 4.86541748046875, 5.0682373046875, 5.27105712890625, 5.473876953125, 5.67669677734375, 5.8795166015625, 6.08233642578125, 6.28515625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 9.0, 20.0, 22.0, 43.0, 63.0, 115.0, 131.0, 135.0, 118.0, 114.0, 74.0, 44.0, 40.0, 28.0, 16.0, 3.0, 8.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.28955078125, -2.2197265625, -2.14990234375, -2.080078125, -2.01025390625, -1.9404296875, -1.87060546875, -1.80078125, -1.73095703125, -1.6611328125, -1.59130859375, -1.521484375, -1.45166015625, -1.3818359375, -1.31201171875, -1.2421875, -1.17236328125, -1.1025390625, -1.03271484375, -0.962890625, -0.89306640625, -0.8232421875, -0.75341796875, -0.68359375, -0.61376953125, -0.5439453125, -0.47412109375, -0.404296875, -0.33447265625, -0.2646484375, -0.19482421875, -0.125, -0.05517578125, 0.0146484375, 0.08447265625, 0.154296875, 0.22412109375, 0.2939453125, 0.36376953125, 0.43359375, 0.50341796875, 0.5732421875, 0.64306640625, 0.712890625, 0.78271484375, 0.8525390625, 0.92236328125, 0.9921875, 1.06201171875, 1.1318359375, 1.20166015625, 1.271484375, 1.34130859375, 1.4111328125, 1.48095703125, 1.55078125, 1.62060546875, 1.6904296875, 1.76025390625, 1.830078125, 1.89990234375, 1.9697265625, 2.03955078125, 2.109375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 8.0, 4.0, 14.0, 21.0, 23.0, 21.0, 35.0, 42.0, 52.0, 56.0, 76.0, 108.0, 93.0, 88.0, 73.0, 62.0, 57.0, 40.0, 29.0, 16.0, 17.0, 14.0, 7.0, 9.0, 11.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-29.336435317993164, -28.623172760009766, -27.909908294677734, -27.196643829345703, -26.483381271362305, -25.770118713378906, -25.056854248046875, -24.343589782714844, -23.630327224731445, -22.917064666748047, -22.203800201416016, -21.490535736083984, -20.777273178100586, -20.064010620117188, -19.350746154785156, -18.637481689453125, -17.924219131469727, -17.210956573486328, -16.497692108154297, -15.784428596496582, -15.071165084838867, -14.357901573181152, -13.644638061523438, -12.931374549865723, -12.218111038208008, -11.504847526550293, -10.791584014892578, -10.078320503234863, -9.365056991577148, -8.651793479919434, -7.938529968261719, -7.225266456604004, -6.512004852294922, -5.798741340637207, -5.085477828979492, -4.372214317321777, -3.6589508056640625, -2.9456872940063477, -2.232423782348633, -1.519160270690918, -0.8058967590332031, -0.09263324737548828, 0.6206302642822266, 1.3338937759399414, 2.0471572875976562, 2.760420799255371, 3.473684310913086, 4.186947822570801, 4.900211334228516, 5.6134748458862305, 6.326738357543945, 7.04000186920166, 7.753265380859375, 8.46652889251709, 9.179792404174805, 9.89305591583252, 10.606319427490234, 11.31958293914795, 12.032846450805664, 12.746109962463379, 13.459373474121094, 14.172636985778809, 14.885900497436523, 15.599164009094238, 16.312427520751953]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 7.0, 13.0, 10.0, 13.0, 13.0, 13.0, 17.0, 23.0, 22.0, 32.0, 43.0, 47.0, 48.0, 34.0, 37.0, 42.0, 57.0, 58.0, 48.0, 53.0, 42.0, 57.0, 37.0, 34.0, 34.0, 23.0, 25.0, 20.0, 19.0, 14.0, 17.0, 12.0, 9.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.124489784240723, -14.69525146484375, -14.266013145446777, -13.836774826049805, -13.407536506652832, -12.97829818725586, -12.54905891418457, -12.119821548461914, -11.690582275390625, -11.261343955993652, -10.83210563659668, -10.402867317199707, -9.973628997802734, -9.544390678405762, -9.115152359008789, -8.6859130859375, -8.256675720214844, -7.827437400817871, -7.398199081420898, -6.968960762023926, -6.539722442626953, -6.1104841232299805, -5.68124532699585, -5.252007007598877, -4.822768688201904, -4.393530368804932, -3.964292049407959, -3.5350534915924072, -3.1058151721954346, -2.676576852798462, -2.24733829498291, -1.8180999755859375, -1.3888616561889648, -0.9596232771873474, -0.53038489818573, -0.10114645957946777, 0.3280918598175049, 0.7573301792144775, 1.1865687370300293, 1.615807056427002, 2.0450453758239746, 2.4742836952209473, 2.90352201461792, 3.3327605724334717, 3.7619988918304443, 4.191237449645996, 4.620475769042969, 5.049714088439941, 5.478952407836914, 5.908190727233887, 6.337429046630859, 6.766667366027832, 7.195905685424805, 7.625144004821777, 8.05438232421875, 8.483621597290039, 8.912858963012695, 9.342097282409668, 9.77133560180664, 10.200573921203613, 10.629812240600586, 11.059050559997559, 11.488288879394531, 11.91752815246582, 12.346766471862793]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 17.0, 10.0, 36.0, 43.0, 85.0, 132.0, 298.0, 529.0, 1127.0, 2188.0, 4562.0, 10088.0, 22317.0, 52380.0, 120587.0, 236622.0, 281719.0, 174394.0, 79168.0, 34355.0, 14796.0, 6734.0, 3210.0, 1529.0, 750.0, 408.0, 211.0, 109.0, 71.0, 24.0, 18.0, 15.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.578125, -23.8388671875, -23.099609375, -22.3603515625, -21.62109375, -20.8818359375, -20.142578125, -19.4033203125, -18.6640625, -17.9248046875, -17.185546875, -16.4462890625, -15.70703125, -14.9677734375, -14.228515625, -13.4892578125, -12.75, -12.0107421875, -11.271484375, -10.5322265625, -9.79296875, -9.0537109375, -8.314453125, -7.5751953125, -6.8359375, -6.0966796875, -5.357421875, -4.6181640625, -3.87890625, -3.1396484375, -2.400390625, -1.6611328125, -0.921875, -0.1826171875, 0.556640625, 1.2958984375, 2.03515625, 2.7744140625, 3.513671875, 4.2529296875, 4.9921875, 5.7314453125, 6.470703125, 7.2099609375, 7.94921875, 8.6884765625, 9.427734375, 10.1669921875, 10.90625, 11.6455078125, 12.384765625, 13.1240234375, 13.86328125, 14.6025390625, 15.341796875, 16.0810546875, 16.8203125, 17.5595703125, 18.298828125, 19.0380859375, 19.77734375, 20.5166015625, 21.255859375, 21.9951171875, 22.734375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 1.0, 7.0, 14.0, 6.0, 9.0, 9.0, 17.0, 12.0, 16.0, 24.0, 20.0, 36.0, 23.0, 31.0, 42.0, 43.0, 44.0, 43.0, 44.0, 58.0, 52.0, 57.0, 47.0, 43.0, 41.0, 32.0, 32.0, 34.0, 28.0, 24.0, 13.0, 14.0, 18.0, 13.0, 15.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-15.34375, -14.915283203125, -14.48681640625, -14.058349609375, -13.6298828125, -13.201416015625, -12.77294921875, -12.344482421875, -11.916015625, -11.487548828125, -11.05908203125, -10.630615234375, -10.2021484375, -9.773681640625, -9.34521484375, -8.916748046875, -8.48828125, -8.059814453125, -7.63134765625, -7.202880859375, -6.7744140625, -6.345947265625, -5.91748046875, -5.489013671875, -5.060546875, -4.632080078125, -4.20361328125, -3.775146484375, -3.3466796875, -2.918212890625, -2.48974609375, -2.061279296875, -1.6328125, -1.204345703125, -0.77587890625, -0.347412109375, 0.0810546875, 0.509521484375, 0.93798828125, 1.366455078125, 1.794921875, 2.223388671875, 2.65185546875, 3.080322265625, 3.5087890625, 3.937255859375, 4.36572265625, 4.794189453125, 5.22265625, 5.651123046875, 6.07958984375, 6.508056640625, 6.9365234375, 7.364990234375, 7.79345703125, 8.221923828125, 8.650390625, 9.078857421875, 9.50732421875, 9.935791015625, 10.3642578125, 10.792724609375, 11.22119140625, 11.649658203125, 12.078125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 6.0, 9.0, 12.0, 17.0, 21.0, 23.0, 42.0, 61.0, 81.0, 109.0, 145.0, 207.0, 315.0, 477.0, 724.0, 1215.0, 2211.0, 4094.0, 8173.0, 16676.0, 34862.0, 75483.0, 151671.0, 243722.0, 235411.0, 140494.0, 68874.0, 31701.0, 15161.0, 7440.0, 3787.0, 2020.0, 1182.0, 710.0, 414.0, 276.0, 207.0, 144.0, 99.0, 63.0, 61.0, 40.0, 40.0, 23.0, 13.0, 10.0, 12.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-20.3125, -19.676513671875, -19.04052734375, -18.404541015625, -17.7685546875, -17.132568359375, -16.49658203125, -15.860595703125, -15.224609375, -14.588623046875, -13.95263671875, -13.316650390625, -12.6806640625, -12.044677734375, -11.40869140625, -10.772705078125, -10.13671875, -9.500732421875, -8.86474609375, -8.228759765625, -7.5927734375, -6.956787109375, -6.32080078125, -5.684814453125, -5.048828125, -4.412841796875, -3.77685546875, -3.140869140625, -2.5048828125, -1.868896484375, -1.23291015625, -0.596923828125, 0.0390625, 0.675048828125, 1.31103515625, 1.947021484375, 2.5830078125, 3.218994140625, 3.85498046875, 4.490966796875, 5.126953125, 5.762939453125, 6.39892578125, 7.034912109375, 7.6708984375, 8.306884765625, 8.94287109375, 9.578857421875, 10.21484375, 10.850830078125, 11.48681640625, 12.122802734375, 12.7587890625, 13.394775390625, 14.03076171875, 14.666748046875, 15.302734375, 15.938720703125, 16.57470703125, 17.210693359375, 17.8466796875, 18.482666015625, 19.11865234375, 19.754638671875, 20.390625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 14.0, 11.0, 10.0, 16.0, 25.0, 20.0, 25.0, 33.0, 39.0, 26.0, 49.0, 56.0, 33.0, 41.0, 52.0, 47.0, 43.0, 45.0, 46.0, 37.0, 49.0, 29.0, 30.0, 43.0, 29.0, 26.0, 20.0, 20.0, 14.0, 11.0, 13.0, 11.0, 4.0, 3.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.0703125, -9.806640625, -9.54296875, -9.279296875, -9.015625, -8.751953125, -8.48828125, -8.224609375, -7.9609375, -7.697265625, -7.43359375, -7.169921875, -6.90625, -6.642578125, -6.37890625, -6.115234375, -5.8515625, -5.587890625, -5.32421875, -5.060546875, -4.796875, -4.533203125, -4.26953125, -4.005859375, -3.7421875, -3.478515625, -3.21484375, -2.951171875, -2.6875, -2.423828125, -2.16015625, -1.896484375, -1.6328125, -1.369140625, -1.10546875, -0.841796875, -0.578125, -0.314453125, -0.05078125, 0.212890625, 0.4765625, 0.740234375, 1.00390625, 1.267578125, 1.53125, 1.794921875, 2.05859375, 2.322265625, 2.5859375, 2.849609375, 3.11328125, 3.376953125, 3.640625, 3.904296875, 4.16796875, 4.431640625, 4.6953125, 4.958984375, 5.22265625, 5.486328125, 5.75, 6.013671875, 6.27734375, 6.541015625, 6.8046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 9.0, 6.0, 15.0, 29.0, 22.0, 31.0, 54.0, 78.0, 90.0, 110.0, 174.0, 231.0, 353.0, 501.0, 800.0, 1208.0, 1987.0, 3327.0, 5590.0, 10038.0, 18844.0, 35354.0, 68007.0, 129417.0, 210585.0, 228582.0, 154563.0, 83367.0, 43282.0, 22576.0, 12213.0, 6665.0, 3833.0, 2291.0, 1433.0, 908.0, 593.0, 400.0, 293.0, 197.0, 144.0, 109.0, 76.0, 50.0, 37.0, 29.0, 14.0, 13.0, 11.0, 5.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.1640625, -7.91015625, -7.65625, -7.40234375, -7.1484375, -6.89453125, -6.640625, -6.38671875, -6.1328125, -5.87890625, -5.625, -5.37109375, -5.1171875, -4.86328125, -4.609375, -4.35546875, -4.1015625, -3.84765625, -3.59375, -3.33984375, -3.0859375, -2.83203125, -2.578125, -2.32421875, -2.0703125, -1.81640625, -1.5625, -1.30859375, -1.0546875, -0.80078125, -0.546875, -0.29296875, -0.0390625, 0.21484375, 0.46875, 0.72265625, 0.9765625, 1.23046875, 1.484375, 1.73828125, 1.9921875, 2.24609375, 2.5, 2.75390625, 3.0078125, 3.26171875, 3.515625, 3.76953125, 4.0234375, 4.27734375, 4.53125, 4.78515625, 5.0390625, 5.29296875, 5.546875, 5.80078125, 6.0546875, 6.30859375, 6.5625, 6.81640625, 7.0703125, 7.32421875, 7.578125, 7.83203125, 8.0859375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 9.0, 8.0, 9.0, 16.0, 9.0, 34.0, 18.0, 37.0, 55.0, 64.0, 80.0, 81.0, 77.0, 87.0, 97.0, 78.0, 37.0, 51.0, 33.0, 24.0, 23.0, 11.0, 15.0, 10.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0011339187622070312, -0.001104898750782013, -0.0010758787393569946, -0.0010468587279319763, -0.001017838716506958, -0.0009888187050819397, -0.0009597986936569214, -0.0009307786822319031, -0.0009017586708068848, -0.0008727386593818665, -0.0008437186479568481, -0.0008146986365318298, -0.0007856786251068115, -0.0007566586136817932, -0.0007276386022567749, -0.0006986185908317566, -0.0006695985794067383, -0.00064057856798172, -0.0006115585565567017, -0.0005825385451316833, -0.000553518533706665, -0.0005244985222816467, -0.0004954785108566284, -0.0004664584994316101, -0.0004374384880065918, -0.0004084184765815735, -0.0003793984651565552, -0.00035037845373153687, -0.00032135844230651855, -0.00029233843088150024, -0.00026331841945648193, -0.00023429840803146362, -0.0002052783966064453, -0.000176258385181427, -0.0001472383737564087, -0.00011821836233139038, -8.919835090637207e-05, -6.017833948135376e-05, -3.115832805633545e-05, -2.1383166313171387e-06, 2.6881694793701172e-05, 5.590170621871948e-05, 8.492171764373779e-05, 0.0001139417290687561, 0.00014296174049377441, 0.00017198175191879272, 0.00020100176334381104, 0.00023002177476882935, 0.00025904178619384766, 0.00028806179761886597, 0.0003170818090438843, 0.0003461018204689026, 0.0003751218318939209, 0.0004041418433189392, 0.0004331618547439575, 0.00046218186616897583, 0.0004912018775939941, 0.0005202218890190125, 0.0005492419004440308, 0.0005782619118690491, 0.0006072819232940674, 0.0006363019347190857, 0.000665321946144104, 0.0006943419575691223, 0.0007233619689941406]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 11.0, 11.0, 11.0, 26.0, 35.0, 56.0, 74.0, 70.0, 120.0, 179.0, 239.0, 416.0, 596.0, 976.0, 1618.0, 2659.0, 4889.0, 8986.0, 16789.0, 33133.0, 67011.0, 133677.0, 223501.0, 237980.0, 154044.0, 78817.0, 38863.0, 19540.0, 10485.0, 5602.0, 3124.0, 1866.0, 1071.0, 693.0, 410.0, 284.0, 179.0, 158.0, 96.0, 67.0, 48.0, 35.0, 30.0, 25.0, 12.0, 16.0, 10.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.390625, -8.1209716796875, -7.851318359375, -7.5816650390625, -7.31201171875, -7.0423583984375, -6.772705078125, -6.5030517578125, -6.2333984375, -5.9637451171875, -5.694091796875, -5.4244384765625, -5.15478515625, -4.8851318359375, -4.615478515625, -4.3458251953125, -4.076171875, -3.8065185546875, -3.536865234375, -3.2672119140625, -2.99755859375, -2.7279052734375, -2.458251953125, -2.1885986328125, -1.9189453125, -1.6492919921875, -1.379638671875, -1.1099853515625, -0.84033203125, -0.5706787109375, -0.301025390625, -0.0313720703125, 0.23828125, 0.5079345703125, 0.777587890625, 1.0472412109375, 1.31689453125, 1.5865478515625, 1.856201171875, 2.1258544921875, 2.3955078125, 2.6651611328125, 2.934814453125, 3.2044677734375, 3.47412109375, 3.7437744140625, 4.013427734375, 4.2830810546875, 4.552734375, 4.8223876953125, 5.092041015625, 5.3616943359375, 5.63134765625, 5.9010009765625, 6.170654296875, 6.4403076171875, 6.7099609375, 6.9796142578125, 7.249267578125, 7.5189208984375, 7.78857421875, 8.0582275390625, 8.327880859375, 8.5975341796875, 8.8671875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 0.0, 1.0, 0.0, 4.0, 6.0, 4.0, 1.0, 8.0, 8.0, 7.0, 13.0, 8.0, 15.0, 17.0, 16.0, 26.0, 34.0, 37.0, 34.0, 42.0, 52.0, 68.0, 75.0, 80.0, 55.0, 70.0, 51.0, 56.0, 41.0, 31.0, 24.0, 30.0, 17.0, 10.0, 11.0, 12.0, 12.0, 6.0, 9.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.923828125, -2.8406982421875, -2.757568359375, -2.6744384765625, -2.59130859375, -2.5081787109375, -2.425048828125, -2.3419189453125, -2.2587890625, -2.1756591796875, -2.092529296875, -2.0093994140625, -1.92626953125, -1.8431396484375, -1.760009765625, -1.6768798828125, -1.59375, -1.5106201171875, -1.427490234375, -1.3443603515625, -1.26123046875, -1.1781005859375, -1.094970703125, -1.0118408203125, -0.9287109375, -0.8455810546875, -0.762451171875, -0.6793212890625, -0.59619140625, -0.5130615234375, -0.429931640625, -0.3468017578125, -0.263671875, -0.1805419921875, -0.097412109375, -0.0142822265625, 0.06884765625, 0.1519775390625, 0.235107421875, 0.3182373046875, 0.4013671875, 0.4844970703125, 0.567626953125, 0.6507568359375, 0.73388671875, 0.8170166015625, 0.900146484375, 0.9832763671875, 1.06640625, 1.1495361328125, 1.232666015625, 1.3157958984375, 1.39892578125, 1.4820556640625, 1.565185546875, 1.6483154296875, 1.7314453125, 1.8145751953125, 1.897705078125, 1.9808349609375, 2.06396484375, 2.1470947265625, 2.230224609375, 2.3133544921875, 2.396484375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 8.0, 6.0, 7.0, 20.0, 19.0, 21.0, 25.0, 38.0, 42.0, 70.0, 68.0, 80.0, 79.0, 94.0, 78.0, 64.0, 70.0, 53.0, 38.0, 22.0, 24.0, 16.0, 12.0, 10.0, 6.0, 7.0, 7.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.061565399169922, -25.35848045349121, -24.655397415161133, -23.952312469482422, -23.249229431152344, -22.546144485473633, -21.843059539794922, -21.139976501464844, -20.436893463134766, -19.733808517456055, -19.030725479125977, -18.327640533447266, -17.624557495117188, -16.921472549438477, -16.218387603759766, -15.515304565429688, -14.812219619750977, -14.109135627746582, -13.406051635742188, -12.702966690063477, -11.999883651733398, -11.296798706054688, -10.593714714050293, -9.890630722045898, -9.187546730041504, -8.48446273803711, -7.781378746032715, -7.078294277191162, -6.375210285186768, -5.672126293182373, -4.96904182434082, -4.265957832336426, -3.5628719329833984, -2.859787940979004, -2.1567037105560303, -1.4536194801330566, -0.7505354881286621, -0.04745149612426758, 0.6556329727172852, 1.3587169647216797, 2.061800956726074, 2.7648849487304688, 3.4679691791534424, 4.171053409576416, 4.8741374015808105, 5.577221393585205, 6.280305862426758, 6.983389854431152, 7.686473846435547, 8.389557838439941, 9.092641830444336, 9.795726776123047, 10.498809814453125, 11.201894760131836, 11.90497875213623, 12.608062744140625, 13.31114673614502, 14.014230728149414, 14.717314720153809, 15.420398712158203, 16.123483657836914, 16.826566696166992, 17.529651641845703, 18.23273468017578, 18.935819625854492]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 13.0, 14.0, 13.0, 19.0, 20.0, 16.0, 19.0, 27.0, 28.0, 47.0, 39.0, 37.0, 49.0, 39.0, 61.0, 37.0, 40.0, 58.0, 51.0, 58.0, 45.0, 43.0, 33.0, 28.0, 28.0, 26.0, 18.0, 12.0, 16.0, 16.0, 9.0, 8.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.976397514343262, -13.553116798400879, -13.129836082458496, -12.70655632019043, -12.283275604248047, -11.859994888305664, -11.436714172363281, -11.013433456420898, -10.590153694152832, -10.16687297821045, -9.743592262268066, -9.3203125, -8.897031784057617, -8.473751068115234, -8.050470352172852, -7.627190113067627, -7.203909397125244, -6.780628681182861, -6.357348442077637, -5.934067726135254, -5.510787487030029, -5.0875067710876465, -4.664226531982422, -4.240945816040039, -3.8176653385162354, -3.3943848609924316, -2.971104383468628, -2.547823905944824, -2.1245431900024414, -1.7012627124786377, -1.277982234954834, -0.8547017574310303, -0.43142127990722656, -0.008140772581100464, 0.41513973474502563, 0.8384202718734741, 1.2617007493972778, 1.684981346130371, 2.108261823654175, 2.5315423011779785, 2.9548227787017822, 3.378103256225586, 3.8013837337493896, 4.224664211273193, 4.647944927215576, 5.071225166320801, 5.494505882263184, 5.917786598205566, 6.341066837310791, 6.764347553253174, 7.187627792358398, 7.610908508300781, 8.034189224243164, 8.457469940185547, 8.880749702453613, 9.304030418395996, 9.727311134338379, 10.150591850280762, 10.573872566223145, 10.997152328491211, 11.420433044433594, 11.843713760375977, 12.26699447631836, 12.690275192260742, 13.113554954528809]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 10.0, 17.0, 28.0, 52.0, 90.0, 179.0, 280.0, 547.0, 1088.0, 2446.0, 5311.0, 12701.0, 34321.0, 117322.0, 554860.0, 2081283.0, 1087009.0, 209395.0, 54538.0, 18415.0, 7324.0, 3307.0, 1634.0, 881.0, 484.0, 292.0, 151.0, 106.0, 71.0, 45.0, 31.0, 11.0, 18.0, 8.0, 6.0, 11.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.453125, -23.463134765625, -22.47314453125, -21.483154296875, -20.4931640625, -19.503173828125, -18.51318359375, -17.523193359375, -16.533203125, -15.543212890625, -14.55322265625, -13.563232421875, -12.5732421875, -11.583251953125, -10.59326171875, -9.603271484375, -8.61328125, -7.623291015625, -6.63330078125, -5.643310546875, -4.6533203125, -3.663330078125, -2.67333984375, -1.683349609375, -0.693359375, 0.296630859375, 1.28662109375, 2.276611328125, 3.2666015625, 4.256591796875, 5.24658203125, 6.236572265625, 7.2265625, 8.216552734375, 9.20654296875, 10.196533203125, 11.1865234375, 12.176513671875, 13.16650390625, 14.156494140625, 15.146484375, 16.136474609375, 17.12646484375, 18.116455078125, 19.1064453125, 20.096435546875, 21.08642578125, 22.076416015625, 23.06640625, 24.056396484375, 25.04638671875, 26.036376953125, 27.0263671875, 28.016357421875, 29.00634765625, 29.996337890625, 30.986328125, 31.976318359375, 32.96630859375, 33.956298828125, 34.9462890625, 35.936279296875, 36.92626953125, 37.916259765625, 38.90625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 13.0, 10.0, 10.0, 13.0, 19.0, 18.0, 26.0, 23.0, 33.0, 29.0, 35.0, 36.0, 47.0, 50.0, 53.0, 64.0, 51.0, 52.0, 50.0, 55.0, 41.0, 45.0, 28.0, 36.0, 25.0, 23.0, 19.0, 15.0, 11.0, 17.0, 18.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.919677734375, -9.62060546875, -9.321533203125, -9.0224609375, -8.723388671875, -8.42431640625, -8.125244140625, -7.826171875, -7.527099609375, -7.22802734375, -6.928955078125, -6.6298828125, -6.330810546875, -6.03173828125, -5.732666015625, -5.43359375, -5.134521484375, -4.83544921875, -4.536376953125, -4.2373046875, -3.938232421875, -3.63916015625, -3.340087890625, -3.041015625, -2.741943359375, -2.44287109375, -2.143798828125, -1.8447265625, -1.545654296875, -1.24658203125, -0.947509765625, -0.6484375, -0.349365234375, -0.05029296875, 0.248779296875, 0.5478515625, 0.846923828125, 1.14599609375, 1.445068359375, 1.744140625, 2.043212890625, 2.34228515625, 2.641357421875, 2.9404296875, 3.239501953125, 3.53857421875, 3.837646484375, 4.13671875, 4.435791015625, 4.73486328125, 5.033935546875, 5.3330078125, 5.632080078125, 5.93115234375, 6.230224609375, 6.529296875, 6.828369140625, 7.12744140625, 7.426513671875, 7.7255859375, 8.024658203125, 8.32373046875, 8.622802734375, 8.921875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 14.0, 13.0, 23.0, 34.0, 30.0, 67.0, 114.0, 163.0, 232.0, 363.0, 599.0, 960.0, 1565.0, 2549.0, 4277.0, 7362.0, 13273.0, 24438.0, 46810.0, 96179.0, 209579.0, 480952.0, 1025031.0, 1169337.0, 604605.0, 263613.0, 118769.0, 57140.0, 29325.0, 15526.0, 8739.0, 4886.0, 2984.0, 1812.0, 1074.0, 637.0, 433.0, 255.0, 177.0, 101.0, 83.0, 51.0, 41.0, 27.0, 17.0, 10.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.953125, -16.390625, -15.828125, -15.265625, -14.703125, -14.140625, -13.578125, -13.015625, -12.453125, -11.890625, -11.328125, -10.765625, -10.203125, -9.640625, -9.078125, -8.515625, -7.953125, -7.390625, -6.828125, -6.265625, -5.703125, -5.140625, -4.578125, -4.015625, -3.453125, -2.890625, -2.328125, -1.765625, -1.203125, -0.640625, -0.078125, 0.484375, 1.046875, 1.609375, 2.171875, 2.734375, 3.296875, 3.859375, 4.421875, 4.984375, 5.546875, 6.109375, 6.671875, 7.234375, 7.796875, 8.359375, 8.921875, 9.484375, 10.046875, 10.609375, 11.171875, 11.734375, 12.296875, 12.859375, 13.421875, 13.984375, 14.546875, 15.109375, 15.671875, 16.234375, 16.796875, 17.359375, 17.921875, 18.484375, 19.046875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 11.0, 13.0, 17.0, 22.0, 35.0, 33.0, 52.0, 56.0, 74.0, 118.0, 141.0, 185.0, 229.0, 303.0, 321.0, 357.0, 349.0, 296.0, 295.0, 248.0, 202.0, 164.0, 127.0, 90.0, 94.0, 54.0, 39.0, 25.0, 29.0, 24.0, 12.0, 7.0, 16.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0859375, -5.90789794921875, -5.7298583984375, -5.55181884765625, -5.373779296875, -5.19573974609375, -5.0177001953125, -4.83966064453125, -4.66162109375, -4.48358154296875, -4.3055419921875, -4.12750244140625, -3.949462890625, -3.77142333984375, -3.5933837890625, -3.41534423828125, -3.2373046875, -3.05926513671875, -2.8812255859375, -2.70318603515625, -2.525146484375, -2.34710693359375, -2.1690673828125, -1.99102783203125, -1.81298828125, -1.63494873046875, -1.4569091796875, -1.27886962890625, -1.100830078125, -0.92279052734375, -0.7447509765625, -0.56671142578125, -0.388671875, -0.21063232421875, -0.0325927734375, 0.14544677734375, 0.323486328125, 0.50152587890625, 0.6795654296875, 0.85760498046875, 1.03564453125, 1.21368408203125, 1.3917236328125, 1.56976318359375, 1.747802734375, 1.92584228515625, 2.1038818359375, 2.28192138671875, 2.4599609375, 2.63800048828125, 2.8160400390625, 2.99407958984375, 3.172119140625, 3.35015869140625, 3.5281982421875, 3.70623779296875, 3.88427734375, 4.06231689453125, 4.2403564453125, 4.41839599609375, 4.596435546875, 4.77447509765625, 4.9525146484375, 5.13055419921875, 5.30859375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 3.0, 7.0, 10.0, 10.0, 26.0, 27.0, 29.0, 39.0, 59.0, 70.0, 70.0, 102.0, 88.0, 72.0, 83.0, 65.0, 58.0, 41.0, 19.0, 28.0, 15.0, 17.0, 8.0, 12.0, 6.0, 6.0, 4.0, 4.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.464479446411133, -22.782136917114258, -22.099794387817383, -21.417451858520508, -20.735107421875, -20.052764892578125, -19.37042236328125, -18.688079833984375, -18.0057373046875, -17.323394775390625, -16.64105224609375, -15.958708763122559, -15.276366233825684, -14.594023704528809, -13.911680221557617, -13.229337692260742, -12.546995162963867, -11.864652633666992, -11.182310104370117, -10.499966621398926, -9.81762409210205, -9.135281562805176, -8.452938079833984, -7.770595550537109, -7.088253021240234, -6.405910491943359, -5.723567485809326, -5.041224479675293, -4.358881950378418, -3.676539182662964, -2.9941964149475098, -2.3118534088134766, -1.6295089721679688, -0.9471662044525146, -0.26482343673706055, 0.41751933097839355, 1.0998620986938477, 1.7822048664093018, 2.464547634124756, 3.146890640258789, 3.829233169555664, 4.511575698852539, 5.193918704986572, 5.8762617111206055, 6.5586042404174805, 7.2409467697143555, 7.923289775848389, 8.605632781982422, 9.287975311279297, 9.970317840576172, 10.652660369873047, 11.335003852844238, 12.017346382141113, 12.699688911437988, 13.38203239440918, 14.064374923706055, 14.74671745300293, 15.429059982299805, 16.11140251159668, 16.793745040893555, 17.476089477539062, 18.158432006835938, 18.840774536132812, 19.523117065429688, 20.205459594726562]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 6.0, 10.0, 5.0, 11.0, 11.0, 7.0, 13.0, 20.0, 18.0, 25.0, 20.0, 23.0, 24.0, 39.0, 47.0, 49.0, 41.0, 38.0, 47.0, 46.0, 48.0, 44.0, 47.0, 43.0, 36.0, 44.0, 40.0, 30.0, 20.0, 24.0, 15.0, 18.0, 21.0, 13.0, 14.0, 7.0, 6.0, 5.0, 9.0, 5.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.00927734375, -11.652820587158203, -11.296363830566406, -10.93990707397461, -10.583450317382812, -10.226994514465332, -9.870537757873535, -9.514081001281738, -9.157624244689941, -8.801167488098145, -8.444710731506348, -8.08825397491455, -7.731797695159912, -7.375340938568115, -7.018884658813477, -6.66242790222168, -6.305971145629883, -5.949514389038086, -5.593057632446289, -5.23660135269165, -4.8801445960998535, -4.523687839508057, -4.167231559753418, -3.810774803161621, -3.454318046569824, -3.0978612899780273, -2.7414047718048096, -2.384948253631592, -2.028491497039795, -1.6720348596572876, -1.3155782222747803, -0.9591217041015625, -0.602665901184082, -0.2462092638015747, 0.11024737358093262, 0.46670401096343994, 0.8231606483459473, 1.1796172857284546, 1.536073923110962, 1.8925304412841797, 2.2489871978759766, 2.6054439544677734, 2.961900472640991, 3.318356990814209, 3.674813747406006, 4.031270503997803, 4.387726783752441, 4.744183540344238, 5.100640296936035, 5.457097053527832, 5.813553810119629, 6.170010089874268, 6.5264668464660645, 6.882923603057861, 7.2393798828125, 7.595836639404297, 7.952293395996094, 8.30875015258789, 8.665206909179688, 9.021663665771484, 9.378120422363281, 9.734576225280762, 10.091032981872559, 10.447489738464355, 10.803946495056152]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 12.0, 9.0, 19.0, 15.0, 41.0, 36.0, 55.0, 78.0, 112.0, 184.0, 312.0, 418.0, 768.0, 1280.0, 2231.0, 3812.0, 7027.0, 13418.0, 28005.0, 60877.0, 134334.0, 256058.0, 265857.0, 145305.0, 66184.0, 30125.0, 14600.0, 7588.0, 4037.0, 2219.0, 1366.0, 790.0, 467.0, 273.0, 185.0, 119.0, 96.0, 58.0, 49.0, 40.0, 21.0, 21.0, 10.0, 12.0, 12.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.9296875, -10.5989990234375, -10.268310546875, -9.9376220703125, -9.60693359375, -9.2762451171875, -8.945556640625, -8.6148681640625, -8.2841796875, -7.9534912109375, -7.622802734375, -7.2921142578125, -6.96142578125, -6.6307373046875, -6.300048828125, -5.9693603515625, -5.638671875, -5.3079833984375, -4.977294921875, -4.6466064453125, -4.31591796875, -3.9852294921875, -3.654541015625, -3.3238525390625, -2.9931640625, -2.6624755859375, -2.331787109375, -2.0010986328125, -1.67041015625, -1.3397216796875, -1.009033203125, -0.6783447265625, -0.34765625, -0.0169677734375, 0.313720703125, 0.6444091796875, 0.97509765625, 1.3057861328125, 1.636474609375, 1.9671630859375, 2.2978515625, 2.6285400390625, 2.959228515625, 3.2899169921875, 3.62060546875, 3.9512939453125, 4.281982421875, 4.6126708984375, 4.943359375, 5.2740478515625, 5.604736328125, 5.9354248046875, 6.26611328125, 6.5968017578125, 6.927490234375, 7.2581787109375, 7.5888671875, 7.9195556640625, 8.250244140625, 8.5809326171875, 8.91162109375, 9.2423095703125, 9.572998046875, 9.9036865234375, 10.234375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 4.0, 10.0, 9.0, 11.0, 8.0, 10.0, 15.0, 17.0, 13.0, 23.0, 33.0, 17.0, 32.0, 36.0, 33.0, 42.0, 44.0, 54.0, 50.0, 47.0, 66.0, 37.0, 44.0, 28.0, 38.0, 42.0, 33.0, 29.0, 28.0, 19.0, 16.0, 19.0, 21.0, 12.0, 7.0, 5.0, 11.0, 6.0, 3.0, 6.0, 8.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-13.3125, -12.9403076171875, -12.568115234375, -12.1959228515625, -11.82373046875, -11.4515380859375, -11.079345703125, -10.7071533203125, -10.3349609375, -9.9627685546875, -9.590576171875, -9.2183837890625, -8.84619140625, -8.4739990234375, -8.101806640625, -7.7296142578125, -7.357421875, -6.9852294921875, -6.613037109375, -6.2408447265625, -5.86865234375, -5.4964599609375, -5.124267578125, -4.7520751953125, -4.3798828125, -4.0076904296875, -3.635498046875, -3.2633056640625, -2.89111328125, -2.5189208984375, -2.146728515625, -1.7745361328125, -1.40234375, -1.0301513671875, -0.657958984375, -0.2857666015625, 0.08642578125, 0.4586181640625, 0.830810546875, 1.2030029296875, 1.5751953125, 1.9473876953125, 2.319580078125, 2.6917724609375, 3.06396484375, 3.4361572265625, 3.808349609375, 4.1805419921875, 4.552734375, 4.9249267578125, 5.297119140625, 5.6693115234375, 6.04150390625, 6.4136962890625, 6.785888671875, 7.1580810546875, 7.5302734375, 7.9024658203125, 8.274658203125, 8.6468505859375, 9.01904296875, 9.3912353515625, 9.763427734375, 10.1356201171875, 10.5078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 6.0, 12.0, 20.0, 15.0, 25.0, 38.0, 47.0, 86.0, 110.0, 178.0, 227.0, 371.0, 571.0, 934.0, 1487.0, 2593.0, 4607.0, 8908.0, 17868.0, 40172.0, 97612.0, 236540.0, 333131.0, 174031.0, 69861.0, 29301.0, 13711.0, 6897.0, 3652.0, 2083.0, 1261.0, 769.0, 494.0, 320.0, 190.0, 126.0, 82.0, 74.0, 45.0, 22.0, 17.0, 17.0, 16.0, 7.0, 10.0, 8.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-14.7578125, -14.3277587890625, -13.897705078125, -13.4676513671875, -13.03759765625, -12.6075439453125, -12.177490234375, -11.7474365234375, -11.3173828125, -10.8873291015625, -10.457275390625, -10.0272216796875, -9.59716796875, -9.1671142578125, -8.737060546875, -8.3070068359375, -7.876953125, -7.4468994140625, -7.016845703125, -6.5867919921875, -6.15673828125, -5.7266845703125, -5.296630859375, -4.8665771484375, -4.4365234375, -4.0064697265625, -3.576416015625, -3.1463623046875, -2.71630859375, -2.2862548828125, -1.856201171875, -1.4261474609375, -0.99609375, -0.5660400390625, -0.135986328125, 0.2940673828125, 0.72412109375, 1.1541748046875, 1.584228515625, 2.0142822265625, 2.4443359375, 2.8743896484375, 3.304443359375, 3.7344970703125, 4.16455078125, 4.5946044921875, 5.024658203125, 5.4547119140625, 5.884765625, 6.3148193359375, 6.744873046875, 7.1749267578125, 7.60498046875, 8.0350341796875, 8.465087890625, 8.8951416015625, 9.3251953125, 9.7552490234375, 10.185302734375, 10.6153564453125, 11.04541015625, 11.4754638671875, 11.905517578125, 12.3355712890625, 12.765625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 3.0, 7.0, 8.0, 13.0, 8.0, 12.0, 11.0, 17.0, 20.0, 21.0, 31.0, 29.0, 25.0, 38.0, 29.0, 28.0, 41.0, 28.0, 41.0, 45.0, 35.0, 48.0, 44.0, 41.0, 27.0, 41.0, 44.0, 41.0, 34.0, 22.0, 19.0, 31.0, 19.0, 17.0, 20.0, 7.0, 10.0, 8.0, 11.0, 6.0, 8.0, 3.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.9296875, -6.72015380859375, -6.5106201171875, -6.30108642578125, -6.091552734375, -5.88201904296875, -5.6724853515625, -5.46295166015625, -5.25341796875, -5.04388427734375, -4.8343505859375, -4.62481689453125, -4.415283203125, -4.20574951171875, -3.9962158203125, -3.78668212890625, -3.5771484375, -3.36761474609375, -3.1580810546875, -2.94854736328125, -2.739013671875, -2.52947998046875, -2.3199462890625, -2.11041259765625, -1.90087890625, -1.69134521484375, -1.4818115234375, -1.27227783203125, -1.062744140625, -0.85321044921875, -0.6436767578125, -0.43414306640625, -0.224609375, -0.01507568359375, 0.1944580078125, 0.40399169921875, 0.613525390625, 0.82305908203125, 1.0325927734375, 1.24212646484375, 1.45166015625, 1.66119384765625, 1.8707275390625, 2.08026123046875, 2.289794921875, 2.49932861328125, 2.7088623046875, 2.91839599609375, 3.1279296875, 3.33746337890625, 3.5469970703125, 3.75653076171875, 3.966064453125, 4.17559814453125, 4.3851318359375, 4.59466552734375, 4.80419921875, 5.01373291015625, 5.2232666015625, 5.43280029296875, 5.642333984375, 5.85186767578125, 6.0614013671875, 6.27093505859375, 6.48046875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 10.0, 14.0, 22.0, 19.0, 34.0, 53.0, 59.0, 78.0, 157.0, 247.0, 330.0, 536.0, 845.0, 1495.0, 2781.0, 5390.0, 10822.0, 25129.0, 63105.0, 172528.0, 373762.0, 240611.0, 87924.0, 33721.0, 14312.0, 6531.0, 3321.0, 1825.0, 1026.0, 651.0, 395.0, 268.0, 171.0, 117.0, 78.0, 53.0, 35.0, 18.0, 28.0, 18.0, 11.0, 4.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.05078125, -4.89129638671875, -4.7318115234375, -4.57232666015625, -4.412841796875, -4.25335693359375, -4.0938720703125, -3.93438720703125, -3.77490234375, -3.61541748046875, -3.4559326171875, -3.29644775390625, -3.136962890625, -2.97747802734375, -2.8179931640625, -2.65850830078125, -2.4990234375, -2.33953857421875, -2.1800537109375, -2.02056884765625, -1.861083984375, -1.70159912109375, -1.5421142578125, -1.38262939453125, -1.22314453125, -1.06365966796875, -0.9041748046875, -0.74468994140625, -0.585205078125, -0.42572021484375, -0.2662353515625, -0.10675048828125, 0.052734375, 0.21221923828125, 0.3717041015625, 0.53118896484375, 0.690673828125, 0.85015869140625, 1.0096435546875, 1.16912841796875, 1.32861328125, 1.48809814453125, 1.6475830078125, 1.80706787109375, 1.966552734375, 2.12603759765625, 2.2855224609375, 2.44500732421875, 2.6044921875, 2.76397705078125, 2.9234619140625, 3.08294677734375, 3.242431640625, 3.40191650390625, 3.5614013671875, 3.72088623046875, 3.88037109375, 4.03985595703125, 4.1993408203125, 4.35882568359375, 4.518310546875, 4.67779541015625, 4.8372802734375, 4.99676513671875, 5.15625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 9.0, 12.0, 20.0, 22.0, 29.0, 40.0, 46.0, 59.0, 69.0, 103.0, 89.0, 89.0, 79.0, 77.0, 52.0, 46.0, 33.0, 26.0, 23.0, 9.0, 7.0, 9.0, 4.0, 5.0, 1.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003216266632080078, -0.0003117993474006653, -0.00030197203159332275, -0.0002921447157859802, -0.0002823173999786377, -0.00027249008417129517, -0.00026266276836395264, -0.0002528354525566101, -0.00024300813674926758, -0.00023318082094192505, -0.00022335350513458252, -0.00021352618932724, -0.00020369887351989746, -0.00019387155771255493, -0.0001840442419052124, -0.00017421692609786987, -0.00016438961029052734, -0.00015456229448318481, -0.00014473497867584229, -0.00013490766286849976, -0.00012508034706115723, -0.0001152530312538147, -0.00010542571544647217, -9.559839963912964e-05, -8.577108383178711e-05, -7.594376802444458e-05, -6.611645221710205e-05, -5.628913640975952e-05, -4.646182060241699e-05, -3.663450479507446e-05, -2.6807188987731934e-05, -1.6979873180389404e-05, -7.152557373046875e-06, 2.6747584342956543e-06, 1.2502074241638184e-05, 2.2329390048980713e-05, 3.215670585632324e-05, 4.198402166366577e-05, 5.18113374710083e-05, 6.163865327835083e-05, 7.146596908569336e-05, 8.129328489303589e-05, 9.112060070037842e-05, 0.00010094791650772095, 0.00011077523231506348, 0.000120602548122406, 0.00013042986392974854, 0.00014025717973709106, 0.0001500844955444336, 0.00015991181135177612, 0.00016973912715911865, 0.00017956644296646118, 0.0001893937587738037, 0.00019922107458114624, 0.00020904839038848877, 0.0002188757061958313, 0.00022870302200317383, 0.00023853033781051636, 0.0002483576536178589, 0.0002581849694252014, 0.00026801228523254395, 0.0002778396010398865, 0.000287666916847229, 0.00029749423265457153, 0.00030732154846191406]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 14.0, 20.0, 17.0, 22.0, 25.0, 33.0, 56.0, 52.0, 113.0, 114.0, 173.0, 229.0, 315.0, 411.0, 594.0, 912.0, 1470.0, 2445.0, 4652.0, 9602.0, 21253.0, 50508.0, 126737.0, 271195.0, 296039.0, 151386.0, 60822.0, 25280.0, 11113.0, 5303.0, 2724.0, 1571.0, 968.0, 668.0, 434.0, 322.0, 241.0, 202.0, 135.0, 113.0, 66.0, 52.0, 39.0, 42.0, 17.0, 19.0, 15.0, 11.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.65625, -4.50653076171875, -4.3568115234375, -4.20709228515625, -4.057373046875, -3.90765380859375, -3.7579345703125, -3.60821533203125, -3.45849609375, -3.30877685546875, -3.1590576171875, -3.00933837890625, -2.859619140625, -2.70989990234375, -2.5601806640625, -2.41046142578125, -2.2607421875, -2.11102294921875, -1.9613037109375, -1.81158447265625, -1.661865234375, -1.51214599609375, -1.3624267578125, -1.21270751953125, -1.06298828125, -0.91326904296875, -0.7635498046875, -0.61383056640625, -0.464111328125, -0.31439208984375, -0.1646728515625, -0.01495361328125, 0.134765625, 0.28448486328125, 0.4342041015625, 0.58392333984375, 0.733642578125, 0.88336181640625, 1.0330810546875, 1.18280029296875, 1.33251953125, 1.48223876953125, 1.6319580078125, 1.78167724609375, 1.931396484375, 2.08111572265625, 2.2308349609375, 2.38055419921875, 2.5302734375, 2.67999267578125, 2.8297119140625, 2.97943115234375, 3.129150390625, 3.27886962890625, 3.4285888671875, 3.57830810546875, 3.72802734375, 3.87774658203125, 4.0274658203125, 4.17718505859375, 4.326904296875, 4.47662353515625, 4.6263427734375, 4.77606201171875, 4.92578125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 10.0, 21.0, 29.0, 43.0, 59.0, 85.0, 110.0, 114.0, 117.0, 115.0, 85.0, 66.0, 33.0, 39.0, 19.0, 12.0, 11.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8974609375, -1.8362579345703125, -1.775054931640625, -1.7138519287109375, -1.65264892578125, -1.5914459228515625, -1.530242919921875, -1.4690399169921875, -1.4078369140625, -1.3466339111328125, -1.285430908203125, -1.2242279052734375, -1.16302490234375, -1.1018218994140625, -1.040618896484375, -0.9794158935546875, -0.918212890625, -0.8570098876953125, -0.795806884765625, -0.7346038818359375, -0.67340087890625, -0.6121978759765625, -0.550994873046875, -0.4897918701171875, -0.4285888671875, -0.3673858642578125, -0.306182861328125, -0.2449798583984375, -0.18377685546875, -0.1225738525390625, -0.061370849609375, -0.0001678466796875, 0.06103515625, 0.1222381591796875, 0.183441162109375, 0.2446441650390625, 0.30584716796875, 0.3670501708984375, 0.428253173828125, 0.4894561767578125, 0.5506591796875, 0.6118621826171875, 0.673065185546875, 0.7342681884765625, 0.79547119140625, 0.8566741943359375, 0.917877197265625, 0.9790802001953125, 1.040283203125, 1.1014862060546875, 1.162689208984375, 1.2238922119140625, 1.28509521484375, 1.3462982177734375, 1.407501220703125, 1.4687042236328125, 1.5299072265625, 1.5911102294921875, 1.652313232421875, 1.7135162353515625, 1.77471923828125, 1.8359222412109375, 1.897125244140625, 1.9583282470703125, 2.01953125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 3.0, 9.0, 15.0, 15.0, 31.0, 28.0, 33.0, 59.0, 67.0, 82.0, 89.0, 99.0, 87.0, 74.0, 73.0, 55.0, 35.0, 29.0, 24.0, 11.0, 23.0, 9.0, 8.0, 7.0, 8.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.203750610351562, -24.492664337158203, -23.78157615661621, -23.07048988342285, -22.35940170288086, -21.6483154296875, -20.93722915649414, -20.22614097595215, -19.51505470275879, -18.80396842956543, -18.092880249023438, -17.381793975830078, -16.670705795288086, -15.959619522094727, -15.24853229522705, -14.537445068359375, -13.8263578414917, -13.115270614624023, -12.404183387756348, -11.693096160888672, -10.982009887695312, -10.270922660827637, -9.559835433959961, -8.848749160766602, -8.13766098022461, -7.426573753356934, -6.715487003326416, -6.00439977645874, -5.293313026428223, -4.582225799560547, -3.871138572692871, -3.1600518226623535, -2.448965072631836, -1.7378780841827393, -1.026790976524353, -0.3157038688659668, 0.3953831195831299, 1.1064701080322266, 1.8175573348999023, 2.52864408493042, 3.2397313117980957, 3.9508183002471924, 4.661905288696289, 5.372992515563965, 6.084079742431641, 6.795166492462158, 7.506253719329834, 8.217340469360352, 8.928427696228027, 9.639514923095703, 10.350602149963379, 11.061689376831055, 11.772775650024414, 12.48386287689209, 13.194950103759766, 13.906036376953125, 14.617124557495117, 15.328211784362793, 16.03929901123047, 16.750385284423828, 17.46147346496582, 18.17255973815918, 18.883647918701172, 19.59473419189453, 20.30582046508789]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 3.0, 7.0, 9.0, 8.0, 12.0, 7.0, 11.0, 16.0, 17.0, 17.0, 25.0, 21.0, 21.0, 25.0, 43.0, 40.0, 42.0, 45.0, 37.0, 48.0, 45.0, 42.0, 49.0, 51.0, 34.0, 46.0, 36.0, 39.0, 32.0, 23.0, 20.0, 16.0, 23.0, 17.0, 17.0, 12.0, 5.0, 9.0, 6.0, 6.0, 8.0, 2.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.688831329345703, -11.343927383422852, -10.999024391174316, -10.654120445251465, -10.30921745300293, -9.964313507080078, -9.619409561157227, -9.274505615234375, -8.92960262298584, -8.584698677062988, -8.239795684814453, -7.894891738891602, -7.549988269805908, -7.205084800720215, -6.860180854797363, -6.51527738571167, -6.170373916625977, -5.825470447540283, -5.48056697845459, -5.135663032531738, -4.790759563446045, -4.445856094360352, -4.1009521484375, -3.7560486793518066, -3.4111452102661133, -3.06624174118042, -2.7213380336761475, -2.376434326171875, -2.0315308570861816, -1.6866272687911987, -1.3417236804962158, -0.9968199729919434, -0.6519174575805664, -0.3070138692855835, 0.037889719009399414, 0.3827933073043823, 0.7276968955993652, 1.0726004838943481, 1.417504072189331, 1.7624077796936035, 2.107311248779297, 2.4522147178649902, 2.7971184253692627, 3.142022132873535, 3.4869256019592285, 3.831829071044922, 4.176733016967773, 4.521636486053467, 4.86653995513916, 5.2114434242248535, 5.556346893310547, 5.901250839233398, 6.246154308319092, 6.591057777404785, 6.935961723327637, 7.28086519241333, 7.625768661499023, 7.970672130584717, 8.31557559967041, 8.660479545593262, 9.005382537841797, 9.350286483764648, 9.6951904296875, 10.040094375610352, 10.384997367858887]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 5.0, 12.0, 7.0, 13.0, 20.0, 40.0, 41.0, 68.0, 119.0, 169.0, 280.0, 407.0, 679.0, 1065.0, 1701.0, 2879.0, 4736.0, 7924.0, 13978.0, 24311.0, 42409.0, 72150.0, 118963.0, 171616.0, 189690.0, 153105.0, 99673.0, 59650.0, 34689.0, 19721.0, 11425.0, 6817.0, 3986.0, 2291.0, 1471.0, 902.0, 531.0, 327.0, 233.0, 138.0, 110.0, 81.0, 41.0, 24.0, 21.0, 13.0, 3.0, 6.0, 3.0, 6.0, 2.0, 2.0, 4.0, 3.0], "bins": [-15.1015625, -14.6614990234375, -14.221435546875, -13.7813720703125, -13.34130859375, -12.9012451171875, -12.461181640625, -12.0211181640625, -11.5810546875, -11.1409912109375, -10.700927734375, -10.2608642578125, -9.82080078125, -9.3807373046875, -8.940673828125, -8.5006103515625, -8.060546875, -7.6204833984375, -7.180419921875, -6.7403564453125, -6.30029296875, -5.8602294921875, -5.420166015625, -4.9801025390625, -4.5400390625, -4.0999755859375, -3.659912109375, -3.2198486328125, -2.77978515625, -2.3397216796875, -1.899658203125, -1.4595947265625, -1.01953125, -0.5794677734375, -0.139404296875, 0.3006591796875, 0.74072265625, 1.1807861328125, 1.620849609375, 2.0609130859375, 2.5009765625, 2.9410400390625, 3.381103515625, 3.8211669921875, 4.26123046875, 4.7012939453125, 5.141357421875, 5.5814208984375, 6.021484375, 6.4615478515625, 6.901611328125, 7.3416748046875, 7.78173828125, 8.2218017578125, 8.661865234375, 9.1019287109375, 9.5419921875, 9.9820556640625, 10.422119140625, 10.8621826171875, 11.30224609375, 11.7423095703125, 12.182373046875, 12.6224365234375, 13.0625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 4.0, 9.0, 4.0, 7.0, 14.0, 15.0, 17.0, 21.0, 24.0, 21.0, 31.0, 44.0, 43.0, 50.0, 51.0, 49.0, 46.0, 45.0, 50.0, 56.0, 40.0, 58.0, 37.0, 44.0, 30.0, 34.0, 24.0, 24.0, 24.0, 17.0, 10.0, 8.0, 15.0, 5.0, 6.0, 9.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.59375, -12.183837890625, -11.77392578125, -11.364013671875, -10.9541015625, -10.544189453125, -10.13427734375, -9.724365234375, -9.314453125, -8.904541015625, -8.49462890625, -8.084716796875, -7.6748046875, -7.264892578125, -6.85498046875, -6.445068359375, -6.03515625, -5.625244140625, -5.21533203125, -4.805419921875, -4.3955078125, -3.985595703125, -3.57568359375, -3.165771484375, -2.755859375, -2.345947265625, -1.93603515625, -1.526123046875, -1.1162109375, -0.706298828125, -0.29638671875, 0.113525390625, 0.5234375, 0.933349609375, 1.34326171875, 1.753173828125, 2.1630859375, 2.572998046875, 2.98291015625, 3.392822265625, 3.802734375, 4.212646484375, 4.62255859375, 5.032470703125, 5.4423828125, 5.852294921875, 6.26220703125, 6.672119140625, 7.08203125, 7.491943359375, 7.90185546875, 8.311767578125, 8.7216796875, 9.131591796875, 9.54150390625, 9.951416015625, 10.361328125, 10.771240234375, 11.18115234375, 11.591064453125, 12.0009765625, 12.410888671875, 12.82080078125, 13.230712890625, 13.640625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 2.0, 6.0, 10.0, 16.0, 16.0, 31.0, 38.0, 70.0, 108.0, 130.0, 209.0, 297.0, 512.0, 840.0, 1385.0, 2353.0, 4073.0, 7239.0, 13249.0, 25557.0, 49297.0, 94381.0, 164703.0, 222726.0, 196780.0, 123594.0, 66357.0, 34520.0, 17776.0, 9555.0, 5230.0, 2913.0, 1713.0, 1069.0, 659.0, 381.0, 236.0, 168.0, 112.0, 70.0, 51.0, 36.0, 23.0, 21.0, 14.0, 8.0, 7.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.15625, -16.615478515625, -16.07470703125, -15.533935546875, -14.9931640625, -14.452392578125, -13.91162109375, -13.370849609375, -12.830078125, -12.289306640625, -11.74853515625, -11.207763671875, -10.6669921875, -10.126220703125, -9.58544921875, -9.044677734375, -8.50390625, -7.963134765625, -7.42236328125, -6.881591796875, -6.3408203125, -5.800048828125, -5.25927734375, -4.718505859375, -4.177734375, -3.636962890625, -3.09619140625, -2.555419921875, -2.0146484375, -1.473876953125, -0.93310546875, -0.392333984375, 0.1484375, 0.689208984375, 1.22998046875, 1.770751953125, 2.3115234375, 2.852294921875, 3.39306640625, 3.933837890625, 4.474609375, 5.015380859375, 5.55615234375, 6.096923828125, 6.6376953125, 7.178466796875, 7.71923828125, 8.260009765625, 8.80078125, 9.341552734375, 9.88232421875, 10.423095703125, 10.9638671875, 11.504638671875, 12.04541015625, 12.586181640625, 13.126953125, 13.667724609375, 14.20849609375, 14.749267578125, 15.2900390625, 15.830810546875, 16.37158203125, 16.912353515625, 17.453125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 6.0, 6.0, 3.0, 5.0, 5.0, 10.0, 11.0, 13.0, 7.0, 20.0, 29.0, 14.0, 27.0, 21.0, 23.0, 32.0, 25.0, 42.0, 39.0, 31.0, 30.0, 34.0, 44.0, 41.0, 35.0, 34.0, 35.0, 37.0, 37.0, 27.0, 28.0, 32.0, 22.0, 30.0, 21.0, 15.0, 16.0, 16.0, 15.0, 15.0, 14.0, 10.0, 9.0, 3.0, 8.0, 2.0, 6.0, 3.0, 4.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0], "bins": [-6.01953125, -5.82952880859375, -5.6395263671875, -5.44952392578125, -5.259521484375, -5.06951904296875, -4.8795166015625, -4.68951416015625, -4.49951171875, -4.30950927734375, -4.1195068359375, -3.92950439453125, -3.739501953125, -3.54949951171875, -3.3594970703125, -3.16949462890625, -2.9794921875, -2.78948974609375, -2.5994873046875, -2.40948486328125, -2.219482421875, -2.02947998046875, -1.8394775390625, -1.64947509765625, -1.45947265625, -1.26947021484375, -1.0794677734375, -0.88946533203125, -0.699462890625, -0.50946044921875, -0.3194580078125, -0.12945556640625, 0.060546875, 0.25054931640625, 0.4405517578125, 0.63055419921875, 0.820556640625, 1.01055908203125, 1.2005615234375, 1.39056396484375, 1.58056640625, 1.77056884765625, 1.9605712890625, 2.15057373046875, 2.340576171875, 2.53057861328125, 2.7205810546875, 2.91058349609375, 3.1005859375, 3.29058837890625, 3.4805908203125, 3.67059326171875, 3.860595703125, 4.05059814453125, 4.2406005859375, 4.43060302734375, 4.62060546875, 4.81060791015625, 5.0006103515625, 5.19061279296875, 5.380615234375, 5.57061767578125, 5.7606201171875, 5.95062255859375, 6.140625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 11.0, 10.0, 25.0, 35.0, 50.0, 101.0, 125.0, 209.0, 366.0, 640.0, 1035.0, 1816.0, 3086.0, 5288.0, 9748.0, 18050.0, 33747.0, 64932.0, 122252.0, 199199.0, 226885.0, 164458.0, 91694.0, 48467.0, 25113.0, 13586.0, 7469.0, 4183.0, 2388.0, 1412.0, 845.0, 498.0, 327.0, 196.0, 130.0, 58.0, 41.0, 28.0, 23.0, 10.0, 8.0, 5.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.853515625, -5.66015625, -5.466796875, -5.2734375, -5.080078125, -4.88671875, -4.693359375, -4.5, -4.306640625, -4.11328125, -3.919921875, -3.7265625, -3.533203125, -3.33984375, -3.146484375, -2.953125, -2.759765625, -2.56640625, -2.373046875, -2.1796875, -1.986328125, -1.79296875, -1.599609375, -1.40625, -1.212890625, -1.01953125, -0.826171875, -0.6328125, -0.439453125, -0.24609375, -0.052734375, 0.140625, 0.333984375, 0.52734375, 0.720703125, 0.9140625, 1.107421875, 1.30078125, 1.494140625, 1.6875, 1.880859375, 2.07421875, 2.267578125, 2.4609375, 2.654296875, 2.84765625, 3.041015625, 3.234375, 3.427734375, 3.62109375, 3.814453125, 4.0078125, 4.201171875, 4.39453125, 4.587890625, 4.78125, 4.974609375, 5.16796875, 5.361328125, 5.5546875, 5.748046875, 5.94140625, 6.134765625, 6.328125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 5.0, 7.0, 24.0, 28.0, 33.0, 31.0, 56.0, 55.0, 65.0, 87.0, 89.0, 114.0, 73.0, 61.0, 69.0, 47.0, 48.0, 23.0, 26.0, 13.0, 9.0, 11.0, 4.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007867813110351562, -0.0007650107145309448, -0.0007432401180267334, -0.000721469521522522, -0.0006996989250183105, -0.0006779283285140991, -0.0006561577320098877, -0.0006343871355056763, -0.0006126165390014648, -0.0005908459424972534, -0.000569075345993042, -0.0005473047494888306, -0.0005255341529846191, -0.0005037635564804077, -0.0004819929599761963, -0.00046022236347198486, -0.00043845176696777344, -0.000416681170463562, -0.0003949105739593506, -0.00037313997745513916, -0.00035136938095092773, -0.0003295987844467163, -0.0003078281879425049, -0.00028605759143829346, -0.00026428699493408203, -0.0002425163984298706, -0.00022074580192565918, -0.00019897520542144775, -0.00017720460891723633, -0.0001554340124130249, -0.00013366341590881348, -0.00011189281940460205, -9.012222290039062e-05, -6.83516263961792e-05, -4.6581029891967773e-05, -2.4810433387756348e-05, -3.039836883544922e-06, 1.8730759620666504e-05, 4.050135612487793e-05, 6.227195262908936e-05, 8.404254913330078e-05, 0.00010581314563751221, 0.00012758374214172363, 0.00014935433864593506, 0.00017112493515014648, 0.0001928955316543579, 0.00021466612815856934, 0.00023643672466278076, 0.0002582073211669922, 0.0002799779176712036, 0.00030174851417541504, 0.00032351911067962646, 0.0003452897071838379, 0.0003670603036880493, 0.00038883090019226074, 0.00041060149669647217, 0.0004323720932006836, 0.000454142689704895, 0.00047591328620910645, 0.0004976838827133179, 0.0005194544792175293, 0.0005412250757217407, 0.0005629956722259521, 0.0005847662687301636, 0.000606536865234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 10.0, 7.0, 25.0, 31.0, 41.0, 59.0, 99.0, 151.0, 223.0, 379.0, 623.0, 1097.0, 1682.0, 2824.0, 4824.0, 8138.0, 14275.0, 25776.0, 46251.0, 82568.0, 140457.0, 201650.0, 198523.0, 136420.0, 79832.0, 44303.0, 24591.0, 14080.0, 7965.0, 4527.0, 2691.0, 1675.0, 1014.0, 641.0, 406.0, 238.0, 148.0, 107.0, 72.0, 43.0, 22.0, 18.0, 21.0, 11.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.70703125, -6.52056884765625, -6.3341064453125, -6.14764404296875, -5.961181640625, -5.77471923828125, -5.5882568359375, -5.40179443359375, -5.21533203125, -5.02886962890625, -4.8424072265625, -4.65594482421875, -4.469482421875, -4.28302001953125, -4.0965576171875, -3.91009521484375, -3.7236328125, -3.53717041015625, -3.3507080078125, -3.16424560546875, -2.977783203125, -2.79132080078125, -2.6048583984375, -2.41839599609375, -2.23193359375, -2.04547119140625, -1.8590087890625, -1.67254638671875, -1.486083984375, -1.29962158203125, -1.1131591796875, -0.92669677734375, -0.740234375, -0.55377197265625, -0.3673095703125, -0.18084716796875, 0.005615234375, 0.19207763671875, 0.3785400390625, 0.56500244140625, 0.75146484375, 0.93792724609375, 1.1243896484375, 1.31085205078125, 1.497314453125, 1.68377685546875, 1.8702392578125, 2.05670166015625, 2.2431640625, 2.42962646484375, 2.6160888671875, 2.80255126953125, 2.989013671875, 3.17547607421875, 3.3619384765625, 3.54840087890625, 3.73486328125, 3.92132568359375, 4.1077880859375, 4.29425048828125, 4.480712890625, 4.66717529296875, 4.8536376953125, 5.04010009765625, 5.2265625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 4.0, 5.0, 5.0, 6.0, 8.0, 10.0, 17.0, 10.0, 12.0, 16.0, 29.0, 32.0, 37.0, 39.0, 45.0, 55.0, 72.0, 53.0, 56.0, 58.0, 59.0, 48.0, 52.0, 40.0, 37.0, 35.0, 38.0, 22.0, 24.0, 11.0, 9.0, 19.0, 7.0, 10.0, 8.0, 9.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.6244354248046875, -1.572113037109375, -1.5197906494140625, -1.46746826171875, -1.4151458740234375, -1.362823486328125, -1.3105010986328125, -1.2581787109375, -1.2058563232421875, -1.153533935546875, -1.1012115478515625, -1.04888916015625, -0.9965667724609375, -0.944244384765625, -0.8919219970703125, -0.839599609375, -0.7872772216796875, -0.734954833984375, -0.6826324462890625, -0.63031005859375, -0.5779876708984375, -0.525665283203125, -0.4733428955078125, -0.4210205078125, -0.3686981201171875, -0.316375732421875, -0.2640533447265625, -0.21173095703125, -0.1594085693359375, -0.107086181640625, -0.0547637939453125, -0.00244140625, 0.0498809814453125, 0.102203369140625, 0.1545257568359375, 0.20684814453125, 0.2591705322265625, 0.311492919921875, 0.3638153076171875, 0.4161376953125, 0.4684600830078125, 0.520782470703125, 0.5731048583984375, 0.62542724609375, 0.6777496337890625, 0.730072021484375, 0.7823944091796875, 0.834716796875, 0.8870391845703125, 0.939361572265625, 0.9916839599609375, 1.04400634765625, 1.0963287353515625, 1.148651123046875, 1.2009735107421875, 1.2532958984375, 1.3056182861328125, 1.357940673828125, 1.4102630615234375, 1.46258544921875, 1.5149078369140625, 1.567230224609375, 1.6195526123046875, 1.671875]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 10.0, 6.0, 8.0, 10.0, 15.0, 34.0, 27.0, 35.0, 62.0, 72.0, 55.0, 106.0, 64.0, 85.0, 85.0, 58.0, 57.0, 40.0, 29.0, 30.0, 26.0, 12.0, 12.0, 12.0, 7.0, 7.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.424373626708984, -20.788061141967773, -20.151748657226562, -19.515438079833984, -18.879125595092773, -18.242813110351562, -17.60650062561035, -16.97018814086914, -16.333877563476562, -15.697565078735352, -15.061253547668457, -14.424941062927246, -13.788629531860352, -13.15231704711914, -12.51600456237793, -11.879693031311035, -11.243380546569824, -10.607068061828613, -9.970756530761719, -9.334444046020508, -8.698132514953613, -8.061820030212402, -7.42550802230835, -6.789196014404297, -6.152884006500244, -5.516571998596191, -4.880259990692139, -4.243947982788086, -3.607635736465454, -2.9713237285614014, -2.3350114822387695, -1.6986994743347168, -1.062387466430664, -0.42607539892196655, 0.21023666858673096, 0.8465487957000732, 1.482860803604126, 2.1191728115081787, 2.7554850578308105, 3.3917970657348633, 4.028109073638916, 4.664421081542969, 5.3007330894470215, 5.937045097351074, 6.573357582092285, 7.20966911315918, 7.845981597900391, 8.482294082641602, 9.118605613708496, 9.754918098449707, 10.391229629516602, 11.027542114257812, 11.663853645324707, 12.300166130065918, 12.936477661132812, 13.572790145874023, 14.209102630615234, 14.845415115356445, 15.48172664642334, 16.118038177490234, 16.754350662231445, 17.390663146972656, 18.026975631713867, 18.663288116455078, 19.299598693847656]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 12.0, 15.0, 9.0, 10.0, 11.0, 15.0, 16.0, 25.0, 23.0, 36.0, 31.0, 23.0, 37.0, 38.0, 42.0, 42.0, 42.0, 43.0, 56.0, 41.0, 43.0, 38.0, 42.0, 29.0, 35.0, 32.0, 28.0, 20.0, 23.0, 24.0, 23.0, 18.0, 13.0, 11.0, 10.0, 6.0, 8.0, 5.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.103266716003418, -9.778627395629883, -9.453987121582031, -9.129347801208496, -8.804708480834961, -8.48006820678711, -8.155428886413574, -7.830789566040039, -7.506149768829346, -7.181509971618652, -6.856870651245117, -6.532230854034424, -6.2075910568237305, -5.882951736450195, -5.558311939239502, -5.233672142028809, -4.909032821655273, -4.58439302444458, -4.259753704071045, -3.9351139068603516, -3.6104743480682373, -3.285834789276123, -2.9611949920654297, -2.6365554332733154, -2.311915874481201, -1.987276315689087, -1.662636637687683, -1.3379969596862793, -1.013357400894165, -0.6887178421020508, -0.364078164100647, -0.039438486099243164, 0.2852001190185547, 0.6098397374153137, 0.9344793558120728, 1.2591190338134766, 1.5837585926055908, 1.908398151397705, 2.2330379486083984, 2.5576775074005127, 2.882317066192627, 3.206956624984741, 3.5315961837768555, 3.856235980987549, 4.180875778198242, 4.505515098571777, 4.830154895782471, 5.154794692993164, 5.479434013366699, 5.804073810577393, 6.128713130950928, 6.453352928161621, 6.777992248535156, 7.10263204574585, 7.427271842956543, 7.751911163330078, 8.07655143737793, 8.401190757751465, 8.725831031799316, 9.050470352172852, 9.375109672546387, 9.699748992919922, 10.024389266967773, 10.349028587341309, 10.673667907714844]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 7.0, 9.0, 11.0, 26.0, 39.0, 50.0, 83.0, 130.0, 221.0, 376.0, 526.0, 958.0, 1653.0, 2778.0, 4834.0, 9411.0, 18181.0, 37915.0, 89344.0, 246570.0, 767942.0, 1566736.0, 945965.0, 303975.0, 106057.0, 43982.0, 21002.0, 10853.0, 5911.0, 3449.0, 1949.0, 1220.0, 773.0, 455.0, 288.0, 191.0, 139.0, 81.0, 55.0, 33.0, 34.0, 26.0, 12.0, 11.0, 12.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.174560546875, -16.55224609375, -15.929931640625, -15.3076171875, -14.685302734375, -14.06298828125, -13.440673828125, -12.818359375, -12.196044921875, -11.57373046875, -10.951416015625, -10.3291015625, -9.706787109375, -9.08447265625, -8.462158203125, -7.83984375, -7.217529296875, -6.59521484375, -5.972900390625, -5.3505859375, -4.728271484375, -4.10595703125, -3.483642578125, -2.861328125, -2.239013671875, -1.61669921875, -0.994384765625, -0.3720703125, 0.250244140625, 0.87255859375, 1.494873046875, 2.1171875, 2.739501953125, 3.36181640625, 3.984130859375, 4.6064453125, 5.228759765625, 5.85107421875, 6.473388671875, 7.095703125, 7.718017578125, 8.34033203125, 8.962646484375, 9.5849609375, 10.207275390625, 10.82958984375, 11.451904296875, 12.07421875, 12.696533203125, 13.31884765625, 13.941162109375, 14.5634765625, 15.185791015625, 15.80810546875, 16.430419921875, 17.052734375, 17.675048828125, 18.29736328125, 18.919677734375, 19.5419921875, 20.164306640625, 20.78662109375, 21.408935546875, 22.03125]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 13.0, 9.0, 6.0, 9.0, 19.0, 15.0, 16.0, 13.0, 29.0, 23.0, 23.0, 37.0, 40.0, 28.0, 34.0, 41.0, 53.0, 47.0, 52.0, 46.0, 50.0, 31.0, 38.0, 36.0, 41.0, 44.0, 31.0, 23.0, 23.0, 18.0, 14.0, 14.0, 16.0, 18.0, 14.0, 7.0, 8.0, 1.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.80078125, -7.5643310546875, -7.327880859375, -7.0914306640625, -6.85498046875, -6.6185302734375, -6.382080078125, -6.1456298828125, -5.9091796875, -5.6727294921875, -5.436279296875, -5.1998291015625, -4.96337890625, -4.7269287109375, -4.490478515625, -4.2540283203125, -4.017578125, -3.7811279296875, -3.544677734375, -3.3082275390625, -3.07177734375, -2.8353271484375, -2.598876953125, -2.3624267578125, -2.1259765625, -1.8895263671875, -1.653076171875, -1.4166259765625, -1.18017578125, -0.9437255859375, -0.707275390625, -0.4708251953125, -0.234375, 0.0020751953125, 0.238525390625, 0.4749755859375, 0.71142578125, 0.9478759765625, 1.184326171875, 1.4207763671875, 1.6572265625, 1.8936767578125, 2.130126953125, 2.3665771484375, 2.60302734375, 2.8394775390625, 3.075927734375, 3.3123779296875, 3.548828125, 3.7852783203125, 4.021728515625, 4.2581787109375, 4.49462890625, 4.7310791015625, 4.967529296875, 5.2039794921875, 5.4404296875, 5.6768798828125, 5.913330078125, 6.1497802734375, 6.38623046875, 6.6226806640625, 6.859130859375, 7.0955810546875, 7.33203125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 7.0, 15.0, 13.0, 27.0, 29.0, 58.0, 75.0, 131.0, 165.0, 294.0, 555.0, 828.0, 1336.0, 2496.0, 4316.0, 7730.0, 14799.0, 28969.0, 60967.0, 133080.0, 319203.0, 787922.0, 1337836.0, 861923.0, 352834.0, 146366.0, 65724.0, 31464.0, 15981.0, 8545.0, 4535.0, 2478.0, 1445.0, 813.0, 473.0, 310.0, 195.0, 120.0, 89.0, 43.0, 36.0, 17.0, 13.0, 9.0, 3.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.828125, -17.24462890625, -16.6611328125, -16.07763671875, -15.494140625, -14.91064453125, -14.3271484375, -13.74365234375, -13.16015625, -12.57666015625, -11.9931640625, -11.40966796875, -10.826171875, -10.24267578125, -9.6591796875, -9.07568359375, -8.4921875, -7.90869140625, -7.3251953125, -6.74169921875, -6.158203125, -5.57470703125, -4.9912109375, -4.40771484375, -3.82421875, -3.24072265625, -2.6572265625, -2.07373046875, -1.490234375, -0.90673828125, -0.3232421875, 0.26025390625, 0.84375, 1.42724609375, 2.0107421875, 2.59423828125, 3.177734375, 3.76123046875, 4.3447265625, 4.92822265625, 5.51171875, 6.09521484375, 6.6787109375, 7.26220703125, 7.845703125, 8.42919921875, 9.0126953125, 9.59619140625, 10.1796875, 10.76318359375, 11.3466796875, 11.93017578125, 12.513671875, 13.09716796875, 13.6806640625, 14.26416015625, 14.84765625, 15.43115234375, 16.0146484375, 16.59814453125, 17.181640625, 17.76513671875, 18.3486328125, 18.93212890625, 19.515625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 7.0, 12.0, 13.0, 22.0, 33.0, 36.0, 48.0, 53.0, 60.0, 96.0, 108.0, 163.0, 216.0, 285.0, 310.0, 325.0, 387.0, 325.0, 349.0, 251.0, 221.0, 189.0, 120.0, 112.0, 76.0, 66.0, 47.0, 33.0, 39.0, 21.0, 10.0, 9.0, 8.0, 5.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94140625, -5.76904296875, -5.5966796875, -5.42431640625, -5.251953125, -5.07958984375, -4.9072265625, -4.73486328125, -4.5625, -4.39013671875, -4.2177734375, -4.04541015625, -3.873046875, -3.70068359375, -3.5283203125, -3.35595703125, -3.18359375, -3.01123046875, -2.8388671875, -2.66650390625, -2.494140625, -2.32177734375, -2.1494140625, -1.97705078125, -1.8046875, -1.63232421875, -1.4599609375, -1.28759765625, -1.115234375, -0.94287109375, -0.7705078125, -0.59814453125, -0.42578125, -0.25341796875, -0.0810546875, 0.09130859375, 0.263671875, 0.43603515625, 0.6083984375, 0.78076171875, 0.953125, 1.12548828125, 1.2978515625, 1.47021484375, 1.642578125, 1.81494140625, 1.9873046875, 2.15966796875, 2.33203125, 2.50439453125, 2.6767578125, 2.84912109375, 3.021484375, 3.19384765625, 3.3662109375, 3.53857421875, 3.7109375, 3.88330078125, 4.0556640625, 4.22802734375, 4.400390625, 4.57275390625, 4.7451171875, 4.91748046875, 5.08984375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 4.0, 7.0, 8.0, 6.0, 15.0, 30.0, 22.0, 45.0, 54.0, 64.0, 69.0, 80.0, 112.0, 86.0, 86.0, 65.0, 62.0, 32.0, 38.0, 27.0, 24.0, 12.0, 8.0, 7.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-28.235580444335938, -27.558937072753906, -26.882291793823242, -26.20564842224121, -25.529003143310547, -24.852359771728516, -24.175716400146484, -23.499073028564453, -22.82242774963379, -22.145784378051758, -21.469139099121094, -20.792495727539062, -20.11585235595703, -19.439207077026367, -18.762563705444336, -18.085918426513672, -17.40927505493164, -16.73263168334961, -16.055986404418945, -15.379343032836914, -14.702698707580566, -14.026054382324219, -13.349411010742188, -12.67276668548584, -11.996122360229492, -11.319478034973145, -10.642833709716797, -9.966190338134766, -9.289546012878418, -8.61290168762207, -7.936257839202881, -7.259613990783691, -6.582969665527344, -5.906325340270996, -5.229681491851807, -4.553037643432617, -3.8763933181762695, -3.199749231338501, -2.5231051445007324, -1.846461296081543, -1.1698169708251953, -0.49317288398742676, 0.1834712028503418, 0.8601152896881104, 1.536759376525879, 2.2134034633636475, 2.890047550201416, 3.5666913986206055, 4.243335723876953, 4.919980049133301, 5.59662389755249, 6.27326774597168, 6.949912071228027, 7.626556396484375, 8.303199768066406, 8.979844093322754, 9.656488418579102, 10.33313274383545, 11.009777069091797, 11.686420440673828, 12.363064765930176, 13.039709091186523, 13.716352462768555, 14.392996788024902, 15.06964111328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 3.0, 2.0, 2.0, 8.0, 7.0, 13.0, 10.0, 14.0, 11.0, 16.0, 19.0, 26.0, 33.0, 31.0, 28.0, 29.0, 42.0, 34.0, 51.0, 41.0, 35.0, 35.0, 40.0, 32.0, 36.0, 33.0, 30.0, 37.0, 31.0, 27.0, 33.0, 33.0, 26.0, 23.0, 20.0, 22.0, 19.0, 16.0, 9.0, 5.0, 10.0, 2.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-9.291252136230469, -9.004437446594238, -8.717622756958008, -8.430808067321777, -8.143993377685547, -7.857179164886475, -7.570364475250244, -7.283550262451172, -6.996735572814941, -6.709920883178711, -6.4231061935424805, -6.13629150390625, -5.849477291107178, -5.562662601470947, -5.275847911834717, -4.9890336990356445, -4.702218532562256, -4.415403842926025, -4.128589153289795, -3.8417747020721436, -3.554960250854492, -3.2681455612182617, -2.9813308715820312, -2.69451642036438, -2.4077017307281494, -2.120887041091919, -1.8340725898742676, -1.547257900238037, -1.2604433298110962, -0.9736287593841553, -0.6868140697479248, -0.39999961853027344, -0.11318492889404297, 0.17362967133522034, 0.46044427156448364, 0.7472589015960693, 1.0340734720230103, 1.3208880424499512, 1.6077027320861816, 1.894517183303833, 2.1813318729400635, 2.468146562576294, 2.7549610137939453, 3.041775703430176, 3.3285903930664062, 3.6154048442840576, 3.902219533920288, 4.1890339851379395, 4.47584867477417, 4.7626633644104, 5.049478054046631, 5.336292266845703, 5.623106956481934, 5.909921646118164, 6.1967363357543945, 6.483551025390625, 6.7703657150268555, 7.057180404663086, 7.343995094299316, 7.630809783935547, 7.917623996734619, 8.204439163208008, 8.491252899169922, 8.778067588806152, 9.064882278442383]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 7.0, 5.0, 7.0, 13.0, 20.0, 22.0, 43.0, 61.0, 97.0, 152.0, 245.0, 399.0, 602.0, 1031.0, 1702.0, 2763.0, 4874.0, 8141.0, 14762.0, 26435.0, 49547.0, 90515.0, 155806.0, 217254.0, 195821.0, 124256.0, 69010.0, 37480.0, 20310.0, 11357.0, 6449.0, 3686.0, 2199.0, 1311.0, 784.0, 519.0, 303.0, 187.0, 129.0, 82.0, 61.0, 35.0, 31.0, 14.0, 11.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.46875, -8.218017578125, -7.96728515625, -7.716552734375, -7.4658203125, -7.215087890625, -6.96435546875, -6.713623046875, -6.462890625, -6.212158203125, -5.96142578125, -5.710693359375, -5.4599609375, -5.209228515625, -4.95849609375, -4.707763671875, -4.45703125, -4.206298828125, -3.95556640625, -3.704833984375, -3.4541015625, -3.203369140625, -2.95263671875, -2.701904296875, -2.451171875, -2.200439453125, -1.94970703125, -1.698974609375, -1.4482421875, -1.197509765625, -0.94677734375, -0.696044921875, -0.4453125, -0.194580078125, 0.05615234375, 0.306884765625, 0.5576171875, 0.808349609375, 1.05908203125, 1.309814453125, 1.560546875, 1.811279296875, 2.06201171875, 2.312744140625, 2.5634765625, 2.814208984375, 3.06494140625, 3.315673828125, 3.56640625, 3.817138671875, 4.06787109375, 4.318603515625, 4.5693359375, 4.820068359375, 5.07080078125, 5.321533203125, 5.572265625, 5.822998046875, 6.07373046875, 6.324462890625, 6.5751953125, 6.825927734375, 7.07666015625, 7.327392578125, 7.578125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 5.0, 8.0, 4.0, 8.0, 10.0, 9.0, 15.0, 17.0, 24.0, 21.0, 23.0, 36.0, 25.0, 27.0, 43.0, 43.0, 46.0, 35.0, 44.0, 43.0, 43.0, 43.0, 37.0, 40.0, 44.0, 28.0, 34.0, 35.0, 29.0, 33.0, 13.0, 19.0, 31.0, 14.0, 13.0, 9.0, 12.0, 9.0, 6.0, 3.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.953125, -10.61474609375, -10.2763671875, -9.93798828125, -9.599609375, -9.26123046875, -8.9228515625, -8.58447265625, -8.24609375, -7.90771484375, -7.5693359375, -7.23095703125, -6.892578125, -6.55419921875, -6.2158203125, -5.87744140625, -5.5390625, -5.20068359375, -4.8623046875, -4.52392578125, -4.185546875, -3.84716796875, -3.5087890625, -3.17041015625, -2.83203125, -2.49365234375, -2.1552734375, -1.81689453125, -1.478515625, -1.14013671875, -0.8017578125, -0.46337890625, -0.125, 0.21337890625, 0.5517578125, 0.89013671875, 1.228515625, 1.56689453125, 1.9052734375, 2.24365234375, 2.58203125, 2.92041015625, 3.2587890625, 3.59716796875, 3.935546875, 4.27392578125, 4.6123046875, 4.95068359375, 5.2890625, 5.62744140625, 5.9658203125, 6.30419921875, 6.642578125, 6.98095703125, 7.3193359375, 7.65771484375, 7.99609375, 8.33447265625, 8.6728515625, 9.01123046875, 9.349609375, 9.68798828125, 10.0263671875, 10.36474609375, 10.703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 11.0, 15.0, 26.0, 32.0, 45.0, 70.0, 109.0, 194.0, 258.0, 389.0, 596.0, 887.0, 1397.0, 2366.0, 4006.0, 6628.0, 12461.0, 23738.0, 47877.0, 101055.0, 207705.0, 285017.0, 180179.0, 85606.0, 40910.0, 20507.0, 11011.0, 6019.0, 3532.0, 2082.0, 1389.0, 803.0, 593.0, 333.0, 247.0, 151.0, 111.0, 61.0, 32.0, 38.0, 27.0, 16.0, 6.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.3515625, -9.9993896484375, -9.647216796875, -9.2950439453125, -8.94287109375, -8.5906982421875, -8.238525390625, -7.8863525390625, -7.5341796875, -7.1820068359375, -6.829833984375, -6.4776611328125, -6.12548828125, -5.7733154296875, -5.421142578125, -5.0689697265625, -4.716796875, -4.3646240234375, -4.012451171875, -3.6602783203125, -3.30810546875, -2.9559326171875, -2.603759765625, -2.2515869140625, -1.8994140625, -1.5472412109375, -1.195068359375, -0.8428955078125, -0.49072265625, -0.1385498046875, 0.213623046875, 0.5657958984375, 0.91796875, 1.2701416015625, 1.622314453125, 1.9744873046875, 2.32666015625, 2.6788330078125, 3.031005859375, 3.3831787109375, 3.7353515625, 4.0875244140625, 4.439697265625, 4.7918701171875, 5.14404296875, 5.4962158203125, 5.848388671875, 6.2005615234375, 6.552734375, 6.9049072265625, 7.257080078125, 7.6092529296875, 7.96142578125, 8.3135986328125, 8.665771484375, 9.0179443359375, 9.3701171875, 9.7222900390625, 10.074462890625, 10.4266357421875, 10.77880859375, 11.1309814453125, 11.483154296875, 11.8353271484375, 12.1875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 4.0, 8.0, 10.0, 14.0, 11.0, 13.0, 13.0, 16.0, 23.0, 24.0, 23.0, 29.0, 38.0, 44.0, 35.0, 39.0, 39.0, 30.0, 38.0, 42.0, 51.0, 35.0, 37.0, 50.0, 44.0, 29.0, 32.0, 29.0, 25.0, 25.0, 23.0, 20.0, 19.0, 13.0, 9.0, 13.0, 9.0, 4.0, 11.0, 6.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.6636962890625, -6.468017578125, -6.2723388671875, -6.07666015625, -5.8809814453125, -5.685302734375, -5.4896240234375, -5.2939453125, -5.0982666015625, -4.902587890625, -4.7069091796875, -4.51123046875, -4.3155517578125, -4.119873046875, -3.9241943359375, -3.728515625, -3.5328369140625, -3.337158203125, -3.1414794921875, -2.94580078125, -2.7501220703125, -2.554443359375, -2.3587646484375, -2.1630859375, -1.9674072265625, -1.771728515625, -1.5760498046875, -1.38037109375, -1.1846923828125, -0.989013671875, -0.7933349609375, -0.59765625, -0.4019775390625, -0.206298828125, -0.0106201171875, 0.18505859375, 0.3807373046875, 0.576416015625, 0.7720947265625, 0.9677734375, 1.1634521484375, 1.359130859375, 1.5548095703125, 1.75048828125, 1.9461669921875, 2.141845703125, 2.3375244140625, 2.533203125, 2.7288818359375, 2.924560546875, 3.1202392578125, 3.31591796875, 3.5115966796875, 3.707275390625, 3.9029541015625, 4.0986328125, 4.2943115234375, 4.489990234375, 4.6856689453125, 4.88134765625, 5.0770263671875, 5.272705078125, 5.4683837890625, 5.6640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 11.0, 12.0, 20.0, 33.0, 28.0, 41.0, 55.0, 65.0, 112.0, 152.0, 198.0, 267.0, 402.0, 669.0, 954.0, 1647.0, 2659.0, 4605.0, 8798.0, 18342.0, 44058.0, 124305.0, 366112.0, 305867.0, 98450.0, 36071.0, 15669.0, 7947.0, 4180.0, 2498.0, 1471.0, 946.0, 590.0, 370.0, 271.0, 198.0, 129.0, 95.0, 69.0, 50.0, 39.0, 20.0, 19.0, 12.0, 14.0, 6.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.4609375, -5.28973388671875, -5.1185302734375, -4.94732666015625, -4.776123046875, -4.60491943359375, -4.4337158203125, -4.26251220703125, -4.09130859375, -3.92010498046875, -3.7489013671875, -3.57769775390625, -3.406494140625, -3.23529052734375, -3.0640869140625, -2.89288330078125, -2.7216796875, -2.55047607421875, -2.3792724609375, -2.20806884765625, -2.036865234375, -1.86566162109375, -1.6944580078125, -1.52325439453125, -1.35205078125, -1.18084716796875, -1.0096435546875, -0.83843994140625, -0.667236328125, -0.49603271484375, -0.3248291015625, -0.15362548828125, 0.017578125, 0.18878173828125, 0.3599853515625, 0.53118896484375, 0.702392578125, 0.87359619140625, 1.0447998046875, 1.21600341796875, 1.38720703125, 1.55841064453125, 1.7296142578125, 1.90081787109375, 2.072021484375, 2.24322509765625, 2.4144287109375, 2.58563232421875, 2.7568359375, 2.92803955078125, 3.0992431640625, 3.27044677734375, 3.441650390625, 3.61285400390625, 3.7840576171875, 3.95526123046875, 4.12646484375, 4.29766845703125, 4.4688720703125, 4.64007568359375, 4.811279296875, 4.98248291015625, 5.1536865234375, 5.32489013671875, 5.49609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 6.0, 8.0, 5.0, 6.0, 18.0, 25.0, 38.0, 69.0, 126.0, 136.0, 162.0, 154.0, 99.0, 45.0, 35.0, 14.0, 17.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0005412101745605469, -0.0005239173769950867, -0.0005066245794296265, -0.0004893317818641663, -0.00047203898429870605, -0.00045474618673324585, -0.00043745338916778564, -0.00042016059160232544, -0.00040286779403686523, -0.00038557499647140503, -0.0003682821989059448, -0.0003509894013404846, -0.0003336966037750244, -0.0003164038062095642, -0.000299111008644104, -0.0002818182110786438, -0.0002645254135131836, -0.0002472326159477234, -0.00022993981838226318, -0.00021264702081680298, -0.00019535422325134277, -0.00017806142568588257, -0.00016076862812042236, -0.00014347583055496216, -0.00012618303298950195, -0.00010889023542404175, -9.159743785858154e-05, -7.430464029312134e-05, -5.701184272766113e-05, -3.971904516220093e-05, -2.2426247596740723e-05, -5.133450031280518e-06, 1.2159347534179688e-05, 2.9452145099639893e-05, 4.67449426651001e-05, 6.40377402305603e-05, 8.133053779602051e-05, 9.862333536148071e-05, 0.00011591613292694092, 0.00013320893049240112, 0.00015050172805786133, 0.00016779452562332153, 0.00018508732318878174, 0.00020238012075424194, 0.00021967291831970215, 0.00023696571588516235, 0.00025425851345062256, 0.00027155131101608276, 0.00028884410858154297, 0.0003061369061470032, 0.0003234297037124634, 0.0003407225012779236, 0.0003580152988433838, 0.000375308096408844, 0.0003926008939743042, 0.0004098936915397644, 0.0004271864891052246, 0.0004444792866706848, 0.000461772084236145, 0.0004790648818016052, 0.0004963576793670654, 0.0005136504769325256, 0.0005309432744979858, 0.000548236072063446, 0.0005655288696289062]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 11.0, 15.0, 16.0, 22.0, 42.0, 82.0, 87.0, 142.0, 190.0, 309.0, 501.0, 781.0, 1297.0, 2263.0, 3841.0, 7277.0, 14032.0, 29037.0, 68265.0, 169363.0, 315911.0, 244777.0, 104837.0, 43362.0, 19831.0, 9749.0, 5312.0, 2846.0, 1648.0, 950.0, 641.0, 382.0, 252.0, 137.0, 119.0, 88.0, 46.0, 30.0, 24.0, 12.0, 9.0, 10.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.0078125, -4.859375, -4.7109375, -4.5625, -4.4140625, -4.265625, -4.1171875, -3.96875, -3.8203125, -3.671875, -3.5234375, -3.375, -3.2265625, -3.078125, -2.9296875, -2.78125, -2.6328125, -2.484375, -2.3359375, -2.1875, -2.0390625, -1.890625, -1.7421875, -1.59375, -1.4453125, -1.296875, -1.1484375, -1.0, -0.8515625, -0.703125, -0.5546875, -0.40625, -0.2578125, -0.109375, 0.0390625, 0.1875, 0.3359375, 0.484375, 0.6328125, 0.78125, 0.9296875, 1.078125, 1.2265625, 1.375, 1.5234375, 1.671875, 1.8203125, 1.96875, 2.1171875, 2.265625, 2.4140625, 2.5625, 2.7109375, 2.859375, 3.0078125, 3.15625, 3.3046875, 3.453125, 3.6015625, 3.75, 3.8984375, 4.046875, 4.1953125, 4.34375, 4.4921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 7.0, 6.0, 10.0, 8.0, 12.0, 18.0, 10.0, 11.0, 27.0, 28.0, 28.0, 37.0, 52.0, 50.0, 64.0, 62.0, 64.0, 73.0, 65.0, 43.0, 52.0, 34.0, 35.0, 44.0, 22.0, 21.0, 22.0, 15.0, 15.0, 6.0, 10.0, 6.0, 5.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.9990234375, -0.9684524536132812, -0.9378814697265625, -0.9073104858398438, -0.876739501953125, -0.8461685180664062, -0.8155975341796875, -0.7850265502929688, -0.75445556640625, -0.7238845825195312, -0.6933135986328125, -0.6627426147460938, -0.632171630859375, -0.6016006469726562, -0.5710296630859375, -0.5404586791992188, -0.5098876953125, -0.47931671142578125, -0.4487457275390625, -0.41817474365234375, -0.387603759765625, -0.35703277587890625, -0.3264617919921875, -0.29589080810546875, -0.26531982421875, -0.23474884033203125, -0.2041778564453125, -0.17360687255859375, -0.143035888671875, -0.11246490478515625, -0.0818939208984375, -0.05132293701171875, -0.020751953125, 0.00981903076171875, 0.0403900146484375, 0.07096099853515625, 0.101531982421875, 0.13210296630859375, 0.1626739501953125, 0.19324493408203125, 0.22381591796875, 0.25438690185546875, 0.2849578857421875, 0.31552886962890625, 0.346099853515625, 0.37667083740234375, 0.4072418212890625, 0.43781280517578125, 0.4683837890625, 0.49895477294921875, 0.5295257568359375, 0.5600967407226562, 0.590667724609375, 0.6212387084960938, 0.6518096923828125, 0.6823806762695312, 0.71295166015625, 0.7435226440429688, 0.7740936279296875, 0.8046646118164062, 0.835235595703125, 0.8658065795898438, 0.8963775634765625, 0.9269485473632812, 0.95751953125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 1.0, 9.0, 13.0, 7.0, 13.0, 15.0, 32.0, 35.0, 38.0, 72.0, 79.0, 92.0, 89.0, 92.0, 91.0, 73.0, 52.0, 53.0, 36.0, 30.0, 17.0, 19.0, 9.0, 3.0, 12.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.266084671020508, -28.569189071655273, -27.872295379638672, -27.175399780273438, -26.478504180908203, -25.7816104888916, -25.084714889526367, -24.387821197509766, -23.69092559814453, -22.994029998779297, -22.297136306762695, -21.60024070739746, -20.90334701538086, -20.206451416015625, -19.50955581665039, -18.812660217285156, -18.115766525268555, -17.41887092590332, -16.72197723388672, -16.025081634521484, -15.328186988830566, -14.631292343139648, -13.934396743774414, -13.237502098083496, -12.540607452392578, -11.84371280670166, -11.146818161010742, -10.449922561645508, -9.75302791595459, -9.056133270263672, -8.359237670898438, -7.6623430252075195, -6.965449333190918, -6.2685546875, -5.571659564971924, -4.874764442443848, -4.17786979675293, -3.4809749126434326, -2.7840800285339355, -2.0871849060058594, -1.3902902603149414, -0.6933953762054443, 0.0034995079040527344, 0.7003943920135498, 1.3972892761230469, 2.094184160232544, 2.791079044342041, 3.487974166870117, 4.184868812561035, 4.881763458251953, 5.578658580780029, 6.2755537033081055, 6.972448348999023, 7.669342994689941, 8.36623764038086, 9.063133239746094, 9.760027885437012, 10.45692253112793, 11.153818130493164, 11.850712776184082, 12.547607421875, 13.244502067565918, 13.941396713256836, 14.63829231262207, 15.335186958312988]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 6.0, 0.0, 2.0, 9.0, 8.0, 13.0, 13.0, 10.0, 7.0, 21.0, 27.0, 30.0, 26.0, 31.0, 27.0, 33.0, 39.0, 45.0, 40.0, 39.0, 40.0, 35.0, 41.0, 42.0, 36.0, 27.0, 32.0, 35.0, 38.0, 23.0, 33.0, 29.0, 28.0, 17.0, 25.0, 19.0, 17.0, 10.0, 9.0, 5.0, 6.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.192453384399414, -8.90573501586914, -8.61901569366455, -8.332297325134277, -8.045578002929688, -7.758859634399414, -7.472140789031982, -7.185421943664551, -6.898703098297119, -6.6119842529296875, -6.325265407562256, -6.038546562194824, -5.751828193664551, -5.465108871459961, -5.1783905029296875, -4.891671657562256, -4.604952812194824, -4.318233966827393, -4.031515121459961, -3.7447965145111084, -3.4580776691436768, -3.171358823776245, -2.8846402168273926, -2.597921371459961, -2.3112025260925293, -2.0244836807250977, -1.7377649545669556, -1.4510462284088135, -1.1643273830413818, -0.8776085376739502, -0.5908898115158081, -0.304171085357666, -0.017452239990234375, 0.2692665457725525, 0.5559853315353394, 0.8427041172981262, 1.129422903060913, 1.4161417484283447, 1.7028604745864868, 1.989579200744629, 2.2762980461120605, 2.563016891479492, 2.849735736846924, 3.1364543437957764, 3.423173189163208, 3.7098920345306396, 3.996610641479492, 4.283329486846924, 4.5700483322143555, 4.856767177581787, 5.143486022949219, 5.43020486831665, 5.716923713684082, 6.0036420822143555, 6.290360927581787, 6.577079772949219, 6.86379861831665, 7.150517463684082, 7.437236309051514, 7.723955154418945, 8.010673522949219, 8.297392845153809, 8.584111213684082, 8.870830535888672, 9.157548904418945]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 12.0, 6.0, 12.0, 13.0, 23.0, 33.0, 64.0, 92.0, 124.0, 229.0, 386.0, 595.0, 1093.0, 2045.0, 3571.0, 6764.0, 12645.0, 24790.0, 49223.0, 94410.0, 164942.0, 223707.0, 199922.0, 125215.0, 67159.0, 34202.0, 17390.0, 9163.0, 4789.0, 2543.0, 1412.0, 791.0, 473.0, 281.0, 133.0, 102.0, 55.0, 47.0, 31.0, 20.0, 14.0, 12.0, 5.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.84375, -15.3597412109375, -14.875732421875, -14.3917236328125, -13.90771484375, -13.4237060546875, -12.939697265625, -12.4556884765625, -11.9716796875, -11.4876708984375, -11.003662109375, -10.5196533203125, -10.03564453125, -9.5516357421875, -9.067626953125, -8.5836181640625, -8.099609375, -7.6156005859375, -7.131591796875, -6.6475830078125, -6.16357421875, -5.6795654296875, -5.195556640625, -4.7115478515625, -4.2275390625, -3.7435302734375, -3.259521484375, -2.7755126953125, -2.29150390625, -1.8074951171875, -1.323486328125, -0.8394775390625, -0.35546875, 0.1285400390625, 0.612548828125, 1.0965576171875, 1.58056640625, 2.0645751953125, 2.548583984375, 3.0325927734375, 3.5166015625, 4.0006103515625, 4.484619140625, 4.9686279296875, 5.45263671875, 5.9366455078125, 6.420654296875, 6.9046630859375, 7.388671875, 7.8726806640625, 8.356689453125, 8.8406982421875, 9.32470703125, 9.8087158203125, 10.292724609375, 10.7767333984375, 11.2607421875, 11.7447509765625, 12.228759765625, 12.7127685546875, 13.19677734375, 13.6807861328125, 14.164794921875, 14.6488037109375, 15.1328125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 3.0, 5.0, 8.0, 7.0, 11.0, 6.0, 25.0, 23.0, 25.0, 24.0, 34.0, 29.0, 28.0, 35.0, 36.0, 34.0, 50.0, 40.0, 34.0, 48.0, 43.0, 35.0, 33.0, 31.0, 32.0, 36.0, 25.0, 36.0, 26.0, 25.0, 22.0, 16.0, 18.0, 23.0, 18.0, 17.0, 10.0, 7.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.1640625, -8.865234375, -8.56640625, -8.267578125, -7.96875, -7.669921875, -7.37109375, -7.072265625, -6.7734375, -6.474609375, -6.17578125, -5.876953125, -5.578125, -5.279296875, -4.98046875, -4.681640625, -4.3828125, -4.083984375, -3.78515625, -3.486328125, -3.1875, -2.888671875, -2.58984375, -2.291015625, -1.9921875, -1.693359375, -1.39453125, -1.095703125, -0.796875, -0.498046875, -0.19921875, 0.099609375, 0.3984375, 0.697265625, 0.99609375, 1.294921875, 1.59375, 1.892578125, 2.19140625, 2.490234375, 2.7890625, 3.087890625, 3.38671875, 3.685546875, 3.984375, 4.283203125, 4.58203125, 4.880859375, 5.1796875, 5.478515625, 5.77734375, 6.076171875, 6.375, 6.673828125, 6.97265625, 7.271484375, 7.5703125, 7.869140625, 8.16796875, 8.466796875, 8.765625, 9.064453125, 9.36328125, 9.662109375, 9.9609375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 16.0, 14.0, 31.0, 38.0, 58.0, 87.0, 101.0, 158.0, 239.0, 360.0, 591.0, 1046.0, 1801.0, 3528.0, 7262.0, 15189.0, 34124.0, 77476.0, 165722.0, 262636.0, 236566.0, 131533.0, 59839.0, 25996.0, 11744.0, 5628.0, 2848.0, 1522.0, 883.0, 517.0, 326.0, 220.0, 132.0, 97.0, 51.0, 46.0, 32.0, 18.0, 17.0, 17.0, 12.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-20.59375, -19.985107421875, -19.37646484375, -18.767822265625, -18.1591796875, -17.550537109375, -16.94189453125, -16.333251953125, -15.724609375, -15.115966796875, -14.50732421875, -13.898681640625, -13.2900390625, -12.681396484375, -12.07275390625, -11.464111328125, -10.85546875, -10.246826171875, -9.63818359375, -9.029541015625, -8.4208984375, -7.812255859375, -7.20361328125, -6.594970703125, -5.986328125, -5.377685546875, -4.76904296875, -4.160400390625, -3.5517578125, -2.943115234375, -2.33447265625, -1.725830078125, -1.1171875, -0.508544921875, 0.10009765625, 0.708740234375, 1.3173828125, 1.926025390625, 2.53466796875, 3.143310546875, 3.751953125, 4.360595703125, 4.96923828125, 5.577880859375, 6.1865234375, 6.795166015625, 7.40380859375, 8.012451171875, 8.62109375, 9.229736328125, 9.83837890625, 10.447021484375, 11.0556640625, 11.664306640625, 12.27294921875, 12.881591796875, 13.490234375, 14.098876953125, 14.70751953125, 15.316162109375, 15.9248046875, 16.533447265625, 17.14208984375, 17.750732421875, 18.359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 11.0, 14.0, 10.0, 17.0, 17.0, 21.0, 27.0, 30.0, 31.0, 33.0, 44.0, 39.0, 52.0, 44.0, 41.0, 56.0, 46.0, 55.0, 38.0, 48.0, 44.0, 37.0, 32.0, 30.0, 29.0, 24.0, 33.0, 14.0, 22.0, 11.0, 8.0, 7.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.40606689453125, -5.1988525390625, -4.99163818359375, -4.784423828125, -4.57720947265625, -4.3699951171875, -4.16278076171875, -3.95556640625, -3.74835205078125, -3.5411376953125, -3.33392333984375, -3.126708984375, -2.91949462890625, -2.7122802734375, -2.50506591796875, -2.2978515625, -2.09063720703125, -1.8834228515625, -1.67620849609375, -1.468994140625, -1.26177978515625, -1.0545654296875, -0.84735107421875, -0.64013671875, -0.43292236328125, -0.2257080078125, -0.01849365234375, 0.188720703125, 0.39593505859375, 0.6031494140625, 0.81036376953125, 1.017578125, 1.22479248046875, 1.4320068359375, 1.63922119140625, 1.846435546875, 2.05364990234375, 2.2608642578125, 2.46807861328125, 2.67529296875, 2.88250732421875, 3.0897216796875, 3.29693603515625, 3.504150390625, 3.71136474609375, 3.9185791015625, 4.12579345703125, 4.3330078125, 4.54022216796875, 4.7474365234375, 4.95465087890625, 5.161865234375, 5.36907958984375, 5.5762939453125, 5.78350830078125, 5.99072265625, 6.19793701171875, 6.4051513671875, 6.61236572265625, 6.819580078125, 7.02679443359375, 7.2340087890625, 7.44122314453125, 7.6484375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 16.0, 21.0, 32.0, 42.0, 80.0, 105.0, 122.0, 182.0, 290.0, 483.0, 621.0, 1000.0, 1668.0, 2887.0, 5355.0, 11363.0, 27406.0, 79215.0, 232230.0, 381140.0, 194350.0, 64866.0, 23346.0, 9948.0, 4870.0, 2626.0, 1547.0, 903.0, 575.0, 421.0, 252.0, 186.0, 126.0, 81.0, 54.0, 45.0, 29.0, 16.0, 18.0, 10.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -7.9752197265625, -7.661376953125, -7.3475341796875, -7.03369140625, -6.7198486328125, -6.406005859375, -6.0921630859375, -5.7783203125, -5.4644775390625, -5.150634765625, -4.8367919921875, -4.52294921875, -4.2091064453125, -3.895263671875, -3.5814208984375, -3.267578125, -2.9537353515625, -2.639892578125, -2.3260498046875, -2.01220703125, -1.6983642578125, -1.384521484375, -1.0706787109375, -0.7568359375, -0.4429931640625, -0.129150390625, 0.1846923828125, 0.49853515625, 0.8123779296875, 1.126220703125, 1.4400634765625, 1.75390625, 2.0677490234375, 2.381591796875, 2.6954345703125, 3.00927734375, 3.3231201171875, 3.636962890625, 3.9508056640625, 4.2646484375, 4.5784912109375, 4.892333984375, 5.2061767578125, 5.52001953125, 5.8338623046875, 6.147705078125, 6.4615478515625, 6.775390625, 7.0892333984375, 7.403076171875, 7.7169189453125, 8.03076171875, 8.3446044921875, 8.658447265625, 8.9722900390625, 9.2861328125, 9.5999755859375, 9.913818359375, 10.2276611328125, 10.54150390625, 10.8553466796875, 11.169189453125, 11.4830322265625, 11.796875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 12.0, 13.0, 22.0, 34.0, 40.0, 51.0, 54.0, 62.0, 96.0, 109.0, 124.0, 104.0, 79.0, 56.0, 34.0, 31.0, 24.0, 14.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010318756103515625, -0.0010039210319519043, -0.0009759664535522461, -0.0009480118751525879, -0.0009200572967529297, -0.0008921027183532715, -0.0008641481399536133, -0.0008361935615539551, -0.0008082389831542969, -0.0007802844047546387, -0.0007523298263549805, -0.0007243752479553223, -0.0006964206695556641, -0.0006684660911560059, -0.0006405115127563477, -0.0006125569343566895, -0.0005846023559570312, -0.000556647777557373, -0.0005286931991577148, -0.0005007386207580566, -0.00047278404235839844, -0.00044482946395874023, -0.00041687488555908203, -0.00038892030715942383, -0.0003609657287597656, -0.0003330111503601074, -0.0003050565719604492, -0.000277101993560791, -0.0002491474151611328, -0.0002211928367614746, -0.0001932382583618164, -0.0001652836799621582, -0.0001373291015625, -0.0001093745231628418, -8.14199447631836e-05, -5.346536636352539e-05, -2.5510787963867188e-05, 2.4437904357910156e-06, 3.039836883544922e-05, 5.835294723510742e-05, 8.630752563476562e-05, 0.00011426210403442383, 0.00014221668243408203, 0.00017017126083374023, 0.00019812583923339844, 0.00022608041763305664, 0.00025403499603271484, 0.00028198957443237305, 0.00030994415283203125, 0.00033789873123168945, 0.00036585330963134766, 0.00039380788803100586, 0.00042176246643066406, 0.00044971704483032227, 0.00047767162322998047, 0.0005056262016296387, 0.0005335807800292969, 0.0005615353584289551, 0.0005894899368286133, 0.0006174445152282715, 0.0006453990936279297, 0.0006733536720275879, 0.0007013082504272461, 0.0007292628288269043, 0.0007572174072265625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 2.0, 3.0, 4.0, 5.0, 10.0, 16.0, 17.0, 20.0, 27.0, 27.0, 56.0, 64.0, 66.0, 112.0, 173.0, 225.0, 351.0, 512.0, 772.0, 1192.0, 1795.0, 3057.0, 5040.0, 8829.0, 16441.0, 30709.0, 62295.0, 123674.0, 219309.0, 247141.0, 157876.0, 80147.0, 40489.0, 20792.0, 11042.0, 6151.0, 3606.0, 2221.0, 1377.0, 924.0, 604.0, 411.0, 278.0, 213.0, 146.0, 101.0, 72.0, 54.0, 38.0, 28.0, 16.0, 9.0, 6.0, 8.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.4453125, -6.2318115234375, -6.018310546875, -5.8048095703125, -5.59130859375, -5.3778076171875, -5.164306640625, -4.9508056640625, -4.7373046875, -4.5238037109375, -4.310302734375, -4.0968017578125, -3.88330078125, -3.6697998046875, -3.456298828125, -3.2427978515625, -3.029296875, -2.8157958984375, -2.602294921875, -2.3887939453125, -2.17529296875, -1.9617919921875, -1.748291015625, -1.5347900390625, -1.3212890625, -1.1077880859375, -0.894287109375, -0.6807861328125, -0.46728515625, -0.2537841796875, -0.040283203125, 0.1732177734375, 0.38671875, 0.6002197265625, 0.813720703125, 1.0272216796875, 1.24072265625, 1.4542236328125, 1.667724609375, 1.8812255859375, 2.0947265625, 2.3082275390625, 2.521728515625, 2.7352294921875, 2.94873046875, 3.1622314453125, 3.375732421875, 3.5892333984375, 3.802734375, 4.0162353515625, 4.229736328125, 4.4432373046875, 4.65673828125, 4.8702392578125, 5.083740234375, 5.2972412109375, 5.5107421875, 5.7242431640625, 5.937744140625, 6.1512451171875, 6.36474609375, 6.5782470703125, 6.791748046875, 7.0052490234375, 7.21875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 10.0, 5.0, 9.0, 14.0, 11.0, 21.0, 35.0, 40.0, 50.0, 48.0, 74.0, 60.0, 93.0, 76.0, 72.0, 67.0, 67.0, 58.0, 41.0, 39.0, 33.0, 13.0, 15.0, 9.0, 10.0, 5.0, 7.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.76171875, -1.6949462890625, -1.628173828125, -1.5614013671875, -1.49462890625, -1.4278564453125, -1.361083984375, -1.2943115234375, -1.2275390625, -1.1607666015625, -1.093994140625, -1.0272216796875, -0.96044921875, -0.8936767578125, -0.826904296875, -0.7601318359375, -0.693359375, -0.6265869140625, -0.559814453125, -0.4930419921875, -0.42626953125, -0.3594970703125, -0.292724609375, -0.2259521484375, -0.1591796875, -0.0924072265625, -0.025634765625, 0.0411376953125, 0.10791015625, 0.1746826171875, 0.241455078125, 0.3082275390625, 0.375, 0.4417724609375, 0.508544921875, 0.5753173828125, 0.64208984375, 0.7088623046875, 0.775634765625, 0.8424072265625, 0.9091796875, 0.9759521484375, 1.042724609375, 1.1094970703125, 1.17626953125, 1.2430419921875, 1.309814453125, 1.3765869140625, 1.443359375, 1.5101318359375, 1.576904296875, 1.6436767578125, 1.71044921875, 1.7772216796875, 1.843994140625, 1.9107666015625, 1.9775390625, 2.0443115234375, 2.111083984375, 2.1778564453125, 2.24462890625, 2.3114013671875, 2.378173828125, 2.4449462890625, 2.51171875]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 17.0, 19.0, 17.0, 35.0, 42.0, 46.0, 74.0, 84.0, 84.0, 99.0, 86.0, 85.0, 67.0, 54.0, 44.0, 42.0, 23.0, 18.0, 13.0, 6.0, 8.0, 11.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0], "bins": [-31.046098709106445, -30.335796356201172, -29.6254940032959, -28.915191650390625, -28.204891204833984, -27.49458885192871, -26.784286499023438, -26.073984146118164, -25.36368179321289, -24.653379440307617, -23.943077087402344, -23.232776641845703, -22.52247428894043, -21.812171936035156, -21.101869583129883, -20.39156723022461, -19.68126678466797, -18.970964431762695, -18.260662078857422, -17.55036163330078, -16.840059280395508, -16.129756927490234, -15.419454574584961, -14.709152221679688, -13.99885082244873, -13.288548469543457, -12.5782470703125, -11.867944717407227, -11.157642364501953, -10.447340965270996, -9.737038612365723, -9.026737213134766, -8.31643295288086, -7.606131076812744, -6.895829200744629, -6.1855268478393555, -5.47522497177124, -4.764923095703125, -4.054620742797852, -3.3443188667297363, -2.634016990661621, -1.9237149953842163, -1.2134130001068115, -0.5031108856201172, 0.20719099044799805, 0.9174928665161133, 1.6277952194213867, 2.338097095489502, 3.048398971557617, 3.7587008476257324, 4.469002723693848, 5.179305076599121, 5.889606952667236, 6.599908828735352, 7.310211181640625, 8.020513534545898, 8.730814933776855, 9.441117286682129, 10.151418685913086, 10.86172103881836, 11.572023391723633, 12.28232479095459, 12.992627143859863, 13.70292854309082, 14.413230895996094]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 0.0, 5.0, 3.0, 8.0, 6.0, 6.0, 17.0, 10.0, 11.0, 21.0, 10.0, 23.0, 21.0, 25.0, 27.0, 35.0, 30.0, 43.0, 44.0, 32.0, 49.0, 33.0, 46.0, 51.0, 33.0, 45.0, 34.0, 36.0, 27.0, 34.0, 27.0, 34.0, 19.0, 14.0, 20.0, 14.0, 19.0, 21.0, 16.0, 7.0, 13.0, 7.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.479201316833496, -8.194890022277832, -7.910579204559326, -7.626267910003662, -7.341957092285156, -7.057645797729492, -6.773334503173828, -6.489023208618164, -6.204712390899658, -5.920401096343994, -5.636090278625488, -5.351778984069824, -5.06746768951416, -4.783156871795654, -4.49884557723999, -4.214534759521484, -3.9302234649658203, -3.6459124088287354, -3.3616013526916504, -3.0772900581359863, -2.7929790019989014, -2.5086679458618164, -2.2243566513061523, -1.9400455951690674, -1.6557345390319824, -1.3714234828948975, -1.087112307548523, -0.8028011918067932, -0.5184900760650635, -0.23417901992797852, 0.050132155418395996, 0.3344433307647705, 0.6187534332275391, 0.9030645489692688, 1.1873756647109985, 1.471686840057373, 1.755997896194458, 2.040308952331543, 2.324620246887207, 2.608931303024292, 2.893242359161377, 3.177553415298462, 3.461864471435547, 3.746175765991211, 4.030487060546875, 4.314797878265381, 4.599109172821045, 4.883419990539551, 5.167731285095215, 5.452042579650879, 5.736353397369385, 6.020664691925049, 6.304975509643555, 6.589286804199219, 6.873598098754883, 7.157909393310547, 7.442220211029053, 7.726531505584717, 8.010842323303223, 8.295153617858887, 8.57946491241455, 8.863775253295898, 9.148086547851562, 9.432397842407227, 9.71670913696289]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 12.0, 24.0, 19.0, 43.0, 52.0, 114.0, 159.0, 220.0, 387.0, 670.0, 1053.0, 1923.0, 3327.0, 5780.0, 10622.0, 20739.0, 44174.0, 104670.0, 282464.0, 846967.0, 1550583.0, 845542.0, 278880.0, 103811.0, 44640.0, 21682.0, 11209.0, 5968.0, 3350.0, 1924.0, 1199.0, 730.0, 450.0, 280.0, 178.0, 140.0, 82.0, 63.0, 45.0, 31.0, 25.0, 13.0, 11.0, 5.0, 6.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.09375, -17.48046875, -16.8671875, -16.25390625, -15.640625, -15.02734375, -14.4140625, -13.80078125, -13.1875, -12.57421875, -11.9609375, -11.34765625, -10.734375, -10.12109375, -9.5078125, -8.89453125, -8.28125, -7.66796875, -7.0546875, -6.44140625, -5.828125, -5.21484375, -4.6015625, -3.98828125, -3.375, -2.76171875, -2.1484375, -1.53515625, -0.921875, -0.30859375, 0.3046875, 0.91796875, 1.53125, 2.14453125, 2.7578125, 3.37109375, 3.984375, 4.59765625, 5.2109375, 5.82421875, 6.4375, 7.05078125, 7.6640625, 8.27734375, 8.890625, 9.50390625, 10.1171875, 10.73046875, 11.34375, 11.95703125, 12.5703125, 13.18359375, 13.796875, 14.41015625, 15.0234375, 15.63671875, 16.25, 16.86328125, 17.4765625, 18.08984375, 18.703125, 19.31640625, 19.9296875, 20.54296875, 21.15625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 10.0, 16.0, 15.0, 22.0, 27.0, 19.0, 33.0, 34.0, 34.0, 29.0, 44.0, 47.0, 41.0, 42.0, 60.0, 32.0, 58.0, 58.0, 45.0, 31.0, 34.0, 33.0, 38.0, 30.0, 18.0, 16.0, 25.0, 18.0, 16.0, 13.0, 15.0, 1.0, 3.0, 7.0, 2.0, 0.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.74609375, -7.506103515625, -7.26611328125, -7.026123046875, -6.7861328125, -6.546142578125, -6.30615234375, -6.066162109375, -5.826171875, -5.586181640625, -5.34619140625, -5.106201171875, -4.8662109375, -4.626220703125, -4.38623046875, -4.146240234375, -3.90625, -3.666259765625, -3.42626953125, -3.186279296875, -2.9462890625, -2.706298828125, -2.46630859375, -2.226318359375, -1.986328125, -1.746337890625, -1.50634765625, -1.266357421875, -1.0263671875, -0.786376953125, -0.54638671875, -0.306396484375, -0.06640625, 0.173583984375, 0.41357421875, 0.653564453125, 0.8935546875, 1.133544921875, 1.37353515625, 1.613525390625, 1.853515625, 2.093505859375, 2.33349609375, 2.573486328125, 2.8134765625, 3.053466796875, 3.29345703125, 3.533447265625, 3.7734375, 4.013427734375, 4.25341796875, 4.493408203125, 4.7333984375, 4.973388671875, 5.21337890625, 5.453369140625, 5.693359375, 5.933349609375, 6.17333984375, 6.413330078125, 6.6533203125, 6.893310546875, 7.13330078125, 7.373291015625, 7.61328125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 10.0, 16.0, 15.0, 26.0, 38.0, 74.0, 101.0, 163.0, 244.0, 447.0, 817.0, 1252.0, 2228.0, 3961.0, 7499.0, 14258.0, 29449.0, 63394.0, 148652.0, 379294.0, 980095.0, 1395510.0, 698977.0, 266398.0, 107184.0, 47493.0, 22408.0, 11121.0, 5843.0, 3113.0, 1756.0, 955.0, 588.0, 347.0, 218.0, 123.0, 96.0, 45.0, 27.0, 22.0, 18.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8125, -20.187744140625, -19.56298828125, -18.938232421875, -18.3134765625, -17.688720703125, -17.06396484375, -16.439208984375, -15.814453125, -15.189697265625, -14.56494140625, -13.940185546875, -13.3154296875, -12.690673828125, -12.06591796875, -11.441162109375, -10.81640625, -10.191650390625, -9.56689453125, -8.942138671875, -8.3173828125, -7.692626953125, -7.06787109375, -6.443115234375, -5.818359375, -5.193603515625, -4.56884765625, -3.944091796875, -3.3193359375, -2.694580078125, -2.06982421875, -1.445068359375, -0.8203125, -0.195556640625, 0.42919921875, 1.053955078125, 1.6787109375, 2.303466796875, 2.92822265625, 3.552978515625, 4.177734375, 4.802490234375, 5.42724609375, 6.052001953125, 6.6767578125, 7.301513671875, 7.92626953125, 8.551025390625, 9.17578125, 9.800537109375, 10.42529296875, 11.050048828125, 11.6748046875, 12.299560546875, 12.92431640625, 13.549072265625, 14.173828125, 14.798583984375, 15.42333984375, 16.048095703125, 16.6728515625, 17.297607421875, 17.92236328125, 18.547119140625, 19.171875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 4.0, 9.0, 8.0, 9.0, 17.0, 20.0, 25.0, 20.0, 34.0, 45.0, 82.0, 97.0, 117.0, 133.0, 191.0, 260.0, 277.0, 300.0, 372.0, 351.0, 325.0, 270.0, 224.0, 208.0, 163.0, 136.0, 85.0, 72.0, 46.0, 51.0, 36.0, 27.0, 25.0, 12.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4296875, -5.26519775390625, -5.1007080078125, -4.93621826171875, -4.771728515625, -4.60723876953125, -4.4427490234375, -4.27825927734375, -4.11376953125, -3.94927978515625, -3.7847900390625, -3.62030029296875, -3.455810546875, -3.29132080078125, -3.1268310546875, -2.96234130859375, -2.7978515625, -2.63336181640625, -2.4688720703125, -2.30438232421875, -2.139892578125, -1.97540283203125, -1.8109130859375, -1.64642333984375, -1.48193359375, -1.31744384765625, -1.1529541015625, -0.98846435546875, -0.823974609375, -0.65948486328125, -0.4949951171875, -0.33050537109375, -0.166015625, -0.00152587890625, 0.1629638671875, 0.32745361328125, 0.491943359375, 0.65643310546875, 0.8209228515625, 0.98541259765625, 1.14990234375, 1.31439208984375, 1.4788818359375, 1.64337158203125, 1.807861328125, 1.97235107421875, 2.1368408203125, 2.30133056640625, 2.4658203125, 2.63031005859375, 2.7947998046875, 2.95928955078125, 3.123779296875, 3.28826904296875, 3.4527587890625, 3.61724853515625, 3.78173828125, 3.94622802734375, 4.1107177734375, 4.27520751953125, 4.439697265625, 4.60418701171875, 4.7686767578125, 4.93316650390625, 5.09765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 7.0, 3.0, 11.0, 6.0, 21.0, 15.0, 28.0, 50.0, 52.0, 84.0, 87.0, 99.0, 93.0, 113.0, 71.0, 74.0, 49.0, 34.0, 27.0, 18.0, 16.0, 17.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.92160415649414, -29.140708923339844, -28.359813690185547, -27.57891845703125, -26.798023223876953, -26.017127990722656, -25.23623275756836, -24.455337524414062, -23.674442291259766, -22.89354705810547, -22.112651824951172, -21.331756591796875, -20.550861358642578, -19.76996612548828, -18.989070892333984, -18.208175659179688, -17.42728042602539, -16.646385192871094, -15.865489959716797, -15.0845947265625, -14.303699493408203, -13.522804260253906, -12.74190902709961, -11.961013793945312, -11.180118560791016, -10.399223327636719, -9.618328094482422, -8.837432861328125, -8.056537628173828, -7.275642395019531, -6.494747161865234, -5.7138519287109375, -4.932958602905273, -4.152063369750977, -3.3711681365966797, -2.590272903442383, -1.809377670288086, -1.028482437133789, -0.2475872039794922, 0.5333080291748047, 1.3142032623291016, 2.0950984954833984, 2.8759937286376953, 3.656888961791992, 4.437784194946289, 5.218679428100586, 5.999574661254883, 6.78046989440918, 7.561365127563477, 8.342260360717773, 9.12315559387207, 9.904050827026367, 10.684946060180664, 11.465841293334961, 12.246736526489258, 13.027631759643555, 13.808526992797852, 14.589422225952148, 15.370317459106445, 16.151212692260742, 16.93210792541504, 17.713003158569336, 18.493898391723633, 19.27479362487793, 20.055688858032227]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 10.0, 13.0, 11.0, 14.0, 13.0, 23.0, 29.0, 27.0, 24.0, 32.0, 30.0, 51.0, 52.0, 43.0, 47.0, 58.0, 51.0, 37.0, 45.0, 50.0, 36.0, 38.0, 25.0, 40.0, 35.0, 23.0, 26.0, 29.0, 21.0, 13.0, 9.0, 4.0, 11.0, 10.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.636570930480957, -10.317435264587402, -9.998299598693848, -9.679163932800293, -9.360027313232422, -9.040891647338867, -8.721755981445312, -8.402620315551758, -8.083484649658203, -7.764348983764648, -7.445213317871094, -7.126077175140381, -6.806941509246826, -6.4878058433532715, -6.168669700622559, -5.849534034729004, -5.530398368835449, -5.2112627029418945, -4.89212703704834, -4.572990894317627, -4.253855228424072, -3.9347195625305176, -3.615583658218384, -3.29644775390625, -2.9773120880126953, -2.6581764221191406, -2.339040517807007, -2.019904613494873, -1.7007689476013184, -1.3816331624984741, -1.0624973773956299, -0.7433614730834961, -0.4242267608642578, -0.10509097576141357, 0.21404480934143066, 0.5331805944442749, 0.8523163795471191, 1.1714521646499634, 1.4905879497528076, 1.8097238540649414, 2.128859519958496, 2.447995185852051, 2.7671310901641846, 3.0862669944763184, 3.405402660369873, 3.7245383262634277, 4.043674468994141, 4.362810134887695, 4.68194580078125, 5.001081466674805, 5.320217132568359, 5.639353275299072, 5.958488941192627, 6.277624607086182, 6.5967607498168945, 6.915896415710449, 7.235032081604004, 7.554167747497559, 7.873303413391113, 8.192439079284668, 8.511575698852539, 8.830711364746094, 9.149847030639648, 9.468982696533203, 9.788118362426758]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 8.0, 11.0, 12.0, 19.0, 28.0, 43.0, 56.0, 99.0, 143.0, 252.0, 406.0, 704.0, 1124.0, 2045.0, 3863.0, 7021.0, 13825.0, 27538.0, 55535.0, 110359.0, 198017.0, 248079.0, 182114.0, 97338.0, 48753.0, 24475.0, 12220.0, 6507.0, 3356.0, 1904.0, 1078.0, 635.0, 386.0, 208.0, 143.0, 90.0, 58.0, 37.0, 31.0, 12.0, 11.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91796875, -6.69049072265625, -6.4630126953125, -6.23553466796875, -6.008056640625, -5.78057861328125, -5.5531005859375, -5.32562255859375, -5.09814453125, -4.87066650390625, -4.6431884765625, -4.41571044921875, -4.188232421875, -3.96075439453125, -3.7332763671875, -3.50579833984375, -3.2783203125, -3.05084228515625, -2.8233642578125, -2.59588623046875, -2.368408203125, -2.14093017578125, -1.9134521484375, -1.68597412109375, -1.45849609375, -1.23101806640625, -1.0035400390625, -0.77606201171875, -0.548583984375, -0.32110595703125, -0.0936279296875, 0.13385009765625, 0.361328125, 0.58880615234375, 0.8162841796875, 1.04376220703125, 1.271240234375, 1.49871826171875, 1.7261962890625, 1.95367431640625, 2.18115234375, 2.40863037109375, 2.6361083984375, 2.86358642578125, 3.091064453125, 3.31854248046875, 3.5460205078125, 3.77349853515625, 4.0009765625, 4.22845458984375, 4.4559326171875, 4.68341064453125, 4.910888671875, 5.13836669921875, 5.3658447265625, 5.59332275390625, 5.82080078125, 6.04827880859375, 6.2757568359375, 6.50323486328125, 6.730712890625, 6.95819091796875, 7.1856689453125, 7.41314697265625, 7.640625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 13.0, 3.0, 16.0, 21.0, 25.0, 19.0, 25.0, 22.0, 26.0, 55.0, 46.0, 51.0, 58.0, 55.0, 52.0, 63.0, 46.0, 54.0, 51.0, 43.0, 36.0, 35.0, 26.0, 25.0, 21.0, 25.0, 17.0, 16.0, 7.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.7611083984375, -10.389404296875, -10.0177001953125, -9.64599609375, -9.2742919921875, -8.902587890625, -8.5308837890625, -8.1591796875, -7.7874755859375, -7.415771484375, -7.0440673828125, -6.67236328125, -6.3006591796875, -5.928955078125, -5.5572509765625, -5.185546875, -4.8138427734375, -4.442138671875, -4.0704345703125, -3.69873046875, -3.3270263671875, -2.955322265625, -2.5836181640625, -2.2119140625, -1.8402099609375, -1.468505859375, -1.0968017578125, -0.72509765625, -0.3533935546875, 0.018310546875, 0.3900146484375, 0.76171875, 1.1334228515625, 1.505126953125, 1.8768310546875, 2.24853515625, 2.6202392578125, 2.991943359375, 3.3636474609375, 3.7353515625, 4.1070556640625, 4.478759765625, 4.8504638671875, 5.22216796875, 5.5938720703125, 5.965576171875, 6.3372802734375, 6.708984375, 7.0806884765625, 7.452392578125, 7.8240966796875, 8.19580078125, 8.5675048828125, 8.939208984375, 9.3109130859375, 9.6826171875, 10.0543212890625, 10.426025390625, 10.7977294921875, 11.16943359375, 11.5411376953125, 11.912841796875, 12.2845458984375, 12.65625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 10.0, 7.0, 12.0, 18.0, 34.0, 35.0, 50.0, 100.0, 108.0, 125.0, 213.0, 287.0, 378.0, 546.0, 793.0, 1089.0, 1563.0, 2230.0, 3284.0, 5009.0, 7914.0, 12558.0, 20082.0, 33487.0, 56356.0, 94729.0, 150515.0, 198292.0, 172163.0, 112091.0, 67612.0, 40598.0, 24006.0, 14575.0, 9110.0, 5988.0, 3939.0, 2624.0, 1723.0, 1237.0, 869.0, 643.0, 435.0, 314.0, 215.0, 195.0, 125.0, 89.0, 62.0, 42.0, 28.0, 21.0, 13.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0], "bins": [-6.42578125, -6.2291259765625, -6.032470703125, -5.8358154296875, -5.63916015625, -5.4425048828125, -5.245849609375, -5.0491943359375, -4.8525390625, -4.6558837890625, -4.459228515625, -4.2625732421875, -4.06591796875, -3.8692626953125, -3.672607421875, -3.4759521484375, -3.279296875, -3.0826416015625, -2.885986328125, -2.6893310546875, -2.49267578125, -2.2960205078125, -2.099365234375, -1.9027099609375, -1.7060546875, -1.5093994140625, -1.312744140625, -1.1160888671875, -0.91943359375, -0.7227783203125, -0.526123046875, -0.3294677734375, -0.1328125, 0.0638427734375, 0.260498046875, 0.4571533203125, 0.65380859375, 0.8504638671875, 1.047119140625, 1.2437744140625, 1.4404296875, 1.6370849609375, 1.833740234375, 2.0303955078125, 2.22705078125, 2.4237060546875, 2.620361328125, 2.8170166015625, 3.013671875, 3.2103271484375, 3.406982421875, 3.6036376953125, 3.80029296875, 3.9969482421875, 4.193603515625, 4.3902587890625, 4.5869140625, 4.7835693359375, 4.980224609375, 5.1768798828125, 5.37353515625, 5.5701904296875, 5.766845703125, 5.9635009765625, 6.16015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 9.0, 4.0, 12.0, 6.0, 10.0, 14.0, 19.0, 20.0, 28.0, 21.0, 20.0, 26.0, 30.0, 29.0, 25.0, 35.0, 33.0, 42.0, 37.0, 36.0, 31.0, 39.0, 44.0, 42.0, 41.0, 29.0, 34.0, 36.0, 32.0, 25.0, 30.0, 22.0, 18.0, 16.0, 19.0, 12.0, 13.0, 5.0, 7.0, 6.0, 7.0, 12.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.8046875, -4.6480712890625, -4.491455078125, -4.3348388671875, -4.17822265625, -4.0216064453125, -3.864990234375, -3.7083740234375, -3.5517578125, -3.3951416015625, -3.238525390625, -3.0819091796875, -2.92529296875, -2.7686767578125, -2.612060546875, -2.4554443359375, -2.298828125, -2.1422119140625, -1.985595703125, -1.8289794921875, -1.67236328125, -1.5157470703125, -1.359130859375, -1.2025146484375, -1.0458984375, -0.8892822265625, -0.732666015625, -0.5760498046875, -0.41943359375, -0.2628173828125, -0.106201171875, 0.0504150390625, 0.20703125, 0.3636474609375, 0.520263671875, 0.6768798828125, 0.83349609375, 0.9901123046875, 1.146728515625, 1.3033447265625, 1.4599609375, 1.6165771484375, 1.773193359375, 1.9298095703125, 2.08642578125, 2.2430419921875, 2.399658203125, 2.5562744140625, 2.712890625, 2.8695068359375, 3.026123046875, 3.1827392578125, 3.33935546875, 3.4959716796875, 3.652587890625, 3.8092041015625, 3.9658203125, 4.1224365234375, 4.279052734375, 4.4356689453125, 4.59228515625, 4.7489013671875, 4.905517578125, 5.0621337890625, 5.21875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 10.0, 21.0, 36.0, 43.0, 65.0, 99.0, 158.0, 225.0, 344.0, 534.0, 861.0, 1354.0, 2160.0, 3801.0, 6597.0, 11866.0, 22169.0, 41866.0, 82045.0, 158307.0, 253006.0, 215267.0, 117992.0, 60035.0, 31234.0, 16367.0, 9066.0, 5129.0, 3065.0, 1776.0, 1066.0, 688.0, 421.0, 290.0, 198.0, 111.0, 76.0, 64.0, 33.0, 25.0, 27.0, 12.0, 7.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.697265625, -2.614959716796875, -2.53265380859375, -2.450347900390625, -2.3680419921875, -2.285736083984375, -2.20343017578125, -2.121124267578125, -2.038818359375, -1.956512451171875, -1.87420654296875, -1.791900634765625, -1.7095947265625, -1.627288818359375, -1.54498291015625, -1.462677001953125, -1.38037109375, -1.298065185546875, -1.21575927734375, -1.133453369140625, -1.0511474609375, -0.968841552734375, -0.88653564453125, -0.804229736328125, -0.721923828125, -0.639617919921875, -0.55731201171875, -0.475006103515625, -0.3927001953125, -0.310394287109375, -0.22808837890625, -0.145782470703125, -0.0634765625, 0.018829345703125, 0.10113525390625, 0.183441162109375, 0.2657470703125, 0.348052978515625, 0.43035888671875, 0.512664794921875, 0.594970703125, 0.677276611328125, 0.75958251953125, 0.841888427734375, 0.9241943359375, 1.006500244140625, 1.08880615234375, 1.171112060546875, 1.25341796875, 1.335723876953125, 1.41802978515625, 1.500335693359375, 1.5826416015625, 1.664947509765625, 1.74725341796875, 1.829559326171875, 1.911865234375, 1.994171142578125, 2.07647705078125, 2.158782958984375, 2.2410888671875, 2.323394775390625, 2.40570068359375, 2.488006591796875, 2.5703125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 9.0, 9.0, 6.0, 8.0, 19.0, 14.0, 25.0, 22.0, 34.0, 55.0, 44.0, 51.0, 60.0, 81.0, 59.0, 70.0, 52.0, 54.0, 53.0, 44.0, 37.0, 29.0, 30.0, 27.0, 19.0, 11.0, 14.0, 11.0, 17.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0002396106719970703, -0.00023347511887550354, -0.00022733956575393677, -0.00022120401263237, -0.00021506845951080322, -0.00020893290638923645, -0.00020279735326766968, -0.0001966618001461029, -0.00019052624702453613, -0.00018439069390296936, -0.0001782551407814026, -0.00017211958765983582, -0.00016598403453826904, -0.00015984848141670227, -0.0001537129282951355, -0.00014757737517356873, -0.00014144182205200195, -0.00013530626893043518, -0.0001291707158088684, -0.00012303516268730164, -0.00011689960956573486, -0.00011076405644416809, -0.00010462850332260132, -9.849295020103455e-05, -9.235739707946777e-05, -8.6221843957901e-05, -8.008629083633423e-05, -7.395073771476746e-05, -6.781518459320068e-05, -6.167963147163391e-05, -5.554407835006714e-05, -4.9408525228500366e-05, -4.3272972106933594e-05, -3.713741898536682e-05, -3.100186586380005e-05, -2.4866312742233276e-05, -1.8730759620666504e-05, -1.2595206499099731e-05, -6.459653377532959e-06, -3.241002559661865e-07, 5.811452865600586e-06, 1.1947005987167358e-05, 1.808255910873413e-05, 2.4218112230300903e-05, 3.0353665351867676e-05, 3.648921847343445e-05, 4.262477159500122e-05, 4.876032471656799e-05, 5.4895877838134766e-05, 6.103143095970154e-05, 6.716698408126831e-05, 7.330253720283508e-05, 7.943809032440186e-05, 8.557364344596863e-05, 9.17091965675354e-05, 9.784474968910217e-05, 0.00010398030281066895, 0.00011011585593223572, 0.00011625140905380249, 0.00012238696217536926, 0.00012852251529693604, 0.0001346580684185028, 0.00014079362154006958, 0.00014692917466163635, 0.00015306472778320312]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 22.0, 18.0, 41.0, 55.0, 93.0, 112.0, 171.0, 283.0, 422.0, 627.0, 990.0, 1476.0, 2314.0, 3856.0, 6311.0, 10955.0, 18810.0, 32914.0, 57295.0, 97763.0, 153220.0, 191815.0, 174302.0, 121283.0, 72621.0, 42126.0, 23791.0, 13790.0, 8046.0, 4851.0, 2862.0, 1903.0, 1128.0, 783.0, 510.0, 342.0, 192.0, 152.0, 98.0, 71.0, 33.0, 36.0, 24.0, 12.0, 8.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.082275390625, -2.01220703125, -1.942138671875, -1.8720703125, -1.802001953125, -1.73193359375, -1.661865234375, -1.591796875, -1.521728515625, -1.45166015625, -1.381591796875, -1.3115234375, -1.241455078125, -1.17138671875, -1.101318359375, -1.03125, -0.961181640625, -0.89111328125, -0.821044921875, -0.7509765625, -0.680908203125, -0.61083984375, -0.540771484375, -0.470703125, -0.400634765625, -0.33056640625, -0.260498046875, -0.1904296875, -0.120361328125, -0.05029296875, 0.019775390625, 0.08984375, 0.159912109375, 0.22998046875, 0.300048828125, 0.3701171875, 0.440185546875, 0.51025390625, 0.580322265625, 0.650390625, 0.720458984375, 0.79052734375, 0.860595703125, 0.9306640625, 1.000732421875, 1.07080078125, 1.140869140625, 1.2109375, 1.281005859375, 1.35107421875, 1.421142578125, 1.4912109375, 1.561279296875, 1.63134765625, 1.701416015625, 1.771484375, 1.841552734375, 1.91162109375, 1.981689453125, 2.0517578125, 2.121826171875, 2.19189453125, 2.261962890625, 2.33203125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 8.0, 5.0, 12.0, 9.0, 16.0, 12.0, 26.0, 20.0, 26.0, 33.0, 29.0, 39.0, 36.0, 26.0, 49.0, 41.0, 53.0, 44.0, 42.0, 50.0, 44.0, 47.0, 40.0, 41.0, 36.0, 32.0, 25.0, 27.0, 18.0, 13.0, 12.0, 14.0, 12.0, 7.0, 11.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.58349609375, -0.5662384033203125, -0.548980712890625, -0.5317230224609375, -0.51446533203125, -0.4972076416015625, -0.479949951171875, -0.4626922607421875, -0.4454345703125, -0.4281768798828125, -0.410919189453125, -0.3936614990234375, -0.37640380859375, -0.3591461181640625, -0.341888427734375, -0.3246307373046875, -0.307373046875, -0.2901153564453125, -0.272857666015625, -0.2555999755859375, -0.23834228515625, -0.2210845947265625, -0.203826904296875, -0.1865692138671875, -0.1693115234375, -0.1520538330078125, -0.134796142578125, -0.1175384521484375, -0.10028076171875, -0.0830230712890625, -0.065765380859375, -0.0485076904296875, -0.03125, -0.0139923095703125, 0.003265380859375, 0.0205230712890625, 0.03778076171875, 0.0550384521484375, 0.072296142578125, 0.0895538330078125, 0.1068115234375, 0.1240692138671875, 0.141326904296875, 0.1585845947265625, 0.17584228515625, 0.1930999755859375, 0.210357666015625, 0.2276153564453125, 0.244873046875, 0.2621307373046875, 0.279388427734375, 0.2966461181640625, 0.31390380859375, 0.3311614990234375, 0.348419189453125, 0.3656768798828125, 0.3829345703125, 0.4001922607421875, 0.417449951171875, 0.4347076416015625, 0.45196533203125, 0.4692230224609375, 0.486480712890625, 0.5037384033203125, 0.52099609375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 5.0, 8.0, 9.0, 9.0, 17.0, 22.0, 33.0, 46.0, 49.0, 96.0, 87.0, 92.0, 111.0, 91.0, 80.0, 66.0, 48.0, 32.0, 28.0, 20.0, 11.0, 11.0, 11.0, 3.0, 2.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.20969581604004, -28.44330406188965, -27.676910400390625, -26.910518646240234, -26.144126892089844, -25.37773323059082, -24.61134147644043, -23.844947814941406, -23.078556060791016, -22.312164306640625, -21.5457706451416, -20.77937889099121, -20.012985229492188, -19.246593475341797, -18.480201721191406, -17.713809967041016, -16.947416305541992, -16.1810245513916, -15.414630889892578, -14.648239135742188, -13.88184642791748, -13.115453720092773, -12.349061965942383, -11.582669258117676, -10.816276550292969, -10.049883842468262, -9.283491134643555, -8.517099380493164, -7.750706672668457, -6.98431396484375, -6.217921733856201, -5.451529502868652, -4.685136795043945, -3.9187443256378174, -3.1523518562316895, -2.3859593868255615, -1.6195669174194336, -0.8531744480133057, -0.08678197860717773, 0.6796102523803711, 1.4460029602050781, 2.212395429611206, 2.978787899017334, 3.745180368423462, 4.51157283782959, 5.277965545654297, 6.044357776641846, 6.8107500076293945, 7.577142715454102, 8.343535423278809, 9.109928131103516, 9.876319885253906, 10.642712593078613, 11.40910530090332, 12.175497055053711, 12.941889762878418, 13.708282470703125, 14.474675178527832, 15.241067886352539, 16.00745964050293, 16.773853302001953, 17.540245056152344, 18.306636810302734, 19.073028564453125, 19.83942222595215]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 9.0, 9.0, 14.0, 8.0, 17.0, 15.0, 26.0, 27.0, 25.0, 25.0, 34.0, 39.0, 44.0, 56.0, 46.0, 52.0, 55.0, 44.0, 40.0, 57.0, 34.0, 45.0, 31.0, 40.0, 30.0, 30.0, 26.0, 28.0, 23.0, 21.0, 5.0, 13.0, 6.0, 13.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.59731388092041, -10.278158187866211, -9.959001541137695, -9.639845848083496, -9.320690155029297, -9.001534461975098, -8.682378768920898, -8.363222122192383, -8.044066429138184, -7.724910736083984, -7.405754566192627, -7.0865983963012695, -6.76744270324707, -6.448287010192871, -6.129130840301514, -5.809974670410156, -5.490818977355957, -5.171663284301758, -4.8525071144104, -4.533350944519043, -4.214195251464844, -3.8950393199920654, -3.575883388519287, -3.256727457046509, -2.9375715255737305, -2.618415594100952, -2.299259662628174, -1.9801037311553955, -1.6609477996826172, -1.3417918682098389, -1.0226359367370605, -0.7034800052642822, -0.3843231201171875, -0.06516718864440918, 0.25398874282836914, 0.5731446743011475, 0.8923006057739258, 1.211456537246704, 1.5306124687194824, 1.8497684001922607, 2.168924331665039, 2.4880802631378174, 2.8072361946105957, 3.126392126083374, 3.4455480575561523, 3.7647039890289307, 4.083859920501709, 4.403016090393066, 4.722171783447266, 5.041327476501465, 5.360483646392822, 5.67963981628418, 5.998795509338379, 6.317951202392578, 6.6371073722839355, 6.956263542175293, 7.275419235229492, 7.594574928283691, 7.913731098175049, 8.232887268066406, 8.552042961120605, 8.871198654174805, 9.19035530090332, 9.50951099395752, 9.828666687011719]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 8.0, 11.0, 12.0, 24.0, 42.0, 58.0, 82.0, 143.0, 186.0, 313.0, 492.0, 808.0, 1279.0, 2214.0, 3587.0, 5819.0, 9926.0, 17075.0, 28856.0, 50085.0, 84116.0, 131007.0, 173593.0, 177320.0, 139069.0, 90285.0, 54760.0, 32108.0, 18317.0, 10717.0, 6291.0, 3804.0, 2268.0, 1408.0, 952.0, 565.0, 317.0, 228.0, 137.0, 97.0, 59.0, 42.0, 28.0, 17.0, 13.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.578125, -10.21435546875, -9.8505859375, -9.48681640625, -9.123046875, -8.75927734375, -8.3955078125, -8.03173828125, -7.66796875, -7.30419921875, -6.9404296875, -6.57666015625, -6.212890625, -5.84912109375, -5.4853515625, -5.12158203125, -4.7578125, -4.39404296875, -4.0302734375, -3.66650390625, -3.302734375, -2.93896484375, -2.5751953125, -2.21142578125, -1.84765625, -1.48388671875, -1.1201171875, -0.75634765625, -0.392578125, -0.02880859375, 0.3349609375, 0.69873046875, 1.0625, 1.42626953125, 1.7900390625, 2.15380859375, 2.517578125, 2.88134765625, 3.2451171875, 3.60888671875, 3.97265625, 4.33642578125, 4.7001953125, 5.06396484375, 5.427734375, 5.79150390625, 6.1552734375, 6.51904296875, 6.8828125, 7.24658203125, 7.6103515625, 7.97412109375, 8.337890625, 8.70166015625, 9.0654296875, 9.42919921875, 9.79296875, 10.15673828125, 10.5205078125, 10.88427734375, 11.248046875, 11.61181640625, 11.9755859375, 12.33935546875, 12.703125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 6.0, 5.0, 9.0, 17.0, 13.0, 20.0, 14.0, 23.0, 26.0, 18.0, 35.0, 40.0, 41.0, 41.0, 51.0, 39.0, 49.0, 48.0, 41.0, 38.0, 39.0, 33.0, 34.0, 38.0, 34.0, 34.0, 34.0, 23.0, 25.0, 13.0, 18.0, 15.0, 20.0, 15.0, 11.0, 8.0, 9.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.5859375, -9.2713623046875, -8.956787109375, -8.6422119140625, -8.32763671875, -8.0130615234375, -7.698486328125, -7.3839111328125, -7.0693359375, -6.7547607421875, -6.440185546875, -6.1256103515625, -5.81103515625, -5.4964599609375, -5.181884765625, -4.8673095703125, -4.552734375, -4.2381591796875, -3.923583984375, -3.6090087890625, -3.29443359375, -2.9798583984375, -2.665283203125, -2.3507080078125, -2.0361328125, -1.7215576171875, -1.406982421875, -1.0924072265625, -0.77783203125, -0.4632568359375, -0.148681640625, 0.1658935546875, 0.48046875, 0.7950439453125, 1.109619140625, 1.4241943359375, 1.73876953125, 2.0533447265625, 2.367919921875, 2.6824951171875, 2.9970703125, 3.3116455078125, 3.626220703125, 3.9407958984375, 4.25537109375, 4.5699462890625, 4.884521484375, 5.1990966796875, 5.513671875, 5.8282470703125, 6.142822265625, 6.4573974609375, 6.77197265625, 7.0865478515625, 7.401123046875, 7.7156982421875, 8.0302734375, 8.3448486328125, 8.659423828125, 8.9739990234375, 9.28857421875, 9.6031494140625, 9.917724609375, 10.2322998046875, 10.546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 13.0, 19.0, 36.0, 37.0, 79.0, 80.0, 138.0, 235.0, 345.0, 515.0, 892.0, 1378.0, 2393.0, 3931.0, 6619.0, 11244.0, 20420.0, 37016.0, 64431.0, 108105.0, 158392.0, 186891.0, 166467.0, 115884.0, 70571.0, 39905.0, 21932.0, 12500.0, 7260.0, 4162.0, 2444.0, 1545.0, 943.0, 596.0, 379.0, 267.0, 158.0, 92.0, 78.0, 57.0, 35.0, 19.0, 13.0, 9.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-13.421875, -13.03369140625, -12.6455078125, -12.25732421875, -11.869140625, -11.48095703125, -11.0927734375, -10.70458984375, -10.31640625, -9.92822265625, -9.5400390625, -9.15185546875, -8.763671875, -8.37548828125, -7.9873046875, -7.59912109375, -7.2109375, -6.82275390625, -6.4345703125, -6.04638671875, -5.658203125, -5.27001953125, -4.8818359375, -4.49365234375, -4.10546875, -3.71728515625, -3.3291015625, -2.94091796875, -2.552734375, -2.16455078125, -1.7763671875, -1.38818359375, -1.0, -0.61181640625, -0.2236328125, 0.16455078125, 0.552734375, 0.94091796875, 1.3291015625, 1.71728515625, 2.10546875, 2.49365234375, 2.8818359375, 3.27001953125, 3.658203125, 4.04638671875, 4.4345703125, 4.82275390625, 5.2109375, 5.59912109375, 5.9873046875, 6.37548828125, 6.763671875, 7.15185546875, 7.5400390625, 7.92822265625, 8.31640625, 8.70458984375, 9.0927734375, 9.48095703125, 9.869140625, 10.25732421875, 10.6455078125, 11.03369140625, 11.421875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 7.0, 6.0, 7.0, 8.0, 15.0, 11.0, 10.0, 16.0, 18.0, 18.0, 17.0, 31.0, 26.0, 51.0, 31.0, 30.0, 40.0, 41.0, 26.0, 46.0, 35.0, 39.0, 43.0, 41.0, 42.0, 43.0, 28.0, 43.0, 30.0, 32.0, 33.0, 23.0, 19.0, 12.0, 16.0, 11.0, 10.0, 9.0, 9.0, 8.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.62530517578125, -5.4537353515625, -5.28216552734375, -5.110595703125, -4.93902587890625, -4.7674560546875, -4.59588623046875, -4.42431640625, -4.25274658203125, -4.0811767578125, -3.90960693359375, -3.738037109375, -3.56646728515625, -3.3948974609375, -3.22332763671875, -3.0517578125, -2.88018798828125, -2.7086181640625, -2.53704833984375, -2.365478515625, -2.19390869140625, -2.0223388671875, -1.85076904296875, -1.67919921875, -1.50762939453125, -1.3360595703125, -1.16448974609375, -0.992919921875, -0.82135009765625, -0.6497802734375, -0.47821044921875, -0.306640625, -0.13507080078125, 0.0364990234375, 0.20806884765625, 0.379638671875, 0.55120849609375, 0.7227783203125, 0.89434814453125, 1.06591796875, 1.23748779296875, 1.4090576171875, 1.58062744140625, 1.752197265625, 1.92376708984375, 2.0953369140625, 2.26690673828125, 2.4384765625, 2.61004638671875, 2.7816162109375, 2.95318603515625, 3.124755859375, 3.29632568359375, 3.4678955078125, 3.63946533203125, 3.81103515625, 3.98260498046875, 4.1541748046875, 4.32574462890625, 4.497314453125, 4.66888427734375, 4.8404541015625, 5.01202392578125, 5.18359375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 12.0, 9.0, 27.0, 42.0, 65.0, 74.0, 127.0, 179.0, 277.0, 409.0, 641.0, 927.0, 1480.0, 2371.0, 3925.0, 6438.0, 10634.0, 17975.0, 31224.0, 54709.0, 92261.0, 146311.0, 189532.0, 178464.0, 125698.0, 76640.0, 44830.0, 25504.0, 15000.0, 8732.0, 5320.0, 3159.0, 2003.0, 1232.0, 844.0, 474.0, 338.0, 214.0, 137.0, 85.0, 78.0, 41.0, 40.0, 21.0, 12.0, 11.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.47265625, -4.33636474609375, -4.2000732421875, -4.06378173828125, -3.927490234375, -3.79119873046875, -3.6549072265625, -3.51861572265625, -3.38232421875, -3.24603271484375, -3.1097412109375, -2.97344970703125, -2.837158203125, -2.70086669921875, -2.5645751953125, -2.42828369140625, -2.2919921875, -2.15570068359375, -2.0194091796875, -1.88311767578125, -1.746826171875, -1.61053466796875, -1.4742431640625, -1.33795166015625, -1.20166015625, -1.06536865234375, -0.9290771484375, -0.79278564453125, -0.656494140625, -0.52020263671875, -0.3839111328125, -0.24761962890625, -0.111328125, 0.02496337890625, 0.1612548828125, 0.29754638671875, 0.433837890625, 0.57012939453125, 0.7064208984375, 0.84271240234375, 0.97900390625, 1.11529541015625, 1.2515869140625, 1.38787841796875, 1.524169921875, 1.66046142578125, 1.7967529296875, 1.93304443359375, 2.0693359375, 2.20562744140625, 2.3419189453125, 2.47821044921875, 2.614501953125, 2.75079345703125, 2.8870849609375, 3.02337646484375, 3.15966796875, 3.29595947265625, 3.4322509765625, 3.56854248046875, 3.704833984375, 3.84112548828125, 3.9774169921875, 4.11370849609375, 4.25]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 5.0, 6.0, 6.0, 9.0, 6.0, 8.0, 11.0, 14.0, 18.0, 17.0, 17.0, 31.0, 36.0, 27.0, 40.0, 58.0, 44.0, 62.0, 44.0, 50.0, 63.0, 56.0, 66.0, 44.0, 42.0, 32.0, 39.0, 34.0, 30.0, 21.0, 12.0, 13.0, 14.0, 11.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00038814544677734375, -0.000374622642993927, -0.00036109983921051025, -0.0003475770354270935, -0.00033405423164367676, -0.00032053142786026, -0.00030700862407684326, -0.0002934858202934265, -0.00027996301651000977, -0.000266440212726593, -0.00025291740894317627, -0.00023939460515975952, -0.00022587180137634277, -0.00021234899759292603, -0.00019882619380950928, -0.00018530339002609253, -0.00017178058624267578, -0.00015825778245925903, -0.00014473497867584229, -0.00013121217489242554, -0.00011768937110900879, -0.00010416656732559204, -9.064376354217529e-05, -7.712095975875854e-05, -6.35981559753418e-05, -5.007535219192505e-05, -3.65525484085083e-05, -2.3029744625091553e-05, -9.506940841674805e-06, 4.015862941741943e-06, 1.753866672515869e-05, 3.106147050857544e-05, 4.458427429199219e-05, 5.8107078075408936e-05, 7.162988185882568e-05, 8.515268564224243e-05, 9.867548942565918e-05, 0.00011219829320907593, 0.00012572109699249268, 0.00013924390077590942, 0.00015276670455932617, 0.00016628950834274292, 0.00017981231212615967, 0.00019333511590957642, 0.00020685791969299316, 0.0002203807234764099, 0.00023390352725982666, 0.0002474263310432434, 0.00026094913482666016, 0.0002744719386100769, 0.00028799474239349365, 0.0003015175461769104, 0.00031504034996032715, 0.0003285631537437439, 0.00034208595752716064, 0.0003556087613105774, 0.00036913156509399414, 0.0003826543688774109, 0.00039617717266082764, 0.0004096999764442444, 0.00042322278022766113, 0.0004367455840110779, 0.00045026838779449463, 0.0004637911915779114, 0.0004773139953613281]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 8.0, 11.0, 18.0, 15.0, 32.0, 33.0, 50.0, 73.0, 106.0, 216.0, 288.0, 439.0, 693.0, 1085.0, 1716.0, 2744.0, 4262.0, 7263.0, 12056.0, 20013.0, 33542.0, 56154.0, 91997.0, 141120.0, 181245.0, 171559.0, 124038.0, 78497.0, 47707.0, 28031.0, 16813.0, 10306.0, 6131.0, 3761.0, 2362.0, 1494.0, 913.0, 608.0, 392.0, 258.0, 145.0, 101.0, 77.0, 52.0, 47.0, 37.0, 15.0, 14.0, 10.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.15753173828125, -4.0181884765625, -3.87884521484375, -3.739501953125, -3.60015869140625, -3.4608154296875, -3.32147216796875, -3.18212890625, -3.04278564453125, -2.9034423828125, -2.76409912109375, -2.624755859375, -2.48541259765625, -2.3460693359375, -2.20672607421875, -2.0673828125, -1.92803955078125, -1.7886962890625, -1.64935302734375, -1.510009765625, -1.37066650390625, -1.2313232421875, -1.09197998046875, -0.95263671875, -0.81329345703125, -0.6739501953125, -0.53460693359375, -0.395263671875, -0.25592041015625, -0.1165771484375, 0.02276611328125, 0.162109375, 0.30145263671875, 0.4407958984375, 0.58013916015625, 0.719482421875, 0.85882568359375, 0.9981689453125, 1.13751220703125, 1.27685546875, 1.41619873046875, 1.5555419921875, 1.69488525390625, 1.834228515625, 1.97357177734375, 2.1129150390625, 2.25225830078125, 2.3916015625, 2.53094482421875, 2.6702880859375, 2.80963134765625, 2.948974609375, 3.08831787109375, 3.2276611328125, 3.36700439453125, 3.50634765625, 3.64569091796875, 3.7850341796875, 3.92437744140625, 4.063720703125, 4.20306396484375, 4.3424072265625, 4.48175048828125, 4.62109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 6.0, 5.0, 9.0, 20.0, 16.0, 25.0, 20.0, 31.0, 28.0, 30.0, 36.0, 43.0, 40.0, 44.0, 57.0, 54.0, 52.0, 59.0, 44.0, 54.0, 42.0, 42.0, 41.0, 34.0, 33.0, 30.0, 18.0, 13.0, 18.0, 11.0, 13.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.3525390625, -1.3134613037109375, -1.274383544921875, -1.2353057861328125, -1.19622802734375, -1.1571502685546875, -1.118072509765625, -1.0789947509765625, -1.0399169921875, -1.0008392333984375, -0.961761474609375, -0.9226837158203125, -0.88360595703125, -0.8445281982421875, -0.805450439453125, -0.7663726806640625, -0.727294921875, -0.6882171630859375, -0.649139404296875, -0.6100616455078125, -0.57098388671875, -0.5319061279296875, -0.492828369140625, -0.4537506103515625, -0.4146728515625, -0.3755950927734375, -0.336517333984375, -0.2974395751953125, -0.25836181640625, -0.2192840576171875, -0.180206298828125, -0.1411285400390625, -0.10205078125, -0.0629730224609375, -0.023895263671875, 0.0151824951171875, 0.05426025390625, 0.0933380126953125, 0.132415771484375, 0.1714935302734375, 0.2105712890625, 0.2496490478515625, 0.288726806640625, 0.3278045654296875, 0.36688232421875, 0.4059600830078125, 0.445037841796875, 0.4841156005859375, 0.523193359375, 0.5622711181640625, 0.601348876953125, 0.6404266357421875, 0.67950439453125, 0.7185821533203125, 0.757659912109375, 0.7967376708984375, 0.8358154296875, 0.8748931884765625, 0.913970947265625, 0.9530487060546875, 0.99212646484375, 1.0312042236328125, 1.070281982421875, 1.1093597412109375, 1.1484375]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 17.0, 12.0, 14.0, 24.0, 37.0, 63.0, 71.0, 91.0, 109.0, 100.0, 97.0, 98.0, 66.0, 46.0, 38.0, 21.0, 19.0, 15.0, 13.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.74650001525879, -27.978233337402344, -27.2099666595459, -26.441699981689453, -25.673431396484375, -24.90516471862793, -24.136898040771484, -23.36863136291504, -22.600364685058594, -21.83209800720215, -21.063831329345703, -20.295562744140625, -19.52729606628418, -18.759029388427734, -17.99076271057129, -17.222496032714844, -16.454227447509766, -15.68596076965332, -14.917693138122559, -14.149426460266113, -13.381158828735352, -12.612892150878906, -11.844625473022461, -11.076358795166016, -10.308091163635254, -9.539824485778809, -8.771556854248047, -8.003290176391602, -7.235023021697998, -6.4667558670043945, -5.698489189147949, -4.930222034454346, -4.161952972412109, -3.393685817718506, -2.6254189014434814, -1.857151985168457, -1.0888848304748535, -0.32061767578125, 0.4476490020751953, 1.2159161567687988, 1.9841833114624023, 2.752450466156006, 3.5207173824310303, 4.288984298706055, 5.057251453399658, 5.825518608093262, 6.593785285949707, 7.3620524406433105, 8.130319595336914, 8.89858627319336, 9.666853904724121, 10.435120582580566, 11.203388214111328, 11.971654891967773, 12.739921569824219, 13.508188247680664, 14.276455879211426, 15.044722557067871, 15.812990188598633, 16.581256866455078, 17.349523544311523, 18.11779022216797, 18.886058807373047, 19.654325485229492, 20.422592163085938]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 7.0, 10.0, 8.0, 11.0, 4.0, 16.0, 15.0, 26.0, 29.0, 36.0, 22.0, 43.0, 44.0, 44.0, 44.0, 37.0, 37.0, 46.0, 53.0, 47.0, 39.0, 41.0, 50.0, 32.0, 39.0, 33.0, 33.0, 21.0, 23.0, 27.0, 16.0, 10.0, 8.0, 15.0, 6.0, 8.0, 5.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.555373191833496, -10.253592491149902, -9.951812744140625, -9.650032043457031, -9.348251342773438, -9.04647159576416, -8.744690895080566, -8.442911148071289, -8.141130447387695, -7.83935022354126, -7.537569999694824, -7.2357892990112305, -6.934009075164795, -6.632228851318359, -6.330448150634766, -6.02866792678833, -5.7268877029418945, -5.425107479095459, -5.123327255249023, -4.82154655456543, -4.519766330718994, -4.217986106872559, -3.916205644607544, -3.6144251823425293, -3.3126449584960938, -3.010864734649658, -2.7090842723846436, -2.407303810119629, -2.1055235862731934, -1.8037432432174683, -1.5019629001617432, -1.2001824378967285, -0.8984012603759766, -0.5966209173202515, -0.29484057426452637, 0.0069397687911987305, 0.30872011184692383, 0.6105004549026489, 0.912280797958374, 1.2140612602233887, 1.5158414840698242, 1.8176218271255493, 2.1194021701812744, 2.421182632446289, 2.7229628562927246, 3.02474308013916, 3.326523542404175, 3.6283040046691895, 3.930084228515625, 4.2318644523620605, 4.533644676208496, 4.83542537689209, 5.137205600738525, 5.438985824584961, 5.740766525268555, 6.04254674911499, 6.344326972961426, 6.646107196807861, 6.947887420654297, 7.249668121337891, 7.551448345184326, 7.853228569030762, 8.155009269714355, 8.456789016723633, 8.758569717407227]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 10.0, 13.0, 16.0, 19.0, 39.0, 60.0, 89.0, 120.0, 208.0, 321.0, 535.0, 769.0, 1321.0, 2223.0, 3808.0, 6954.0, 13364.0, 26885.0, 59025.0, 140947.0, 387492.0, 1072273.0, 1433278.0, 650378.0, 224835.0, 87404.0, 38934.0, 19056.0, 9979.0, 5403.0, 3157.0, 1949.0, 1171.0, 762.0, 483.0, 310.0, 223.0, 158.0, 96.0, 58.0, 41.0, 35.0, 30.0, 19.0, 10.0, 6.0, 3.0, 5.0, 7.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.140625, -15.569091796875, -14.99755859375, -14.426025390625, -13.8544921875, -13.282958984375, -12.71142578125, -12.139892578125, -11.568359375, -10.996826171875, -10.42529296875, -9.853759765625, -9.2822265625, -8.710693359375, -8.13916015625, -7.567626953125, -6.99609375, -6.424560546875, -5.85302734375, -5.281494140625, -4.7099609375, -4.138427734375, -3.56689453125, -2.995361328125, -2.423828125, -1.852294921875, -1.28076171875, -0.709228515625, -0.1376953125, 0.433837890625, 1.00537109375, 1.576904296875, 2.1484375, 2.719970703125, 3.29150390625, 3.863037109375, 4.4345703125, 5.006103515625, 5.57763671875, 6.149169921875, 6.720703125, 7.292236328125, 7.86376953125, 8.435302734375, 9.0068359375, 9.578369140625, 10.14990234375, 10.721435546875, 11.29296875, 11.864501953125, 12.43603515625, 13.007568359375, 13.5791015625, 14.150634765625, 14.72216796875, 15.293701171875, 15.865234375, 16.436767578125, 17.00830078125, 17.579833984375, 18.1513671875, 18.722900390625, 19.29443359375, 19.865966796875, 20.4375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 9.0, 6.0, 14.0, 11.0, 12.0, 20.0, 24.0, 27.0, 26.0, 25.0, 37.0, 40.0, 37.0, 40.0, 44.0, 42.0, 44.0, 34.0, 35.0, 45.0, 37.0, 42.0, 55.0, 32.0, 38.0, 38.0, 20.0, 25.0, 22.0, 22.0, 21.0, 9.0, 8.0, 7.0, 9.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.01171875, -6.7952880859375, -6.578857421875, -6.3624267578125, -6.14599609375, -5.9295654296875, -5.713134765625, -5.4967041015625, -5.2802734375, -5.0638427734375, -4.847412109375, -4.6309814453125, -4.41455078125, -4.1981201171875, -3.981689453125, -3.7652587890625, -3.548828125, -3.3323974609375, -3.115966796875, -2.8995361328125, -2.68310546875, -2.4666748046875, -2.250244140625, -2.0338134765625, -1.8173828125, -1.6009521484375, -1.384521484375, -1.1680908203125, -0.95166015625, -0.7352294921875, -0.518798828125, -0.3023681640625, -0.0859375, 0.1304931640625, 0.346923828125, 0.5633544921875, 0.77978515625, 0.9962158203125, 1.212646484375, 1.4290771484375, 1.6455078125, 1.8619384765625, 2.078369140625, 2.2947998046875, 2.51123046875, 2.7276611328125, 2.944091796875, 3.1605224609375, 3.376953125, 3.5933837890625, 3.809814453125, 4.0262451171875, 4.24267578125, 4.4591064453125, 4.675537109375, 4.8919677734375, 5.1083984375, 5.3248291015625, 5.541259765625, 5.7576904296875, 5.97412109375, 6.1905517578125, 6.406982421875, 6.6234130859375, 6.83984375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 6.0, 13.0, 20.0, 24.0, 42.0, 49.0, 77.0, 122.0, 188.0, 242.0, 476.0, 713.0, 1178.0, 2001.0, 3234.0, 5850.0, 10503.0, 20184.0, 41310.0, 90135.0, 216389.0, 550684.0, 1230338.0, 1159887.0, 498878.0, 198077.0, 83200.0, 38242.0, 18807.0, 9873.0, 5449.0, 3128.0, 1918.0, 1190.0, 682.0, 431.0, 235.0, 188.0, 116.0, 66.0, 49.0, 21.0, 28.0, 16.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.81396484375, -18.2060546875, -17.59814453125, -16.990234375, -16.38232421875, -15.7744140625, -15.16650390625, -14.55859375, -13.95068359375, -13.3427734375, -12.73486328125, -12.126953125, -11.51904296875, -10.9111328125, -10.30322265625, -9.6953125, -9.08740234375, -8.4794921875, -7.87158203125, -7.263671875, -6.65576171875, -6.0478515625, -5.43994140625, -4.83203125, -4.22412109375, -3.6162109375, -3.00830078125, -2.400390625, -1.79248046875, -1.1845703125, -0.57666015625, 0.03125, 0.63916015625, 1.2470703125, 1.85498046875, 2.462890625, 3.07080078125, 3.6787109375, 4.28662109375, 4.89453125, 5.50244140625, 6.1103515625, 6.71826171875, 7.326171875, 7.93408203125, 8.5419921875, 9.14990234375, 9.7578125, 10.36572265625, 10.9736328125, 11.58154296875, 12.189453125, 12.79736328125, 13.4052734375, 14.01318359375, 14.62109375, 15.22900390625, 15.8369140625, 16.44482421875, 17.052734375, 17.66064453125, 18.2685546875, 18.87646484375, 19.484375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 9.0, 11.0, 23.0, 23.0, 33.0, 48.0, 58.0, 60.0, 109.0, 131.0, 148.0, 188.0, 223.0, 290.0, 339.0, 350.0, 336.0, 310.0, 278.0, 238.0, 195.0, 160.0, 129.0, 88.0, 49.0, 46.0, 45.0, 35.0, 25.0, 20.0, 11.0, 10.0, 14.0, 4.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.55859375, -5.399658203125, -5.24072265625, -5.081787109375, -4.9228515625, -4.763916015625, -4.60498046875, -4.446044921875, -4.287109375, -4.128173828125, -3.96923828125, -3.810302734375, -3.6513671875, -3.492431640625, -3.33349609375, -3.174560546875, -3.015625, -2.856689453125, -2.69775390625, -2.538818359375, -2.3798828125, -2.220947265625, -2.06201171875, -1.903076171875, -1.744140625, -1.585205078125, -1.42626953125, -1.267333984375, -1.1083984375, -0.949462890625, -0.79052734375, -0.631591796875, -0.47265625, -0.313720703125, -0.15478515625, 0.004150390625, 0.1630859375, 0.322021484375, 0.48095703125, 0.639892578125, 0.798828125, 0.957763671875, 1.11669921875, 1.275634765625, 1.4345703125, 1.593505859375, 1.75244140625, 1.911376953125, 2.0703125, 2.229248046875, 2.38818359375, 2.547119140625, 2.7060546875, 2.864990234375, 3.02392578125, 3.182861328125, 3.341796875, 3.500732421875, 3.65966796875, 3.818603515625, 3.9775390625, 4.136474609375, 4.29541015625, 4.454345703125, 4.61328125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 12.0, 27.0, 31.0, 27.0, 35.0, 61.0, 68.0, 93.0, 106.0, 97.0, 98.0, 87.0, 59.0, 50.0, 38.0, 24.0, 21.0, 11.0, 5.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.156291961669922, -27.379981994628906, -26.60367202758789, -25.827362060546875, -25.051050186157227, -24.27474021911621, -23.498430252075195, -22.72212028503418, -21.94580841064453, -21.169498443603516, -20.3931884765625, -19.616878509521484, -18.840566635131836, -18.06425666809082, -17.287946701049805, -16.51163673400879, -15.735326766967773, -14.959016799926758, -14.182705879211426, -13.40639591217041, -12.630084991455078, -11.853775024414062, -11.077465057373047, -10.301155090332031, -9.5248441696167, -8.748534202575684, -7.972223281860352, -7.195913314819336, -6.419602870941162, -5.643292427062988, -4.866982460021973, -4.090672016143799, -3.314361572265625, -2.538051128387451, -1.7617409229278564, -0.9854307174682617, -0.2091202735900879, 0.5671901702880859, 1.3435001373291016, 2.1198105812072754, 2.896121025085449, 3.672431468963623, 4.448741912841797, 5.2250518798828125, 6.001362323760986, 6.77767276763916, 7.553982734680176, 8.330293655395508, 9.106603622436523, 9.882913589477539, 10.659224510192871, 11.435534477233887, 12.211845397949219, 12.988155364990234, 13.76446533203125, 14.540775299072266, 15.317086219787598, 16.09339714050293, 16.869707107543945, 17.64601707458496, 18.422327041625977, 19.198638916015625, 19.97494888305664, 20.751258850097656, 21.527568817138672]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 11.0, 12.0, 10.0, 12.0, 15.0, 31.0, 25.0, 24.0, 18.0, 23.0, 25.0, 49.0, 47.0, 43.0, 35.0, 53.0, 53.0, 45.0, 42.0, 37.0, 48.0, 49.0, 35.0, 39.0, 26.0, 32.0, 27.0, 27.0, 25.0, 17.0, 10.0, 8.0, 11.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.673925399780273, -9.38236141204834, -9.090797424316406, -8.799233436584473, -8.507669448852539, -8.216106414794922, -7.924542427062988, -7.632978439331055, -7.341414451599121, -7.0498504638671875, -6.758286476135254, -6.4667229652404785, -6.175158977508545, -5.883594989776611, -5.592031478881836, -5.300467491149902, -5.008903503417969, -4.717339515686035, -4.425775527954102, -4.134212017059326, -3.8426480293273926, -3.551084041595459, -3.2595202922821045, -2.96795654296875, -2.6763925552368164, -2.384828567504883, -2.0932648181915283, -1.8017009496688843, -1.5101370811462402, -1.2185732126235962, -0.9270093441009521, -0.6354455947875977, -0.34388256072998047, -0.052318692207336426, 0.23924517631530762, 0.5308090448379517, 0.8223729133605957, 1.1139367818832397, 1.4055006504058838, 1.6970643997192383, 1.9886283874511719, 2.2801923751831055, 2.57175612449646, 2.8633198738098145, 3.154883861541748, 3.4464478492736816, 3.738011598587036, 4.029575347900391, 4.321139335632324, 4.612703323364258, 4.904267311096191, 5.195830821990967, 5.4873948097229, 5.778958797454834, 6.070522308349609, 6.362086296081543, 6.653650283813477, 6.94521427154541, 7.236778259277344, 7.528341770172119, 7.819905757904053, 8.111469268798828, 8.403033256530762, 8.694597244262695, 8.986161231994629]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 9.0, 19.0, 10.0, 18.0, 30.0, 70.0, 67.0, 133.0, 196.0, 292.0, 456.0, 787.0, 1341.0, 2365.0, 4223.0, 8062.0, 15797.0, 31183.0, 63709.0, 128020.0, 223267.0, 247390.0, 158639.0, 81154.0, 39573.0, 19630.0, 9979.0, 5179.0, 2917.0, 1585.0, 950.0, 539.0, 348.0, 213.0, 130.0, 99.0, 60.0, 36.0, 17.0, 25.0, 12.0, 12.0, 4.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.48046875, -7.2479248046875, -7.015380859375, -6.7828369140625, -6.55029296875, -6.3177490234375, -6.085205078125, -5.8526611328125, -5.6201171875, -5.3875732421875, -5.155029296875, -4.9224853515625, -4.68994140625, -4.4573974609375, -4.224853515625, -3.9923095703125, -3.759765625, -3.5272216796875, -3.294677734375, -3.0621337890625, -2.82958984375, -2.5970458984375, -2.364501953125, -2.1319580078125, -1.8994140625, -1.6668701171875, -1.434326171875, -1.2017822265625, -0.96923828125, -0.7366943359375, -0.504150390625, -0.2716064453125, -0.0390625, 0.1934814453125, 0.426025390625, 0.6585693359375, 0.89111328125, 1.1236572265625, 1.356201171875, 1.5887451171875, 1.8212890625, 2.0538330078125, 2.286376953125, 2.5189208984375, 2.75146484375, 2.9840087890625, 3.216552734375, 3.4490966796875, 3.681640625, 3.9141845703125, 4.146728515625, 4.3792724609375, 4.61181640625, 4.8443603515625, 5.076904296875, 5.3094482421875, 5.5419921875, 5.7745361328125, 6.007080078125, 6.2396240234375, 6.47216796875, 6.7047119140625, 6.937255859375, 7.1697998046875, 7.40234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 10.0, 5.0, 4.0, 11.0, 15.0, 9.0, 18.0, 20.0, 23.0, 38.0, 34.0, 33.0, 52.0, 39.0, 47.0, 55.0, 56.0, 51.0, 54.0, 54.0, 44.0, 43.0, 36.0, 41.0, 34.0, 31.0, 31.0, 19.0, 13.0, 23.0, 9.0, 10.0, 11.0, 7.0, 11.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.7890625, -11.4381103515625, -11.087158203125, -10.7362060546875, -10.38525390625, -10.0343017578125, -9.683349609375, -9.3323974609375, -8.9814453125, -8.6304931640625, -8.279541015625, -7.9285888671875, -7.57763671875, -7.2266845703125, -6.875732421875, -6.5247802734375, -6.173828125, -5.8228759765625, -5.471923828125, -5.1209716796875, -4.77001953125, -4.4190673828125, -4.068115234375, -3.7171630859375, -3.3662109375, -3.0152587890625, -2.664306640625, -2.3133544921875, -1.96240234375, -1.6114501953125, -1.260498046875, -0.9095458984375, -0.55859375, -0.2076416015625, 0.143310546875, 0.4942626953125, 0.84521484375, 1.1961669921875, 1.547119140625, 1.8980712890625, 2.2490234375, 2.5999755859375, 2.950927734375, 3.3018798828125, 3.65283203125, 4.0037841796875, 4.354736328125, 4.7056884765625, 5.056640625, 5.4075927734375, 5.758544921875, 6.1094970703125, 6.46044921875, 6.8114013671875, 7.162353515625, 7.5133056640625, 7.8642578125, 8.2152099609375, 8.566162109375, 8.9171142578125, 9.26806640625, 9.6190185546875, 9.969970703125, 10.3209228515625, 10.671875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 8.0, 16.0, 17.0, 36.0, 42.0, 62.0, 79.0, 140.0, 154.0, 251.0, 384.0, 560.0, 789.0, 1203.0, 1851.0, 2855.0, 4453.0, 7397.0, 12135.0, 20294.0, 36648.0, 64542.0, 115678.0, 190663.0, 222377.0, 155925.0, 89627.0, 49881.0, 28060.0, 16186.0, 9570.0, 5941.0, 3707.0, 2338.0, 1494.0, 1054.0, 684.0, 461.0, 305.0, 219.0, 145.0, 109.0, 76.0, 45.0, 29.0, 17.0, 16.0, 13.0, 4.0, 5.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.90625, -6.67816162109375, -6.4500732421875, -6.22198486328125, -5.993896484375, -5.76580810546875, -5.5377197265625, -5.30963134765625, -5.08154296875, -4.85345458984375, -4.6253662109375, -4.39727783203125, -4.169189453125, -3.94110107421875, -3.7130126953125, -3.48492431640625, -3.2568359375, -3.02874755859375, -2.8006591796875, -2.57257080078125, -2.344482421875, -2.11639404296875, -1.8883056640625, -1.66021728515625, -1.43212890625, -1.20404052734375, -0.9759521484375, -0.74786376953125, -0.519775390625, -0.29168701171875, -0.0635986328125, 0.16448974609375, 0.392578125, 0.62066650390625, 0.8487548828125, 1.07684326171875, 1.304931640625, 1.53302001953125, 1.7611083984375, 1.98919677734375, 2.21728515625, 2.44537353515625, 2.6734619140625, 2.90155029296875, 3.129638671875, 3.35772705078125, 3.5858154296875, 3.81390380859375, 4.0419921875, 4.27008056640625, 4.4981689453125, 4.72625732421875, 4.954345703125, 5.18243408203125, 5.4105224609375, 5.63861083984375, 5.86669921875, 6.09478759765625, 6.3228759765625, 6.55096435546875, 6.779052734375, 7.00714111328125, 7.2352294921875, 7.46331787109375, 7.69140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 7.0, 4.0, 10.0, 18.0, 11.0, 14.0, 13.0, 16.0, 24.0, 18.0, 26.0, 26.0, 19.0, 32.0, 32.0, 30.0, 41.0, 42.0, 33.0, 35.0, 39.0, 28.0, 26.0, 46.0, 36.0, 26.0, 35.0, 39.0, 25.0, 35.0, 31.0, 26.0, 20.0, 22.0, 12.0, 18.0, 13.0, 17.0, 9.0, 12.0, 9.0, 10.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5478515625, -4.392578125, -4.2373046875, -4.08203125, -3.9267578125, -3.771484375, -3.6162109375, -3.4609375, -3.3056640625, -3.150390625, -2.9951171875, -2.83984375, -2.6845703125, -2.529296875, -2.3740234375, -2.21875, -2.0634765625, -1.908203125, -1.7529296875, -1.59765625, -1.4423828125, -1.287109375, -1.1318359375, -0.9765625, -0.8212890625, -0.666015625, -0.5107421875, -0.35546875, -0.2001953125, -0.044921875, 0.1103515625, 0.265625, 0.4208984375, 0.576171875, 0.7314453125, 0.88671875, 1.0419921875, 1.197265625, 1.3525390625, 1.5078125, 1.6630859375, 1.818359375, 1.9736328125, 2.12890625, 2.2841796875, 2.439453125, 2.5947265625, 2.75, 2.9052734375, 3.060546875, 3.2158203125, 3.37109375, 3.5263671875, 3.681640625, 3.8369140625, 3.9921875, 4.1474609375, 4.302734375, 4.4580078125, 4.61328125, 4.7685546875, 4.923828125, 5.0791015625, 5.234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 8.0, 5.0, 6.0, 19.0, 21.0, 34.0, 43.0, 61.0, 124.0, 198.0, 322.0, 550.0, 885.0, 1641.0, 3033.0, 5552.0, 10782.0, 21843.0, 47423.0, 108229.0, 240895.0, 310862.0, 161990.0, 70684.0, 31723.0, 14973.0, 7605.0, 3904.0, 2136.0, 1267.0, 699.0, 403.0, 261.0, 151.0, 98.0, 43.0, 35.0, 21.0, 8.0, 13.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.892578125, -3.788055419921875, -3.68353271484375, -3.579010009765625, -3.4744873046875, -3.369964599609375, -3.26544189453125, -3.160919189453125, -3.056396484375, -2.951873779296875, -2.84735107421875, -2.742828369140625, -2.6383056640625, -2.533782958984375, -2.42926025390625, -2.324737548828125, -2.22021484375, -2.115692138671875, -2.01116943359375, -1.906646728515625, -1.8021240234375, -1.697601318359375, -1.59307861328125, -1.488555908203125, -1.384033203125, -1.279510498046875, -1.17498779296875, -1.070465087890625, -0.9659423828125, -0.861419677734375, -0.75689697265625, -0.652374267578125, -0.5478515625, -0.443328857421875, -0.33880615234375, -0.234283447265625, -0.1297607421875, -0.025238037109375, 0.07928466796875, 0.183807373046875, 0.288330078125, 0.392852783203125, 0.49737548828125, 0.601898193359375, 0.7064208984375, 0.810943603515625, 0.91546630859375, 1.019989013671875, 1.12451171875, 1.229034423828125, 1.33355712890625, 1.438079833984375, 1.5426025390625, 1.647125244140625, 1.75164794921875, 1.856170654296875, 1.960693359375, 2.065216064453125, 2.16973876953125, 2.274261474609375, 2.3787841796875, 2.483306884765625, 2.58782958984375, 2.692352294921875, 2.796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 6.0, 12.0, 7.0, 16.0, 29.0, 28.0, 38.0, 38.0, 59.0, 66.0, 67.0, 68.0, 75.0, 81.0, 76.0, 69.0, 49.0, 48.0, 32.0, 32.0, 14.0, 16.0, 23.0, 16.0, 9.0, 12.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002593994140625, -0.00025214627385139465, -0.0002448931336402893, -0.00023763999342918396, -0.0002303868532180786, -0.00022313371300697327, -0.00021588057279586792, -0.00020862743258476257, -0.00020137429237365723, -0.00019412115216255188, -0.00018686801195144653, -0.0001796148717403412, -0.00017236173152923584, -0.0001651085913181305, -0.00015785545110702515, -0.0001506023108959198, -0.00014334917068481445, -0.0001360960304737091, -0.00012884289026260376, -0.00012158975005149841, -0.00011433660984039307, -0.00010708346962928772, -9.983032941818237e-05, -9.257718920707703e-05, -8.532404899597168e-05, -7.807090878486633e-05, -7.081776857376099e-05, -6.356462836265564e-05, -5.631148815155029e-05, -4.9058347940444946e-05, -4.18052077293396e-05, -3.455206751823425e-05, -2.7298927307128906e-05, -2.004578709602356e-05, -1.2792646884918213e-05, -5.539506673812866e-06, 1.7136335372924805e-06, 8.966773748397827e-06, 1.6219913959503174e-05, 2.347305417060852e-05, 3.072619438171387e-05, 3.7979334592819214e-05, 4.523247480392456e-05, 5.248561501502991e-05, 5.9738755226135254e-05, 6.69918954372406e-05, 7.424503564834595e-05, 8.14981758594513e-05, 8.875131607055664e-05, 9.600445628166199e-05, 0.00010325759649276733, 0.00011051073670387268, 0.00011776387691497803, 0.00012501701712608337, 0.00013227015733718872, 0.00013952329754829407, 0.00014677643775939941, 0.00015402957797050476, 0.0001612827181816101, 0.00016853585839271545, 0.0001757889986038208, 0.00018304213881492615, 0.0001902952790260315, 0.00019754841923713684, 0.0002048015594482422]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 18.0, 18.0, 24.0, 28.0, 46.0, 56.0, 93.0, 141.0, 187.0, 287.0, 454.0, 679.0, 1056.0, 1744.0, 2793.0, 4808.0, 8116.0, 13860.0, 24592.0, 43747.0, 78082.0, 130524.0, 186441.0, 195446.0, 146644.0, 89654.0, 51224.0, 28324.0, 16046.0, 9287.0, 5340.0, 3280.0, 2061.0, 1233.0, 783.0, 479.0, 316.0, 221.0, 119.0, 105.0, 59.0, 41.0, 28.0, 28.0, 18.0, 6.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.599609375, -2.5234375, -2.447265625, -2.37109375, -2.294921875, -2.21875, -2.142578125, -2.06640625, -1.990234375, -1.9140625, -1.837890625, -1.76171875, -1.685546875, -1.609375, -1.533203125, -1.45703125, -1.380859375, -1.3046875, -1.228515625, -1.15234375, -1.076171875, -1.0, -0.923828125, -0.84765625, -0.771484375, -0.6953125, -0.619140625, -0.54296875, -0.466796875, -0.390625, -0.314453125, -0.23828125, -0.162109375, -0.0859375, -0.009765625, 0.06640625, 0.142578125, 0.21875, 0.294921875, 0.37109375, 0.447265625, 0.5234375, 0.599609375, 0.67578125, 0.751953125, 0.828125, 0.904296875, 0.98046875, 1.056640625, 1.1328125, 1.208984375, 1.28515625, 1.361328125, 1.4375, 1.513671875, 1.58984375, 1.666015625, 1.7421875, 1.818359375, 1.89453125, 1.970703125, 2.046875, 2.123046875, 2.19921875, 2.275390625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 3.0, 8.0, 8.0, 14.0, 10.0, 11.0, 9.0, 13.0, 20.0, 28.0, 15.0, 25.0, 25.0, 39.0, 33.0, 34.0, 48.0, 42.0, 38.0, 49.0, 50.0, 56.0, 50.0, 45.0, 50.0, 29.0, 36.0, 29.0, 23.0, 18.0, 22.0, 20.0, 11.0, 7.0, 7.0, 11.0, 13.0, 4.0, 3.0, 13.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.477783203125, -0.4606971740722656, -0.44361114501953125, -0.4265251159667969, -0.4094390869140625, -0.3923530578613281, -0.37526702880859375, -0.3581809997558594, -0.341094970703125, -0.3240089416503906, -0.30692291259765625, -0.2898368835449219, -0.2727508544921875, -0.2556648254394531, -0.23857879638671875, -0.22149276733398438, -0.20440673828125, -0.18732070922851562, -0.17023468017578125, -0.15314865112304688, -0.1360626220703125, -0.11897659301757812, -0.10189056396484375, -0.08480453491210938, -0.067718505859375, -0.050632476806640625, -0.03354644775390625, -0.016460418701171875, 0.0006256103515625, 0.017711639404296875, 0.03479766845703125, 0.051883697509765625, 0.0689697265625, 0.08605575561523438, 0.10314178466796875, 0.12022781372070312, 0.1373138427734375, 0.15439987182617188, 0.17148590087890625, 0.18857192993164062, 0.205657958984375, 0.22274398803710938, 0.23983001708984375, 0.2569160461425781, 0.2740020751953125, 0.2910881042480469, 0.30817413330078125, 0.3252601623535156, 0.34234619140625, 0.3594322204589844, 0.37651824951171875, 0.3936042785644531, 0.4106903076171875, 0.4277763366699219, 0.44486236572265625, 0.4619483947753906, 0.479034423828125, 0.4961204528808594, 0.5132064819335938, 0.5302925109863281, 0.5473785400390625, 0.5644645690917969, 0.5815505981445312, 0.5986366271972656, 0.61572265625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 8.0, 16.0, 22.0, 32.0, 30.0, 29.0, 58.0, 79.0, 100.0, 100.0, 99.0, 103.0, 92.0, 43.0, 51.0, 32.0, 24.0, 17.0, 10.0, 8.0, 9.0, 5.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.03840446472168, -27.26146125793457, -26.48451805114746, -25.70757484436035, -24.930631637573242, -24.153688430786133, -23.37674331665039, -22.59980010986328, -21.822856903076172, -21.045913696289062, -20.268970489501953, -19.492027282714844, -18.715084075927734, -17.938140869140625, -17.161197662353516, -16.384254455566406, -15.607311248779297, -14.830368041992188, -14.053424835205078, -13.276481628417969, -12.49953842163086, -11.72259521484375, -10.945651054382324, -10.168707847595215, -9.391764640808105, -8.614821434020996, -7.837878227233887, -7.060934543609619, -6.28399133682251, -5.5070481300354, -4.730104446411133, -3.9531612396240234, -3.176219940185547, -2.3992767333984375, -1.622333288192749, -0.8453898429870605, -0.06844663619995117, 0.7084965705871582, 1.4854402542114258, 2.262383460998535, 3.0393266677856445, 3.816269874572754, 4.593213081359863, 5.370156764984131, 6.14709997177124, 6.92404317855835, 7.700986862182617, 8.477930068969727, 9.254873275756836, 10.031816482543945, 10.808759689331055, 11.585702896118164, 12.362646102905273, 13.139589309692383, 13.916533470153809, 14.693476676940918, 15.470419883728027, 16.247364044189453, 17.024307250976562, 17.801250457763672, 18.57819366455078, 19.35513687133789, 20.132080078125, 20.90902328491211, 21.68596649169922]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 9.0, 4.0, 8.0, 16.0, 7.0, 13.0, 13.0, 27.0, 28.0, 23.0, 20.0, 23.0, 26.0, 43.0, 47.0, 45.0, 35.0, 52.0, 51.0, 39.0, 51.0, 39.0, 51.0, 44.0, 40.0, 40.0, 23.0, 31.0, 24.0, 30.0, 30.0, 14.0, 12.0, 9.0, 11.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.641823768615723, -9.352274894714355, -9.062726020812988, -8.773177146911621, -8.483628273010254, -8.194079399108887, -7.904531002044678, -7.6149821281433105, -7.325433254241943, -7.035884380340576, -6.746335506439209, -6.456786632537842, -6.167238235473633, -5.877689361572266, -5.588140487670898, -5.298591613769531, -5.009042739868164, -4.719493865966797, -4.42994499206543, -4.1403961181640625, -3.8508474826812744, -3.5612986087799072, -3.271749973297119, -2.982201099395752, -2.6926522254943848, -2.4031033515930176, -2.1135544776916504, -1.8240058422088623, -1.5344569683074951, -1.244908094406128, -0.9553593397140503, -0.6658105850219727, -0.3762626647949219, -0.08671385049819946, 0.20283496379852295, 0.49238377809524536, 0.7819325923919678, 1.071481466293335, 1.3610302209854126, 1.6505789756774902, 1.9401278495788574, 2.2296767234802246, 2.519225597381592, 2.80877423286438, 3.098323106765747, 3.3878719806671143, 3.6774206161499023, 3.9669694900512695, 4.256518363952637, 4.546067237854004, 4.835616111755371, 5.125164985656738, 5.4147138595581055, 5.704262733459473, 5.993811130523682, 6.283360004425049, 6.572908878326416, 6.862457752227783, 7.15200662612915, 7.441555500030518, 7.731103897094727, 8.020652770996094, 8.310201644897461, 8.599750518798828, 8.889299392700195]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 12.0, 7.0, 15.0, 27.0, 30.0, 40.0, 64.0, 93.0, 139.0, 182.0, 301.0, 451.0, 693.0, 1084.0, 1605.0, 2479.0, 3905.0, 6266.0, 10201.0, 17068.0, 27889.0, 44955.0, 70278.0, 105351.0, 142008.0, 160607.0, 145726.0, 109481.0, 73783.0, 47446.0, 29269.0, 17934.0, 10816.0, 6698.0, 4210.0, 2627.0, 1639.0, 1074.0, 674.0, 468.0, 316.0, 211.0, 120.0, 90.0, 72.0, 52.0, 28.0, 26.0, 18.0, 11.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0], "bins": [-11.21875, -10.8843994140625, -10.550048828125, -10.2156982421875, -9.88134765625, -9.5469970703125, -9.212646484375, -8.8782958984375, -8.5439453125, -8.2095947265625, -7.875244140625, -7.5408935546875, -7.20654296875, -6.8721923828125, -6.537841796875, -6.2034912109375, -5.869140625, -5.5347900390625, -5.200439453125, -4.8660888671875, -4.53173828125, -4.1973876953125, -3.863037109375, -3.5286865234375, -3.1943359375, -2.8599853515625, -2.525634765625, -2.1912841796875, -1.85693359375, -1.5225830078125, -1.188232421875, -0.8538818359375, -0.51953125, -0.1851806640625, 0.149169921875, 0.4835205078125, 0.81787109375, 1.1522216796875, 1.486572265625, 1.8209228515625, 2.1552734375, 2.4896240234375, 2.823974609375, 3.1583251953125, 3.49267578125, 3.8270263671875, 4.161376953125, 4.4957275390625, 4.830078125, 5.1644287109375, 5.498779296875, 5.8331298828125, 6.16748046875, 6.5018310546875, 6.836181640625, 7.1705322265625, 7.5048828125, 7.8392333984375, 8.173583984375, 8.5079345703125, 8.84228515625, 9.1766357421875, 9.510986328125, 9.8453369140625, 10.1796875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 6.0, 9.0, 9.0, 15.0, 15.0, 21.0, 18.0, 18.0, 14.0, 29.0, 31.0, 44.0, 42.0, 40.0, 32.0, 46.0, 43.0, 56.0, 58.0, 42.0, 42.0, 40.0, 34.0, 32.0, 33.0, 28.0, 31.0, 36.0, 20.0, 21.0, 20.0, 16.0, 9.0, 12.0, 4.0, 6.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8671875, -9.5587158203125, -9.250244140625, -8.9417724609375, -8.63330078125, -8.3248291015625, -8.016357421875, -7.7078857421875, -7.3994140625, -7.0909423828125, -6.782470703125, -6.4739990234375, -6.16552734375, -5.8570556640625, -5.548583984375, -5.2401123046875, -4.931640625, -4.6231689453125, -4.314697265625, -4.0062255859375, -3.69775390625, -3.3892822265625, -3.080810546875, -2.7723388671875, -2.4638671875, -2.1553955078125, -1.846923828125, -1.5384521484375, -1.22998046875, -0.9215087890625, -0.613037109375, -0.3045654296875, 0.00390625, 0.3123779296875, 0.620849609375, 0.9293212890625, 1.23779296875, 1.5462646484375, 1.854736328125, 2.1632080078125, 2.4716796875, 2.7801513671875, 3.088623046875, 3.3970947265625, 3.70556640625, 4.0140380859375, 4.322509765625, 4.6309814453125, 4.939453125, 5.2479248046875, 5.556396484375, 5.8648681640625, 6.17333984375, 6.4818115234375, 6.790283203125, 7.0987548828125, 7.4072265625, 7.7156982421875, 8.024169921875, 8.3326416015625, 8.64111328125, 8.9495849609375, 9.258056640625, 9.5665283203125, 9.875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 12.0, 7.0, 14.0, 16.0, 31.0, 39.0, 68.0, 118.0, 171.0, 285.0, 452.0, 671.0, 1183.0, 2034.0, 3446.0, 6058.0, 10641.0, 19299.0, 34190.0, 59740.0, 99504.0, 147613.0, 180085.0, 169759.0, 125797.0, 80045.0, 46706.0, 26137.0, 14771.0, 8109.0, 4645.0, 2733.0, 1651.0, 935.0, 599.0, 356.0, 219.0, 143.0, 90.0, 65.0, 43.0, 29.0, 19.0, 14.0, 6.0, 4.0, 3.0, 1.0, 2.0], "bins": [-14.8984375, -14.5040283203125, -14.109619140625, -13.7152099609375, -13.32080078125, -12.9263916015625, -12.531982421875, -12.1375732421875, -11.7431640625, -11.3487548828125, -10.954345703125, -10.5599365234375, -10.16552734375, -9.7711181640625, -9.376708984375, -8.9822998046875, -8.587890625, -8.1934814453125, -7.799072265625, -7.4046630859375, -7.01025390625, -6.6158447265625, -6.221435546875, -5.8270263671875, -5.4326171875, -5.0382080078125, -4.643798828125, -4.2493896484375, -3.85498046875, -3.4605712890625, -3.066162109375, -2.6717529296875, -2.27734375, -1.8829345703125, -1.488525390625, -1.0941162109375, -0.69970703125, -0.3052978515625, 0.089111328125, 0.4835205078125, 0.8779296875, 1.2723388671875, 1.666748046875, 2.0611572265625, 2.45556640625, 2.8499755859375, 3.244384765625, 3.6387939453125, 4.033203125, 4.4276123046875, 4.822021484375, 5.2164306640625, 5.61083984375, 6.0052490234375, 6.399658203125, 6.7940673828125, 7.1884765625, 7.5828857421875, 7.977294921875, 8.3717041015625, 8.76611328125, 9.1605224609375, 9.554931640625, 9.9493408203125, 10.34375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 4.0, 5.0, 9.0, 6.0, 9.0, 12.0, 14.0, 15.0, 17.0, 20.0, 32.0, 22.0, 22.0, 27.0, 29.0, 34.0, 42.0, 45.0, 43.0, 37.0, 53.0, 26.0, 39.0, 36.0, 49.0, 45.0, 31.0, 25.0, 28.0, 35.0, 31.0, 27.0, 30.0, 18.0, 21.0, 9.0, 6.0, 9.0, 10.0, 6.0, 8.0, 4.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.140625, -4.9735107421875, -4.806396484375, -4.6392822265625, -4.47216796875, -4.3050537109375, -4.137939453125, -3.9708251953125, -3.8037109375, -3.6365966796875, -3.469482421875, -3.3023681640625, -3.13525390625, -2.9681396484375, -2.801025390625, -2.6339111328125, -2.466796875, -2.2996826171875, -2.132568359375, -1.9654541015625, -1.79833984375, -1.6312255859375, -1.464111328125, -1.2969970703125, -1.1298828125, -0.9627685546875, -0.795654296875, -0.6285400390625, -0.46142578125, -0.2943115234375, -0.127197265625, 0.0399169921875, 0.20703125, 0.3741455078125, 0.541259765625, 0.7083740234375, 0.87548828125, 1.0426025390625, 1.209716796875, 1.3768310546875, 1.5439453125, 1.7110595703125, 1.878173828125, 2.0452880859375, 2.21240234375, 2.3795166015625, 2.546630859375, 2.7137451171875, 2.880859375, 3.0479736328125, 3.215087890625, 3.3822021484375, 3.54931640625, 3.7164306640625, 3.883544921875, 4.0506591796875, 4.2177734375, 4.3848876953125, 4.552001953125, 4.7191162109375, 4.88623046875, 5.0533447265625, 5.220458984375, 5.3875732421875, 5.5546875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 9.0, 8.0, 15.0, 30.0, 46.0, 65.0, 105.0, 112.0, 193.0, 281.0, 468.0, 745.0, 1080.0, 1677.0, 2725.0, 4547.0, 7626.0, 13142.0, 23409.0, 42881.0, 81503.0, 147718.0, 218323.0, 206998.0, 132915.0, 72534.0, 38669.0, 20974.0, 11828.0, 6904.0, 4148.0, 2441.0, 1577.0, 1002.0, 599.0, 456.0, 247.0, 191.0, 114.0, 92.0, 54.0, 46.0, 19.0, 11.0, 10.0, 9.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.1649169921875, -4.997802734375, -4.8306884765625, -4.66357421875, -4.4964599609375, -4.329345703125, -4.1622314453125, -3.9951171875, -3.8280029296875, -3.660888671875, -3.4937744140625, -3.32666015625, -3.1595458984375, -2.992431640625, -2.8253173828125, -2.658203125, -2.4910888671875, -2.323974609375, -2.1568603515625, -1.98974609375, -1.8226318359375, -1.655517578125, -1.4884033203125, -1.3212890625, -1.1541748046875, -0.987060546875, -0.8199462890625, -0.65283203125, -0.4857177734375, -0.318603515625, -0.1514892578125, 0.015625, 0.1827392578125, 0.349853515625, 0.5169677734375, 0.68408203125, 0.8511962890625, 1.018310546875, 1.1854248046875, 1.3525390625, 1.5196533203125, 1.686767578125, 1.8538818359375, 2.02099609375, 2.1881103515625, 2.355224609375, 2.5223388671875, 2.689453125, 2.8565673828125, 3.023681640625, 3.1907958984375, 3.35791015625, 3.5250244140625, 3.692138671875, 3.8592529296875, 4.0263671875, 4.1934814453125, 4.360595703125, 4.5277099609375, 4.69482421875, 4.8619384765625, 5.029052734375, 5.1961669921875, 5.36328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 3.0, 9.0, 9.0, 18.0, 17.0, 21.0, 27.0, 28.0, 39.0, 46.0, 55.0, 67.0, 74.0, 60.0, 71.0, 65.0, 57.0, 65.0, 46.0, 41.0, 34.0, 15.0, 20.0, 21.0, 20.0, 8.0, 9.0, 13.0, 5.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004773139953613281, -0.000460110604763031, -0.0004429072141647339, -0.00042570382356643677, -0.00040850043296813965, -0.00039129704236984253, -0.0003740936517715454, -0.0003568902611732483, -0.00033968687057495117, -0.00032248347997665405, -0.00030528008937835693, -0.0002880766987800598, -0.0002708733081817627, -0.0002536699175834656, -0.00023646652698516846, -0.00021926313638687134, -0.00020205974578857422, -0.0001848563551902771, -0.00016765296459197998, -0.00015044957399368286, -0.00013324618339538574, -0.00011604279279708862, -9.88394021987915e-05, -8.163601160049438e-05, -6.443262100219727e-05, -4.7229230403900146e-05, -3.0025839805603027e-05, -1.2822449207305908e-05, 4.380941390991211e-06, 2.158433198928833e-05, 3.878772258758545e-05, 5.599111318588257e-05, 7.319450378417969e-05, 9.03978943824768e-05, 0.00010760128498077393, 0.00012480467557907104, 0.00014200806617736816, 0.00015921145677566528, 0.0001764148473739624, 0.00019361823797225952, 0.00021082162857055664, 0.00022802501916885376, 0.0002452284097671509, 0.000262431800365448, 0.0002796351909637451, 0.00029683858156204224, 0.00031404197216033936, 0.0003312453627586365, 0.0003484487533569336, 0.0003656521439552307, 0.00038285553455352783, 0.00040005892515182495, 0.00041726231575012207, 0.0004344657063484192, 0.0004516690969467163, 0.00046887248754501343, 0.00048607587814331055, 0.0005032792687416077, 0.0005204826593399048, 0.0005376860499382019, 0.000554889440536499, 0.0005720928311347961, 0.0005892962217330933, 0.0006064996123313904, 0.0006237030029296875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 7.0, 8.0, 7.0, 14.0, 17.0, 16.0, 36.0, 48.0, 74.0, 113.0, 148.0, 204.0, 296.0, 425.0, 625.0, 895.0, 1336.0, 1959.0, 2927.0, 4640.0, 7194.0, 11654.0, 18945.0, 32408.0, 55556.0, 93714.0, 149239.0, 192570.0, 174409.0, 119690.0, 72102.0, 41991.0, 24599.0, 14679.0, 9102.0, 5837.0, 3668.0, 2413.0, 1617.0, 1140.0, 697.0, 463.0, 343.0, 204.0, 156.0, 105.0, 91.0, 45.0, 46.0, 16.0, 18.0, 20.0, 7.0, 15.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-4.58203125, -4.43768310546875, -4.2933349609375, -4.14898681640625, -4.004638671875, -3.86029052734375, -3.7159423828125, -3.57159423828125, -3.42724609375, -3.28289794921875, -3.1385498046875, -2.99420166015625, -2.849853515625, -2.70550537109375, -2.5611572265625, -2.41680908203125, -2.2724609375, -2.12811279296875, -1.9837646484375, -1.83941650390625, -1.695068359375, -1.55072021484375, -1.4063720703125, -1.26202392578125, -1.11767578125, -0.97332763671875, -0.8289794921875, -0.68463134765625, -0.540283203125, -0.39593505859375, -0.2515869140625, -0.10723876953125, 0.037109375, 0.18145751953125, 0.3258056640625, 0.47015380859375, 0.614501953125, 0.75885009765625, 0.9031982421875, 1.04754638671875, 1.19189453125, 1.33624267578125, 1.4805908203125, 1.62493896484375, 1.769287109375, 1.91363525390625, 2.0579833984375, 2.20233154296875, 2.3466796875, 2.49102783203125, 2.6353759765625, 2.77972412109375, 2.924072265625, 3.06842041015625, 3.2127685546875, 3.35711669921875, 3.50146484375, 3.64581298828125, 3.7901611328125, 3.93450927734375, 4.078857421875, 4.22320556640625, 4.3675537109375, 4.51190185546875, 4.65625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 11.0, 13.0, 18.0, 16.0, 11.0, 15.0, 20.0, 26.0, 39.0, 29.0, 48.0, 48.0, 49.0, 62.0, 64.0, 59.0, 46.0, 52.0, 68.0, 41.0, 37.0, 33.0, 25.0, 17.0, 29.0, 21.0, 14.0, 10.0, 11.0, 11.0, 9.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.7060546875, -1.658447265625, -1.61083984375, -1.563232421875, -1.515625, -1.468017578125, -1.42041015625, -1.372802734375, -1.3251953125, -1.277587890625, -1.22998046875, -1.182373046875, -1.134765625, -1.087158203125, -1.03955078125, -0.991943359375, -0.9443359375, -0.896728515625, -0.84912109375, -0.801513671875, -0.75390625, -0.706298828125, -0.65869140625, -0.611083984375, -0.5634765625, -0.515869140625, -0.46826171875, -0.420654296875, -0.373046875, -0.325439453125, -0.27783203125, -0.230224609375, -0.1826171875, -0.135009765625, -0.08740234375, -0.039794921875, 0.0078125, 0.055419921875, 0.10302734375, 0.150634765625, 0.1982421875, 0.245849609375, 0.29345703125, 0.341064453125, 0.388671875, 0.436279296875, 0.48388671875, 0.531494140625, 0.5791015625, 0.626708984375, 0.67431640625, 0.721923828125, 0.76953125, 0.817138671875, 0.86474609375, 0.912353515625, 0.9599609375, 1.007568359375, 1.05517578125, 1.102783203125, 1.150390625, 1.197998046875, 1.24560546875, 1.293212890625, 1.3408203125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 6.0, 7.0, 17.0, 25.0, 16.0, 27.0, 35.0, 40.0, 61.0, 81.0, 88.0, 99.0, 90.0, 80.0, 67.0, 58.0, 49.0, 25.0, 30.0, 14.0, 20.0, 6.0, 7.0, 8.0, 9.0, 3.0, 3.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.686668395996094, -23.007476806640625, -22.328285217285156, -21.649091720581055, -20.969900131225586, -20.290708541870117, -19.611515045166016, -18.932323455810547, -18.253131866455078, -17.57394027709961, -16.89474868774414, -16.21555519104004, -15.53636360168457, -14.857172012329102, -14.177979469299316, -13.498786926269531, -12.819595336914062, -12.140403747558594, -11.461211204528809, -10.782018661499023, -10.102827072143555, -9.423635482788086, -8.7444429397583, -8.065250396728516, -7.386058807373047, -6.70686674118042, -6.027674674987793, -5.348482608795166, -4.669290542602539, -3.990098476409912, -3.310906410217285, -2.631714344024658, -1.9525203704833984, -1.2733283042907715, -0.5941362380981445, 0.08505582809448242, 0.7642478942871094, 1.4434399604797363, 2.1226320266723633, 2.8018240928649902, 3.481016159057617, 4.160208225250244, 4.839400291442871, 5.518592357635498, 6.197784423828125, 6.876976490020752, 7.556168556213379, 8.235361099243164, 8.914552688598633, 9.593744277954102, 10.272936820983887, 10.952129364013672, 11.63132095336914, 12.31051254272461, 12.989705085754395, 13.66889762878418, 14.348089218139648, 15.027280807495117, 15.706473350524902, 16.385665893554688, 17.064857482910156, 17.744049072265625, 18.423240661621094, 19.102434158325195, 19.781625747680664]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 4.0, 0.0, 4.0, 5.0, 14.0, 11.0, 14.0, 20.0, 19.0, 15.0, 22.0, 20.0, 17.0, 22.0, 30.0, 34.0, 36.0, 36.0, 42.0, 36.0, 45.0, 34.0, 52.0, 45.0, 35.0, 36.0, 37.0, 33.0, 38.0, 43.0, 22.0, 23.0, 28.0, 21.0, 24.0, 11.0, 16.0, 7.0, 12.0, 9.0, 5.0, 7.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-9.297547340393066, -9.032727241516113, -8.76790714263916, -8.50308609008789, -8.238265991210938, -7.973445892333984, -7.708625793457031, -7.44380521774292, -7.178984642028809, -6.9141645431518555, -6.649343967437744, -6.384523868560791, -6.11970329284668, -5.854883193969727, -5.590063095092773, -5.325242519378662, -5.060422420501709, -4.795602321624756, -4.5307817459106445, -4.265961647033691, -4.00114107131958, -3.736320972442627, -3.4715006351470947, -3.2066802978515625, -2.9418599605560303, -2.677039623260498, -2.412219285964966, -2.1473989486694336, -1.882578730583191, -1.6177583932876587, -1.352938175201416, -1.0881178379058838, -0.8232970237731934, -0.5584766864776611, -0.2936564087867737, -0.02883613109588623, 0.235984206199646, 0.5008045434951782, 0.7656247615814209, 1.0304450988769531, 1.2952654361724854, 1.5600857734680176, 1.8249061107635498, 2.089726448059082, 2.354546546936035, 2.6193671226501465, 2.8841872215270996, 3.149007558822632, 3.413827896118164, 3.6786482334136963, 3.9434685707092285, 4.208288669586182, 4.473109245300293, 4.737929344177246, 5.002749443054199, 5.2675700187683105, 5.532390594482422, 5.797210693359375, 6.062031269073486, 6.3268513679504395, 6.591671943664551, 6.856492042541504, 7.121312141418457, 7.386132717132568, 7.6509528160095215]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 12.0, 8.0, 17.0, 23.0, 41.0, 70.0, 119.0, 170.0, 288.0, 477.0, 720.0, 1336.0, 2351.0, 4611.0, 8922.0, 18858.0, 43168.0, 110209.0, 327936.0, 1085977.0, 1625663.0, 637327.0, 195985.0, 70854.0, 29499.0, 13714.0, 6708.0, 3741.0, 2057.0, 1240.0, 791.0, 457.0, 288.0, 183.0, 151.0, 94.0, 63.0, 41.0, 38.0, 18.0, 14.0, 15.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.609375, -17.927001953125, -17.24462890625, -16.562255859375, -15.8798828125, -15.197509765625, -14.51513671875, -13.832763671875, -13.150390625, -12.468017578125, -11.78564453125, -11.103271484375, -10.4208984375, -9.738525390625, -9.05615234375, -8.373779296875, -7.69140625, -7.009033203125, -6.32666015625, -5.644287109375, -4.9619140625, -4.279541015625, -3.59716796875, -2.914794921875, -2.232421875, -1.550048828125, -0.86767578125, -0.185302734375, 0.4970703125, 1.179443359375, 1.86181640625, 2.544189453125, 3.2265625, 3.908935546875, 4.59130859375, 5.273681640625, 5.9560546875, 6.638427734375, 7.32080078125, 8.003173828125, 8.685546875, 9.367919921875, 10.05029296875, 10.732666015625, 11.4150390625, 12.097412109375, 12.77978515625, 13.462158203125, 14.14453125, 14.826904296875, 15.50927734375, 16.191650390625, 16.8740234375, 17.556396484375, 18.23876953125, 18.921142578125, 19.603515625, 20.285888671875, 20.96826171875, 21.650634765625, 22.3330078125, 23.015380859375, 23.69775390625, 24.380126953125, 25.0625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 4.0, 7.0, 6.0, 13.0, 23.0, 12.0, 16.0, 25.0, 20.0, 23.0, 28.0, 34.0, 35.0, 39.0, 38.0, 43.0, 46.0, 54.0, 47.0, 33.0, 49.0, 47.0, 25.0, 39.0, 43.0, 30.0, 39.0, 27.0, 25.0, 28.0, 18.0, 10.0, 17.0, 12.0, 8.0, 6.0, 7.0, 8.0, 3.0, 5.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.54296875, -7.31884765625, -7.0947265625, -6.87060546875, -6.646484375, -6.42236328125, -6.1982421875, -5.97412109375, -5.75, -5.52587890625, -5.3017578125, -5.07763671875, -4.853515625, -4.62939453125, -4.4052734375, -4.18115234375, -3.95703125, -3.73291015625, -3.5087890625, -3.28466796875, -3.060546875, -2.83642578125, -2.6123046875, -2.38818359375, -2.1640625, -1.93994140625, -1.7158203125, -1.49169921875, -1.267578125, -1.04345703125, -0.8193359375, -0.59521484375, -0.37109375, -0.14697265625, 0.0771484375, 0.30126953125, 0.525390625, 0.74951171875, 0.9736328125, 1.19775390625, 1.421875, 1.64599609375, 1.8701171875, 2.09423828125, 2.318359375, 2.54248046875, 2.7666015625, 2.99072265625, 3.21484375, 3.43896484375, 3.6630859375, 3.88720703125, 4.111328125, 4.33544921875, 4.5595703125, 4.78369140625, 5.0078125, 5.23193359375, 5.4560546875, 5.68017578125, 5.904296875, 6.12841796875, 6.3525390625, 6.57666015625, 6.80078125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 8.0, 7.0, 18.0, 17.0, 24.0, 46.0, 63.0, 84.0, 171.0, 231.0, 316.0, 472.0, 742.0, 1210.0, 1916.0, 2924.0, 4823.0, 8046.0, 13706.0, 24076.0, 44035.0, 85632.0, 176346.0, 383234.0, 816585.0, 1186880.0, 754978.0, 349520.0, 161950.0, 79347.0, 41379.0, 22513.0, 12708.0, 7594.0, 4516.0, 2915.0, 1762.0, 1204.0, 768.0, 486.0, 343.0, 216.0, 162.0, 103.0, 72.0, 45.0, 33.0, 24.0, 12.0, 14.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-17.734375, -17.2041015625, -16.673828125, -16.1435546875, -15.61328125, -15.0830078125, -14.552734375, -14.0224609375, -13.4921875, -12.9619140625, -12.431640625, -11.9013671875, -11.37109375, -10.8408203125, -10.310546875, -9.7802734375, -9.25, -8.7197265625, -8.189453125, -7.6591796875, -7.12890625, -6.5986328125, -6.068359375, -5.5380859375, -5.0078125, -4.4775390625, -3.947265625, -3.4169921875, -2.88671875, -2.3564453125, -1.826171875, -1.2958984375, -0.765625, -0.2353515625, 0.294921875, 0.8251953125, 1.35546875, 1.8857421875, 2.416015625, 2.9462890625, 3.4765625, 4.0068359375, 4.537109375, 5.0673828125, 5.59765625, 6.1279296875, 6.658203125, 7.1884765625, 7.71875, 8.2490234375, 8.779296875, 9.3095703125, 9.83984375, 10.3701171875, 10.900390625, 11.4306640625, 11.9609375, 12.4912109375, 13.021484375, 13.5517578125, 14.08203125, 14.6123046875, 15.142578125, 15.6728515625, 16.203125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 8.0, 7.0, 11.0, 13.0, 19.0, 28.0, 30.0, 38.0, 44.0, 55.0, 68.0, 93.0, 121.0, 154.0, 190.0, 219.0, 288.0, 311.0, 348.0, 334.0, 302.0, 248.0, 241.0, 190.0, 137.0, 121.0, 86.0, 72.0, 60.0, 49.0, 42.0, 36.0, 21.0, 20.0, 10.0, 12.0, 15.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.86328125, -4.71044921875, -4.5576171875, -4.40478515625, -4.251953125, -4.09912109375, -3.9462890625, -3.79345703125, -3.640625, -3.48779296875, -3.3349609375, -3.18212890625, -3.029296875, -2.87646484375, -2.7236328125, -2.57080078125, -2.41796875, -2.26513671875, -2.1123046875, -1.95947265625, -1.806640625, -1.65380859375, -1.5009765625, -1.34814453125, -1.1953125, -1.04248046875, -0.8896484375, -0.73681640625, -0.583984375, -0.43115234375, -0.2783203125, -0.12548828125, 0.02734375, 0.18017578125, 0.3330078125, 0.48583984375, 0.638671875, 0.79150390625, 0.9443359375, 1.09716796875, 1.25, 1.40283203125, 1.5556640625, 1.70849609375, 1.861328125, 2.01416015625, 2.1669921875, 2.31982421875, 2.47265625, 2.62548828125, 2.7783203125, 2.93115234375, 3.083984375, 3.23681640625, 3.3896484375, 3.54248046875, 3.6953125, 3.84814453125, 4.0009765625, 4.15380859375, 4.306640625, 4.45947265625, 4.6123046875, 4.76513671875, 4.91796875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 11.0, 3.0, 13.0, 16.0, 31.0, 27.0, 53.0, 75.0, 91.0, 112.0, 116.0, 112.0, 87.0, 73.0, 35.0, 38.0, 30.0, 17.0, 12.0, 11.0, 10.0, 7.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-38.19105911254883, -37.31455612182617, -36.438053131103516, -35.561546325683594, -34.68504333496094, -33.80854034423828, -32.932037353515625, -32.05553436279297, -31.17902946472168, -30.302526473999023, -29.426021575927734, -28.549518585205078, -27.673015594482422, -26.796510696411133, -25.920007705688477, -25.043502807617188, -24.16699981689453, -23.290496826171875, -22.413991928100586, -21.53748893737793, -20.66098403930664, -19.784481048583984, -18.907978057861328, -18.031475067138672, -17.154970169067383, -16.278467178344727, -15.401962280273438, -14.525459289550781, -13.648955345153809, -12.772451400756836, -11.89594841003418, -11.019444465637207, -10.142940521240234, -9.266436576843262, -8.389932632446289, -7.513429641723633, -6.63692569732666, -5.7604217529296875, -4.883918285369873, -4.007414817810059, -3.130910873413086, -2.2544071674346924, -1.3779034614562988, -0.5013997554779053, 0.3751039505004883, 1.251607894897461, 2.1281113624572754, 3.00461483001709, 3.8811187744140625, 4.757622718811035, 5.63412618637085, 6.510629653930664, 7.387133598327637, 8.26363754272461, 9.140140533447266, 10.016644477844238, 10.893148422241211, 11.769652366638184, 12.646156311035156, 13.522659301757812, 14.399163246154785, 15.275667190551758, 16.152170181274414, 17.028675079345703, 17.90517807006836]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 7.0, 4.0, 10.0, 11.0, 8.0, 9.0, 10.0, 18.0, 17.0, 23.0, 19.0, 22.0, 27.0, 29.0, 31.0, 40.0, 48.0, 32.0, 34.0, 40.0, 49.0, 45.0, 36.0, 43.0, 38.0, 46.0, 35.0, 35.0, 26.0, 37.0, 35.0, 19.0, 17.0, 18.0, 17.0, 26.0, 7.0, 8.0, 7.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.3289213180542, -9.054272651672363, -8.779623031616211, -8.504974365234375, -8.230324745178223, -7.9556756019592285, -7.681026458740234, -7.406377792358398, -7.131728172302246, -6.857079029083252, -6.582429885864258, -6.307780742645264, -6.0331315994262695, -5.758482456207275, -5.483833312988281, -5.209184646606445, -4.934535503387451, -4.659886360168457, -4.385237216949463, -4.110588073730469, -3.8359389305114746, -3.5612897872924805, -3.2866408824920654, -3.0119917392730713, -2.737342596054077, -2.462693452835083, -2.188044309616089, -1.9133952856063843, -1.6387461423873901, -1.364096999168396, -1.0894479751586914, -0.8147988319396973, -0.5401496887207031, -0.26550057530403137, 0.00914853811264038, 0.28379762172698975, 0.5584467649459839, 0.833095908164978, 1.1077449321746826, 1.3823940753936768, 1.657043218612671, 1.931692361831665, 2.206341505050659, 2.480990409851074, 2.7556395530700684, 3.0302886962890625, 3.3049378395080566, 3.579586982727051, 3.854236125946045, 4.128885269165039, 4.403534412384033, 4.678183555603027, 4.9528326988220215, 5.227481842041016, 5.502130508422852, 5.776780128479004, 6.05142879486084, 6.326077938079834, 6.600727081298828, 6.875376224517822, 7.150025367736816, 7.4246745109558105, 7.699323654174805, 7.973972320556641, 8.248621940612793]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 10.0, 10.0, 14.0, 37.0, 53.0, 70.0, 120.0, 195.0, 305.0, 555.0, 1064.0, 2255.0, 5258.0, 15145.0, 50234.0, 176845.0, 413819.0, 266978.0, 79216.0, 22817.0, 7574.0, 2955.0, 1436.0, 653.0, 366.0, 214.0, 118.0, 80.0, 56.0, 40.0, 21.0, 12.0, 11.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.890625, -16.417236328125, -15.94384765625, -15.470458984375, -14.9970703125, -14.523681640625, -14.05029296875, -13.576904296875, -13.103515625, -12.630126953125, -12.15673828125, -11.683349609375, -11.2099609375, -10.736572265625, -10.26318359375, -9.789794921875, -9.31640625, -8.843017578125, -8.36962890625, -7.896240234375, -7.4228515625, -6.949462890625, -6.47607421875, -6.002685546875, -5.529296875, -5.055908203125, -4.58251953125, -4.109130859375, -3.6357421875, -3.162353515625, -2.68896484375, -2.215576171875, -1.7421875, -1.268798828125, -0.79541015625, -0.322021484375, 0.1513671875, 0.624755859375, 1.09814453125, 1.571533203125, 2.044921875, 2.518310546875, 2.99169921875, 3.465087890625, 3.9384765625, 4.411865234375, 4.88525390625, 5.358642578125, 5.83203125, 6.305419921875, 6.77880859375, 7.252197265625, 7.7255859375, 8.198974609375, 8.67236328125, 9.145751953125, 9.619140625, 10.092529296875, 10.56591796875, 11.039306640625, 11.5126953125, 11.986083984375, 12.45947265625, 12.932861328125, 13.40625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 3.0, 8.0, 7.0, 18.0, 12.0, 16.0, 13.0, 19.0, 30.0, 32.0, 42.0, 34.0, 60.0, 46.0, 53.0, 56.0, 52.0, 59.0, 65.0, 55.0, 56.0, 45.0, 37.0, 34.0, 24.0, 32.0, 20.0, 18.0, 14.0, 9.0, 13.0, 6.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-17.0625, -16.653076171875, -16.24365234375, -15.834228515625, -15.4248046875, -15.015380859375, -14.60595703125, -14.196533203125, -13.787109375, -13.377685546875, -12.96826171875, -12.558837890625, -12.1494140625, -11.739990234375, -11.33056640625, -10.921142578125, -10.51171875, -10.102294921875, -9.69287109375, -9.283447265625, -8.8740234375, -8.464599609375, -8.05517578125, -7.645751953125, -7.236328125, -6.826904296875, -6.41748046875, -6.008056640625, -5.5986328125, -5.189208984375, -4.77978515625, -4.370361328125, -3.9609375, -3.551513671875, -3.14208984375, -2.732666015625, -2.3232421875, -1.913818359375, -1.50439453125, -1.094970703125, -0.685546875, -0.276123046875, 0.13330078125, 0.542724609375, 0.9521484375, 1.361572265625, 1.77099609375, 2.180419921875, 2.58984375, 2.999267578125, 3.40869140625, 3.818115234375, 4.2275390625, 4.636962890625, 5.04638671875, 5.455810546875, 5.865234375, 6.274658203125, 6.68408203125, 7.093505859375, 7.5029296875, 7.912353515625, 8.32177734375, 8.731201171875, 9.140625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 5.0, 5.0, 6.0, 9.0, 15.0, 12.0, 20.0, 23.0, 49.0, 71.0, 107.0, 159.0, 351.0, 615.0, 1276.0, 2883.0, 7822.0, 24596.0, 98487.0, 404364.0, 381388.0, 90681.0, 22760.0, 7342.0, 2798.0, 1310.0, 629.0, 289.0, 171.0, 111.0, 72.0, 38.0, 27.0, 21.0, 9.0, 10.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.546875, -18.915771484375, -18.28466796875, -17.653564453125, -17.0224609375, -16.391357421875, -15.76025390625, -15.129150390625, -14.498046875, -13.866943359375, -13.23583984375, -12.604736328125, -11.9736328125, -11.342529296875, -10.71142578125, -10.080322265625, -9.44921875, -8.818115234375, -8.18701171875, -7.555908203125, -6.9248046875, -6.293701171875, -5.66259765625, -5.031494140625, -4.400390625, -3.769287109375, -3.13818359375, -2.507080078125, -1.8759765625, -1.244873046875, -0.61376953125, 0.017333984375, 0.6484375, 1.279541015625, 1.91064453125, 2.541748046875, 3.1728515625, 3.803955078125, 4.43505859375, 5.066162109375, 5.697265625, 6.328369140625, 6.95947265625, 7.590576171875, 8.2216796875, 8.852783203125, 9.48388671875, 10.114990234375, 10.74609375, 11.377197265625, 12.00830078125, 12.639404296875, 13.2705078125, 13.901611328125, 14.53271484375, 15.163818359375, 15.794921875, 16.426025390625, 17.05712890625, 17.688232421875, 18.3193359375, 18.950439453125, 19.58154296875, 20.212646484375, 20.84375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 6.0, 9.0, 11.0, 15.0, 14.0, 14.0, 18.0, 16.0, 19.0, 26.0, 30.0, 31.0, 49.0, 41.0, 46.0, 32.0, 44.0, 44.0, 43.0, 43.0, 43.0, 36.0, 51.0, 33.0, 40.0, 30.0, 29.0, 28.0, 21.0, 20.0, 24.0, 16.0, 9.0, 18.0, 13.0, 9.0, 5.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.671875, -6.48162841796875, -6.2913818359375, -6.10113525390625, -5.910888671875, -5.72064208984375, -5.5303955078125, -5.34014892578125, -5.14990234375, -4.95965576171875, -4.7694091796875, -4.57916259765625, -4.388916015625, -4.19866943359375, -4.0084228515625, -3.81817626953125, -3.6279296875, -3.43768310546875, -3.2474365234375, -3.05718994140625, -2.866943359375, -2.67669677734375, -2.4864501953125, -2.29620361328125, -2.10595703125, -1.91571044921875, -1.7254638671875, -1.53521728515625, -1.344970703125, -1.15472412109375, -0.9644775390625, -0.77423095703125, -0.583984375, -0.39373779296875, -0.2034912109375, -0.01324462890625, 0.177001953125, 0.36724853515625, 0.5574951171875, 0.74774169921875, 0.93798828125, 1.12823486328125, 1.3184814453125, 1.50872802734375, 1.698974609375, 1.88922119140625, 2.0794677734375, 2.26971435546875, 2.4599609375, 2.65020751953125, 2.8404541015625, 3.03070068359375, 3.220947265625, 3.41119384765625, 3.6014404296875, 3.79168701171875, 3.98193359375, 4.17218017578125, 4.3624267578125, 4.55267333984375, 4.742919921875, 4.93316650390625, 5.1234130859375, 5.31365966796875, 5.50390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 17.0, 15.0, 21.0, 27.0, 33.0, 68.0, 93.0, 143.0, 205.0, 307.0, 421.0, 689.0, 1165.0, 1896.0, 3400.0, 6954.0, 16396.0, 47058.0, 171195.0, 480213.0, 222109.0, 59135.0, 19661.0, 7926.0, 3963.0, 2142.0, 1207.0, 683.0, 449.0, 306.0, 220.0, 142.0, 92.0, 54.0, 42.0, 29.0, 22.0, 24.0, 11.0, 6.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.1656494140625, -5.964111328125, -5.7625732421875, -5.56103515625, -5.3594970703125, -5.157958984375, -4.9564208984375, -4.7548828125, -4.5533447265625, -4.351806640625, -4.1502685546875, -3.94873046875, -3.7471923828125, -3.545654296875, -3.3441162109375, -3.142578125, -2.9410400390625, -2.739501953125, -2.5379638671875, -2.33642578125, -2.1348876953125, -1.933349609375, -1.7318115234375, -1.5302734375, -1.3287353515625, -1.127197265625, -0.9256591796875, -0.72412109375, -0.5225830078125, -0.321044921875, -0.1195068359375, 0.08203125, 0.2835693359375, 0.485107421875, 0.6866455078125, 0.88818359375, 1.0897216796875, 1.291259765625, 1.4927978515625, 1.6943359375, 1.8958740234375, 2.097412109375, 2.2989501953125, 2.50048828125, 2.7020263671875, 2.903564453125, 3.1051025390625, 3.306640625, 3.5081787109375, 3.709716796875, 3.9112548828125, 4.11279296875, 4.3143310546875, 4.515869140625, 4.7174072265625, 4.9189453125, 5.1204833984375, 5.322021484375, 5.5235595703125, 5.72509765625, 5.9266357421875, 6.128173828125, 6.3297119140625, 6.53125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 10.0, 17.0, 27.0, 32.0, 55.0, 70.0, 90.0, 113.0, 109.0, 94.0, 77.0, 86.0, 57.0, 39.0, 37.0, 18.0, 9.0, 16.0, 14.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0005025863647460938, -0.0004896000027656555, -0.0004766136407852173, -0.00046362727880477905, -0.0004506409168243408, -0.0004376545548439026, -0.00042466819286346436, -0.0004116818308830261, -0.0003986954689025879, -0.00038570910692214966, -0.0003727227449417114, -0.0003597363829612732, -0.00034675002098083496, -0.00033376365900039673, -0.0003207772970199585, -0.00030779093503952026, -0.00029480457305908203, -0.0002818182110786438, -0.00026883184909820557, -0.00025584548711776733, -0.0002428591251373291, -0.00022987276315689087, -0.00021688640117645264, -0.0002039000391960144, -0.00019091367721557617, -0.00017792731523513794, -0.0001649409532546997, -0.00015195459127426147, -0.00013896822929382324, -0.000125981867313385, -0.00011299550533294678, -0.00010000914335250854, -8.702278137207031e-05, -7.403641939163208e-05, -6.105005741119385e-05, -4.8063695430755615e-05, -3.507733345031738e-05, -2.209097146987915e-05, -9.104609489440918e-06, 3.8817524909973145e-06, 1.6868114471435547e-05, 2.985447645187378e-05, 4.284083843231201e-05, 5.5827200412750244e-05, 6.881356239318848e-05, 8.179992437362671e-05, 9.478628635406494e-05, 0.00010777264833450317, 0.0001207590103149414, 0.00013374537229537964, 0.00014673173427581787, 0.0001597180962562561, 0.00017270445823669434, 0.00018569082021713257, 0.0001986771821975708, 0.00021166354417800903, 0.00022464990615844727, 0.0002376362681388855, 0.00025062263011932373, 0.00026360899209976196, 0.0002765953540802002, 0.00028958171606063843, 0.00030256807804107666, 0.0003155544400215149, 0.0003285408020019531]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 10.0, 12.0, 16.0, 20.0, 31.0, 30.0, 64.0, 75.0, 100.0, 150.0, 224.0, 275.0, 419.0, 539.0, 855.0, 1330.0, 2193.0, 3606.0, 6689.0, 15235.0, 40528.0, 129877.0, 357099.0, 318907.0, 107146.0, 34413.0, 13311.0, 6193.0, 3326.0, 1939.0, 1243.0, 818.0, 534.0, 388.0, 250.0, 227.0, 111.0, 87.0, 69.0, 66.0, 30.0, 33.0, 22.0, 21.0, 14.0, 8.0, 8.0, 2.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5390625, -5.35394287109375, -5.1688232421875, -4.98370361328125, -4.798583984375, -4.61346435546875, -4.4283447265625, -4.24322509765625, -4.05810546875, -3.87298583984375, -3.6878662109375, -3.50274658203125, -3.317626953125, -3.13250732421875, -2.9473876953125, -2.76226806640625, -2.5771484375, -2.39202880859375, -2.2069091796875, -2.02178955078125, -1.836669921875, -1.65155029296875, -1.4664306640625, -1.28131103515625, -1.09619140625, -0.91107177734375, -0.7259521484375, -0.54083251953125, -0.355712890625, -0.17059326171875, 0.0145263671875, 0.19964599609375, 0.384765625, 0.56988525390625, 0.7550048828125, 0.94012451171875, 1.125244140625, 1.31036376953125, 1.4954833984375, 1.68060302734375, 1.86572265625, 2.05084228515625, 2.2359619140625, 2.42108154296875, 2.606201171875, 2.79132080078125, 2.9764404296875, 3.16156005859375, 3.3466796875, 3.53179931640625, 3.7169189453125, 3.90203857421875, 4.087158203125, 4.27227783203125, 4.4573974609375, 4.64251708984375, 4.82763671875, 5.01275634765625, 5.1978759765625, 5.38299560546875, 5.568115234375, 5.75323486328125, 5.9383544921875, 6.12347412109375, 6.30859375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 9.0, 3.0, 11.0, 16.0, 38.0, 44.0, 95.0, 131.0, 168.0, 177.0, 112.0, 87.0, 51.0, 26.0, 11.0, 5.0, 5.0, 3.0, 2.0, 0.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.619140625, -2.54425048828125, -2.4693603515625, -2.39447021484375, -2.319580078125, -2.24468994140625, -2.1697998046875, -2.09490966796875, -2.02001953125, -1.94512939453125, -1.8702392578125, -1.79534912109375, -1.720458984375, -1.64556884765625, -1.5706787109375, -1.49578857421875, -1.4208984375, -1.34600830078125, -1.2711181640625, -1.19622802734375, -1.121337890625, -1.04644775390625, -0.9715576171875, -0.89666748046875, -0.82177734375, -0.74688720703125, -0.6719970703125, -0.59710693359375, -0.522216796875, -0.44732666015625, -0.3724365234375, -0.29754638671875, -0.22265625, -0.14776611328125, -0.0728759765625, 0.00201416015625, 0.076904296875, 0.15179443359375, 0.2266845703125, 0.30157470703125, 0.37646484375, 0.45135498046875, 0.5262451171875, 0.60113525390625, 0.676025390625, 0.75091552734375, 0.8258056640625, 0.90069580078125, 0.9755859375, 1.05047607421875, 1.1253662109375, 1.20025634765625, 1.275146484375, 1.35003662109375, 1.4249267578125, 1.49981689453125, 1.57470703125, 1.64959716796875, 1.7244873046875, 1.79937744140625, 1.874267578125, 1.94915771484375, 2.0240478515625, 2.09893798828125, 2.173828125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 9.0, 10.0, 22.0, 20.0, 41.0, 46.0, 89.0, 96.0, 115.0, 127.0, 106.0, 82.0, 63.0, 41.0, 37.0, 23.0, 13.0, 11.0, 11.0, 10.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-39.90776824951172, -39.006874084472656, -38.10598373413086, -37.2050895690918, -36.30419921875, -35.40330505371094, -34.502410888671875, -33.60152053833008, -32.700626373291016, -31.799734115600586, -30.898841857910156, -29.997947692871094, -29.097055435180664, -28.196163177490234, -27.295270919799805, -26.394378662109375, -25.493486404418945, -24.592594146728516, -23.691701889038086, -22.790809631347656, -21.889915466308594, -20.989023208618164, -20.088130950927734, -19.187238693237305, -18.286346435546875, -17.385454177856445, -16.484561920166016, -15.58366870880127, -14.682775497436523, -13.781883239746094, -12.880990982055664, -11.980098724365234, -11.079206466674805, -10.178314208984375, -9.277420997619629, -8.3765287399292, -7.475636005401611, -6.574743270874023, -5.673851013183594, -4.772958278656006, -3.872065544128418, -2.97117280960083, -2.0702803134918213, -1.1693878173828125, -0.2684950828552246, 0.6323976516723633, 1.533289909362793, 2.434182643890381, 3.3350753784179688, 4.235968112945557, 5.1368608474731445, 6.037753105163574, 6.938645839691162, 7.83953857421875, 8.74043083190918, 9.64132308959961, 10.542216300964355, 11.443108558654785, 12.344001770019531, 13.244894027709961, 14.14578628540039, 15.046679496765137, 15.947571754455566, 16.848464965820312, 17.749357223510742]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 6.0, 7.0, 14.0, 4.0, 14.0, 11.0, 15.0, 23.0, 18.0, 20.0, 23.0, 31.0, 33.0, 31.0, 44.0, 35.0, 39.0, 34.0, 47.0, 51.0, 43.0, 42.0, 37.0, 41.0, 47.0, 35.0, 26.0, 40.0, 30.0, 27.0, 20.0, 20.0, 18.0, 22.0, 14.0, 8.0, 8.0, 5.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-9.776090621948242, -9.494546890258789, -9.213003158569336, -8.931458473205566, -8.649914741516113, -8.36837100982666, -8.086827278137207, -7.805283546447754, -7.523739337921143, -7.2421956062316895, -6.960651397705078, -6.679107666015625, -6.397563934326172, -6.1160197257995605, -5.834475994110107, -5.552931785583496, -5.271388053894043, -4.98984432220459, -4.7083001136779785, -4.426756381988525, -4.145212173461914, -3.863668441772461, -3.582124710083008, -3.3005807399749756, -3.0190367698669434, -2.737492799758911, -2.455948829650879, -2.174405097961426, -1.8928611278533936, -1.6113171577453613, -1.3297733068466187, -1.048229455947876, -0.7666854858398438, -0.4851415753364563, -0.20359766483306885, 0.0779462456703186, 0.35949015617370605, 0.6410341262817383, 0.922577977180481, 1.2041218280792236, 1.4856657981872559, 1.767209768295288, 2.0487537384033203, 2.3302974700927734, 2.6118414402008057, 2.893385410308838, 3.174929141998291, 3.4564731121063232, 3.7380170822143555, 4.019560813903809, 4.30110502243042, 4.582648754119873, 4.864192962646484, 5.1457366943359375, 5.427280426025391, 5.708824157714844, 5.990368366241455, 6.271912097930908, 6.5534563064575195, 6.835000038146973, 7.116543769836426, 7.398087978363037, 7.67963171005249, 7.961175918579102, 8.242719650268555]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 6.0, 13.0, 15.0, 32.0, 45.0, 48.0, 89.0, 154.0, 238.0, 450.0, 797.0, 1456.0, 2866.0, 5613.0, 11546.0, 24004.0, 50536.0, 103317.0, 188922.0, 247354.0, 196393.0, 109881.0, 54203.0, 25473.0, 12509.0, 5952.0, 3065.0, 1583.0, 848.0, 420.0, 291.0, 152.0, 102.0, 53.0, 38.0, 24.0, 24.0, 14.0, 4.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.98681640625, -15.4267578125, -14.86669921875, -14.306640625, -13.74658203125, -13.1865234375, -12.62646484375, -12.06640625, -11.50634765625, -10.9462890625, -10.38623046875, -9.826171875, -9.26611328125, -8.7060546875, -8.14599609375, -7.5859375, -7.02587890625, -6.4658203125, -5.90576171875, -5.345703125, -4.78564453125, -4.2255859375, -3.66552734375, -3.10546875, -2.54541015625, -1.9853515625, -1.42529296875, -0.865234375, -0.30517578125, 0.2548828125, 0.81494140625, 1.375, 1.93505859375, 2.4951171875, 3.05517578125, 3.615234375, 4.17529296875, 4.7353515625, 5.29541015625, 5.85546875, 6.41552734375, 6.9755859375, 7.53564453125, 8.095703125, 8.65576171875, 9.2158203125, 9.77587890625, 10.3359375, 10.89599609375, 11.4560546875, 12.01611328125, 12.576171875, 13.13623046875, 13.6962890625, 14.25634765625, 14.81640625, 15.37646484375, 15.9365234375, 16.49658203125, 17.056640625, 17.61669921875, 18.1767578125, 18.73681640625, 19.296875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 5.0, 11.0, 11.0, 8.0, 10.0, 11.0, 20.0, 20.0, 30.0, 29.0, 38.0, 28.0, 43.0, 40.0, 42.0, 56.0, 37.0, 46.0, 52.0, 43.0, 51.0, 41.0, 47.0, 39.0, 32.0, 25.0, 35.0, 19.0, 19.0, 18.0, 20.0, 11.0, 16.0, 10.0, 1.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0], "bins": [-11.8515625, -11.52685546875, -11.2021484375, -10.87744140625, -10.552734375, -10.22802734375, -9.9033203125, -9.57861328125, -9.25390625, -8.92919921875, -8.6044921875, -8.27978515625, -7.955078125, -7.63037109375, -7.3056640625, -6.98095703125, -6.65625, -6.33154296875, -6.0068359375, -5.68212890625, -5.357421875, -5.03271484375, -4.7080078125, -4.38330078125, -4.05859375, -3.73388671875, -3.4091796875, -3.08447265625, -2.759765625, -2.43505859375, -2.1103515625, -1.78564453125, -1.4609375, -1.13623046875, -0.8115234375, -0.48681640625, -0.162109375, 0.16259765625, 0.4873046875, 0.81201171875, 1.13671875, 1.46142578125, 1.7861328125, 2.11083984375, 2.435546875, 2.76025390625, 3.0849609375, 3.40966796875, 3.734375, 4.05908203125, 4.3837890625, 4.70849609375, 5.033203125, 5.35791015625, 5.6826171875, 6.00732421875, 6.33203125, 6.65673828125, 6.9814453125, 7.30615234375, 7.630859375, 7.95556640625, 8.2802734375, 8.60498046875, 8.9296875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 18.0, 19.0, 29.0, 56.0, 55.0, 90.0, 140.0, 189.0, 327.0, 580.0, 1021.0, 1930.0, 3927.0, 8354.0, 18775.0, 44059.0, 104956.0, 219089.0, 288103.0, 197087.0, 91017.0, 37880.0, 16077.0, 7237.0, 3446.0, 1721.0, 924.0, 495.0, 351.0, 173.0, 126.0, 81.0, 54.0, 41.0, 35.0, 13.0, 17.0, 13.0, 3.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.40625, -20.702392578125, -19.99853515625, -19.294677734375, -18.5908203125, -17.886962890625, -17.18310546875, -16.479248046875, -15.775390625, -15.071533203125, -14.36767578125, -13.663818359375, -12.9599609375, -12.256103515625, -11.55224609375, -10.848388671875, -10.14453125, -9.440673828125, -8.73681640625, -8.032958984375, -7.3291015625, -6.625244140625, -5.92138671875, -5.217529296875, -4.513671875, -3.809814453125, -3.10595703125, -2.402099609375, -1.6982421875, -0.994384765625, -0.29052734375, 0.413330078125, 1.1171875, 1.821044921875, 2.52490234375, 3.228759765625, 3.9326171875, 4.636474609375, 5.34033203125, 6.044189453125, 6.748046875, 7.451904296875, 8.15576171875, 8.859619140625, 9.5634765625, 10.267333984375, 10.97119140625, 11.675048828125, 12.37890625, 13.082763671875, 13.78662109375, 14.490478515625, 15.1943359375, 15.898193359375, 16.60205078125, 17.305908203125, 18.009765625, 18.713623046875, 19.41748046875, 20.121337890625, 20.8251953125, 21.529052734375, 22.23291015625, 22.936767578125, 23.640625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 7.0, 8.0, 7.0, 7.0, 6.0, 7.0, 17.0, 9.0, 16.0, 13.0, 17.0, 20.0, 17.0, 25.0, 24.0, 28.0, 36.0, 31.0, 36.0, 36.0, 46.0, 45.0, 38.0, 38.0, 55.0, 40.0, 32.0, 38.0, 38.0, 37.0, 35.0, 31.0, 25.0, 29.0, 14.0, 8.0, 20.0, 11.0, 7.0, 12.0, 10.0, 10.0, 7.0, 8.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.23046875, -6.0467529296875, -5.863037109375, -5.6793212890625, -5.49560546875, -5.3118896484375, -5.128173828125, -4.9444580078125, -4.7607421875, -4.5770263671875, -4.393310546875, -4.2095947265625, -4.02587890625, -3.8421630859375, -3.658447265625, -3.4747314453125, -3.291015625, -3.1072998046875, -2.923583984375, -2.7398681640625, -2.55615234375, -2.3724365234375, -2.188720703125, -2.0050048828125, -1.8212890625, -1.6375732421875, -1.453857421875, -1.2701416015625, -1.08642578125, -0.9027099609375, -0.718994140625, -0.5352783203125, -0.3515625, -0.1678466796875, 0.015869140625, 0.1995849609375, 0.38330078125, 0.5670166015625, 0.750732421875, 0.9344482421875, 1.1181640625, 1.3018798828125, 1.485595703125, 1.6693115234375, 1.85302734375, 2.0367431640625, 2.220458984375, 2.4041748046875, 2.587890625, 2.7716064453125, 2.955322265625, 3.1390380859375, 3.32275390625, 3.5064697265625, 3.690185546875, 3.8739013671875, 4.0576171875, 4.2413330078125, 4.425048828125, 4.6087646484375, 4.79248046875, 4.9761962890625, 5.159912109375, 5.3436279296875, 5.52734375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 15.0, 19.0, 22.0, 38.0, 46.0, 53.0, 74.0, 102.0, 110.0, 168.0, 241.0, 283.0, 426.0, 623.0, 874.0, 1443.0, 2382.0, 4263.0, 8620.0, 20976.0, 64914.0, 225792.0, 429849.0, 194578.0, 55772.0, 18536.0, 7800.0, 3842.0, 2255.0, 1311.0, 946.0, 543.0, 443.0, 288.0, 222.0, 165.0, 127.0, 110.0, 58.0, 43.0, 39.0, 32.0, 28.0, 26.0, 9.0, 8.0, 9.0, 4.0, 6.0, 1.0, 0.0, 7.0, 1.0, 1.0], "bins": [-11.8671875, -11.5013427734375, -11.135498046875, -10.7696533203125, -10.40380859375, -10.0379638671875, -9.672119140625, -9.3062744140625, -8.9404296875, -8.5745849609375, -8.208740234375, -7.8428955078125, -7.47705078125, -7.1112060546875, -6.745361328125, -6.3795166015625, -6.013671875, -5.6478271484375, -5.281982421875, -4.9161376953125, -4.55029296875, -4.1844482421875, -3.818603515625, -3.4527587890625, -3.0869140625, -2.7210693359375, -2.355224609375, -1.9893798828125, -1.62353515625, -1.2576904296875, -0.891845703125, -0.5260009765625, -0.16015625, 0.2056884765625, 0.571533203125, 0.9373779296875, 1.30322265625, 1.6690673828125, 2.034912109375, 2.4007568359375, 2.7666015625, 3.1324462890625, 3.498291015625, 3.8641357421875, 4.22998046875, 4.5958251953125, 4.961669921875, 5.3275146484375, 5.693359375, 6.0592041015625, 6.425048828125, 6.7908935546875, 7.15673828125, 7.5225830078125, 7.888427734375, 8.2542724609375, 8.6201171875, 8.9859619140625, 9.351806640625, 9.7176513671875, 10.08349609375, 10.4493408203125, 10.815185546875, 11.1810302734375, 11.546875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 14.0, 8.0, 12.0, 22.0, 41.0, 68.0, 91.0, 165.0, 168.0, 149.0, 100.0, 52.0, 55.0, 21.0, 18.0, 7.0, 2.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014905929565429688, -0.00144977867603302, -0.0014089643955230713, -0.0013681501150131226, -0.0013273358345031738, -0.001286521553993225, -0.0012457072734832764, -0.0012048929929733276, -0.001164078712463379, -0.0011232644319534302, -0.0010824501514434814, -0.0010416358709335327, -0.001000821590423584, -0.0009600073099136353, -0.0009191930294036865, -0.0008783787488937378, -0.0008375644683837891, -0.0007967501878738403, -0.0007559359073638916, -0.0007151216268539429, -0.0006743073463439941, -0.0006334930658340454, -0.0005926787853240967, -0.000551864504814148, -0.0005110502243041992, -0.0004702359437942505, -0.00042942166328430176, -0.00038860738277435303, -0.0003477931022644043, -0.00030697882175445557, -0.00026616454124450684, -0.0002253502607345581, -0.00018453598022460938, -0.00014372169971466064, -0.00010290741920471191, -6.209313869476318e-05, -2.1278858184814453e-05, 1.9535422325134277e-05, 6.034970283508301e-05, 0.00010116398334503174, 0.00014197826385498047, 0.0001827925443649292, 0.00022360682487487793, 0.00026442110538482666, 0.0003052353858947754, 0.0003460496664047241, 0.00038686394691467285, 0.0004276782274246216, 0.0004684925079345703, 0.000509306788444519, 0.0005501210689544678, 0.0005909353494644165, 0.0006317496299743652, 0.000672563910484314, 0.0007133781909942627, 0.0007541924715042114, 0.0007950067520141602, 0.0008358210325241089, 0.0008766353130340576, 0.0009174495935440063, 0.0009582638740539551, 0.0009990781545639038, 0.0010398924350738525, 0.0010807067155838013, 0.00112152099609375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 16.0, 12.0, 22.0, 37.0, 46.0, 44.0, 89.0, 136.0, 180.0, 231.0, 418.0, 562.0, 821.0, 1368.0, 1978.0, 3287.0, 6058.0, 12177.0, 28387.0, 70832.0, 179841.0, 326344.0, 240420.0, 100873.0, 39283.0, 16283.0, 7705.0, 4146.0, 2325.0, 1562.0, 984.0, 641.0, 452.0, 299.0, 210.0, 122.0, 109.0, 72.0, 46.0, 33.0, 31.0, 18.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.83203125, -7.56817626953125, -7.3043212890625, -7.04046630859375, -6.776611328125, -6.51275634765625, -6.2489013671875, -5.98504638671875, -5.72119140625, -5.45733642578125, -5.1934814453125, -4.92962646484375, -4.665771484375, -4.40191650390625, -4.1380615234375, -3.87420654296875, -3.6103515625, -3.34649658203125, -3.0826416015625, -2.81878662109375, -2.554931640625, -2.29107666015625, -2.0272216796875, -1.76336669921875, -1.49951171875, -1.23565673828125, -0.9718017578125, -0.70794677734375, -0.444091796875, -0.18023681640625, 0.0836181640625, 0.34747314453125, 0.611328125, 0.87518310546875, 1.1390380859375, 1.40289306640625, 1.666748046875, 1.93060302734375, 2.1944580078125, 2.45831298828125, 2.72216796875, 2.98602294921875, 3.2498779296875, 3.51373291015625, 3.777587890625, 4.04144287109375, 4.3052978515625, 4.56915283203125, 4.8330078125, 5.09686279296875, 5.3607177734375, 5.62457275390625, 5.888427734375, 6.15228271484375, 6.4161376953125, 6.67999267578125, 6.94384765625, 7.20770263671875, 7.4715576171875, 7.73541259765625, 7.999267578125, 8.26312255859375, 8.5269775390625, 8.79083251953125, 9.0546875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 14.0, 20.0, 35.0, 46.0, 70.0, 69.0, 87.0, 111.0, 126.0, 104.0, 89.0, 61.0, 44.0, 26.0, 25.0, 20.0, 13.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.9906005859375, -2.891357421875, -2.7921142578125, -2.69287109375, -2.5936279296875, -2.494384765625, -2.3951416015625, -2.2958984375, -2.1966552734375, -2.097412109375, -1.9981689453125, -1.89892578125, -1.7996826171875, -1.700439453125, -1.6011962890625, -1.501953125, -1.4027099609375, -1.303466796875, -1.2042236328125, -1.10498046875, -1.0057373046875, -0.906494140625, -0.8072509765625, -0.7080078125, -0.6087646484375, -0.509521484375, -0.4102783203125, -0.31103515625, -0.2117919921875, -0.112548828125, -0.0133056640625, 0.0859375, 0.1851806640625, 0.284423828125, 0.3836669921875, 0.48291015625, 0.5821533203125, 0.681396484375, 0.7806396484375, 0.8798828125, 0.9791259765625, 1.078369140625, 1.1776123046875, 1.27685546875, 1.3760986328125, 1.475341796875, 1.5745849609375, 1.673828125, 1.7730712890625, 1.872314453125, 1.9715576171875, 2.07080078125, 2.1700439453125, 2.269287109375, 2.3685302734375, 2.4677734375, 2.5670166015625, 2.666259765625, 2.7655029296875, 2.86474609375, 2.9639892578125, 3.063232421875, 3.1624755859375, 3.26171875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 9.0, 11.0, 12.0, 24.0, 48.0, 50.0, 68.0, 77.0, 133.0, 125.0, 111.0, 71.0, 85.0, 41.0, 33.0, 21.0, 20.0, 16.0, 10.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-36.806739807128906, -35.895565032958984, -34.98439025878906, -34.07321548461914, -33.16204071044922, -32.2508659362793, -31.339691162109375, -30.428516387939453, -29.51734161376953, -28.60616683959961, -27.694992065429688, -26.783817291259766, -25.872642517089844, -24.961467742919922, -24.05029296875, -23.139118194580078, -22.227943420410156, -21.316768646240234, -20.405593872070312, -19.49441909790039, -18.58324432373047, -17.672069549560547, -16.760894775390625, -15.849720001220703, -14.938545227050781, -14.02737045288086, -13.116195678710938, -12.205020904541016, -11.293846130371094, -10.382671356201172, -9.47149658203125, -8.560321807861328, -7.649145126342773, -6.737970352172852, -5.82679557800293, -4.915620803833008, -4.004446029663086, -3.093271255493164, -2.182096481323242, -1.2709217071533203, -0.35974693298339844, 0.5514278411865234, 1.4626026153564453, 2.373777389526367, 3.284952163696289, 4.196126937866211, 5.107301712036133, 6.018476486206055, 6.929651260375977, 7.840826034545898, 8.75200080871582, 9.663175582885742, 10.574350357055664, 11.485525131225586, 12.396699905395508, 13.30787467956543, 14.219049453735352, 15.130224227905273, 16.041399002075195, 16.952573776245117, 17.86374855041504, 18.77492332458496, 19.686098098754883, 20.597272872924805, 21.508447647094727]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 3.0, 11.0, 11.0, 6.0, 8.0, 9.0, 11.0, 11.0, 17.0, 10.0, 23.0, 21.0, 25.0, 25.0, 34.0, 20.0, 31.0, 36.0, 34.0, 29.0, 27.0, 37.0, 39.0, 33.0, 31.0, 35.0, 42.0, 28.0, 30.0, 39.0, 32.0, 22.0, 26.0, 23.0, 20.0, 18.0, 16.0, 12.0, 13.0, 15.0, 13.0, 16.0, 15.0, 4.0, 8.0, 5.0, 4.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0], "bins": [-8.060611724853516, -7.823540687561035, -7.586470127105713, -7.349399566650391, -7.11232852935791, -6.87525749206543, -6.638186931610107, -6.401116371154785, -6.164045333862305, -5.926974296569824, -5.689903736114502, -5.45283317565918, -5.215762138366699, -4.978691101074219, -4.7416205406188965, -4.504549980163574, -4.267478942871094, -4.030407905578613, -3.793337345123291, -3.5562665462493896, -3.3191957473754883, -3.082124948501587, -2.8450541496276855, -2.607983350753784, -2.370912551879883, -2.1338417530059814, -1.89677095413208, -1.6597001552581787, -1.4226293563842773, -1.185558557510376, -0.9484877586364746, -0.7114169597625732, -0.47434568405151367, -0.2372748851776123, -0.0002040863037109375, 0.23686671257019043, 0.4739375114440918, 0.7110083103179932, 0.9480791091918945, 1.185149908065796, 1.4222207069396973, 1.6592915058135986, 1.8963623046875, 2.1334331035614014, 2.3705039024353027, 2.607574701309204, 2.8446455001831055, 3.081716299057007, 3.318787097930908, 3.5558578968048096, 3.792928695678711, 4.029999732971191, 4.267070293426514, 4.504140853881836, 4.741211891174316, 4.978282928466797, 5.215353488922119, 5.452424049377441, 5.689495086669922, 5.926566123962402, 6.163636684417725, 6.400707244873047, 6.637778282165527, 6.874849319458008, 7.11191987991333]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 17.0, 8.0, 17.0, 22.0, 38.0, 49.0, 64.0, 83.0, 144.0, 235.0, 316.0, 461.0, 719.0, 1163.0, 1839.0, 3074.0, 5340.0, 10034.0, 19943.0, 41666.0, 94644.0, 243933.0, 736718.0, 1590568.0, 924550.0, 305799.0, 114956.0, 48979.0, 22951.0, 11226.0, 5993.0, 3274.0, 1979.0, 1204.0, 790.0, 505.0, 304.0, 186.0, 137.0, 101.0, 82.0, 48.0, 36.0, 30.0, 10.0, 10.0, 8.0, 10.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.96875, -19.316162109375, -18.66357421875, -18.010986328125, -17.3583984375, -16.705810546875, -16.05322265625, -15.400634765625, -14.748046875, -14.095458984375, -13.44287109375, -12.790283203125, -12.1376953125, -11.485107421875, -10.83251953125, -10.179931640625, -9.52734375, -8.874755859375, -8.22216796875, -7.569580078125, -6.9169921875, -6.264404296875, -5.61181640625, -4.959228515625, -4.306640625, -3.654052734375, -3.00146484375, -2.348876953125, -1.6962890625, -1.043701171875, -0.39111328125, 0.261474609375, 0.9140625, 1.566650390625, 2.21923828125, 2.871826171875, 3.5244140625, 4.177001953125, 4.82958984375, 5.482177734375, 6.134765625, 6.787353515625, 7.43994140625, 8.092529296875, 8.7451171875, 9.397705078125, 10.05029296875, 10.702880859375, 11.35546875, 12.008056640625, 12.66064453125, 13.313232421875, 13.9658203125, 14.618408203125, 15.27099609375, 15.923583984375, 16.576171875, 17.228759765625, 17.88134765625, 18.533935546875, 19.1865234375, 19.839111328125, 20.49169921875, 21.144287109375, 21.796875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 7.0, 7.0, 11.0, 10.0, 7.0, 13.0, 18.0, 19.0, 18.0, 35.0, 33.0, 32.0, 27.0, 28.0, 31.0, 40.0, 44.0, 35.0, 44.0, 31.0, 32.0, 46.0, 42.0, 40.0, 38.0, 46.0, 34.0, 31.0, 18.0, 17.0, 20.0, 26.0, 19.0, 20.0, 14.0, 10.0, 16.0, 7.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.09765625, -6.884521484375, -6.67138671875, -6.458251953125, -6.2451171875, -6.031982421875, -5.81884765625, -5.605712890625, -5.392578125, -5.179443359375, -4.96630859375, -4.753173828125, -4.5400390625, -4.326904296875, -4.11376953125, -3.900634765625, -3.6875, -3.474365234375, -3.26123046875, -3.048095703125, -2.8349609375, -2.621826171875, -2.40869140625, -2.195556640625, -1.982421875, -1.769287109375, -1.55615234375, -1.343017578125, -1.1298828125, -0.916748046875, -0.70361328125, -0.490478515625, -0.27734375, -0.064208984375, 0.14892578125, 0.362060546875, 0.5751953125, 0.788330078125, 1.00146484375, 1.214599609375, 1.427734375, 1.640869140625, 1.85400390625, 2.067138671875, 2.2802734375, 2.493408203125, 2.70654296875, 2.919677734375, 3.1328125, 3.345947265625, 3.55908203125, 3.772216796875, 3.9853515625, 4.198486328125, 4.41162109375, 4.624755859375, 4.837890625, 5.051025390625, 5.26416015625, 5.477294921875, 5.6904296875, 5.903564453125, 6.11669921875, 6.329833984375, 6.54296875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 15.0, 16.0, 25.0, 47.0, 63.0, 95.0, 156.0, 249.0, 363.0, 620.0, 890.0, 1445.0, 2373.0, 4037.0, 7026.0, 12494.0, 22767.0, 44260.0, 89876.0, 191893.0, 433692.0, 958447.0, 1227135.0, 649955.0, 283775.0, 128875.0, 62010.0, 31724.0, 16803.0, 9575.0, 5356.0, 3155.0, 1914.0, 1174.0, 736.0, 428.0, 278.0, 179.0, 118.0, 81.0, 64.0, 36.0, 31.0, 6.0, 8.0, 8.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -15.930908203125, -15.34619140625, -14.761474609375, -14.1767578125, -13.592041015625, -13.00732421875, -12.422607421875, -11.837890625, -11.253173828125, -10.66845703125, -10.083740234375, -9.4990234375, -8.914306640625, -8.32958984375, -7.744873046875, -7.16015625, -6.575439453125, -5.99072265625, -5.406005859375, -4.8212890625, -4.236572265625, -3.65185546875, -3.067138671875, -2.482421875, -1.897705078125, -1.31298828125, -0.728271484375, -0.1435546875, 0.441162109375, 1.02587890625, 1.610595703125, 2.1953125, 2.780029296875, 3.36474609375, 3.949462890625, 4.5341796875, 5.118896484375, 5.70361328125, 6.288330078125, 6.873046875, 7.457763671875, 8.04248046875, 8.627197265625, 9.2119140625, 9.796630859375, 10.38134765625, 10.966064453125, 11.55078125, 12.135498046875, 12.72021484375, 13.304931640625, 13.8896484375, 14.474365234375, 15.05908203125, 15.643798828125, 16.228515625, 16.813232421875, 17.39794921875, 17.982666015625, 18.5673828125, 19.152099609375, 19.73681640625, 20.321533203125, 20.90625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 7.0, 7.0, 24.0, 27.0, 34.0, 54.0, 50.0, 72.0, 82.0, 117.0, 145.0, 172.0, 261.0, 267.0, 313.0, 303.0, 349.0, 321.0, 280.0, 272.0, 212.0, 164.0, 116.0, 93.0, 87.0, 55.0, 46.0, 28.0, 30.0, 28.0, 11.0, 9.0, 11.0, 6.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.88671875, -5.7188720703125, -5.551025390625, -5.3831787109375, -5.21533203125, -5.0474853515625, -4.879638671875, -4.7117919921875, -4.5439453125, -4.3760986328125, -4.208251953125, -4.0404052734375, -3.87255859375, -3.7047119140625, -3.536865234375, -3.3690185546875, -3.201171875, -3.0333251953125, -2.865478515625, -2.6976318359375, -2.52978515625, -2.3619384765625, -2.194091796875, -2.0262451171875, -1.8583984375, -1.6905517578125, -1.522705078125, -1.3548583984375, -1.18701171875, -1.0191650390625, -0.851318359375, -0.6834716796875, -0.515625, -0.3477783203125, -0.179931640625, -0.0120849609375, 0.15576171875, 0.3236083984375, 0.491455078125, 0.6593017578125, 0.8271484375, 0.9949951171875, 1.162841796875, 1.3306884765625, 1.49853515625, 1.6663818359375, 1.834228515625, 2.0020751953125, 2.169921875, 2.3377685546875, 2.505615234375, 2.6734619140625, 2.84130859375, 3.0091552734375, 3.177001953125, 3.3448486328125, 3.5126953125, 3.6805419921875, 3.848388671875, 4.0162353515625, 4.18408203125, 4.3519287109375, 4.519775390625, 4.6876220703125, 4.85546875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 8.0, 18.0, 16.0, 25.0, 36.0, 60.0, 80.0, 83.0, 97.0, 98.0, 96.0, 101.0, 72.0, 49.0, 34.0, 29.0, 16.0, 19.0, 5.0, 12.0, 9.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.563068389892578, -30.723012924194336, -29.882959365844727, -29.042903900146484, -28.202850341796875, -27.362794876098633, -26.52273941040039, -25.68268585205078, -24.842632293701172, -24.00257682800293, -23.16252326965332, -22.322467803955078, -21.48241424560547, -20.642358779907227, -19.802303314208984, -18.962249755859375, -18.122194290161133, -17.28213882446289, -16.44208526611328, -15.602029800415039, -14.76197624206543, -13.921920776367188, -13.081866264343262, -12.241811752319336, -11.40175724029541, -10.561702728271484, -9.721648216247559, -8.881593704223633, -8.04153823852539, -7.201484203338623, -6.361429214477539, -5.521374702453613, -4.6813201904296875, -3.8412656784057617, -3.001210927963257, -2.161156177520752, -1.3211016654968262, -0.4810471534729004, 0.3590078353881836, 1.1990623474121094, 2.039116859436035, 2.879171371459961, 3.719226121902466, 4.559280872344971, 5.3993353843688965, 6.239389896392822, 7.079444885253906, 7.919499397277832, 8.759553909301758, 9.599608421325684, 10.43966293334961, 11.279718399047852, 12.119771957397461, 12.959827423095703, 13.799881935119629, 14.639936447143555, 15.47999095916748, 16.320045471191406, 17.16010093688965, 18.000154495239258, 18.8402099609375, 19.68026351928711, 20.52031898498535, 21.360374450683594, 22.200428009033203]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 8.0, 3.0, 4.0, 16.0, 6.0, 10.0, 12.0, 17.0, 16.0, 17.0, 25.0, 19.0, 24.0, 33.0, 37.0, 38.0, 25.0, 34.0, 48.0, 37.0, 36.0, 39.0, 22.0, 25.0, 30.0, 40.0, 33.0, 33.0, 32.0, 33.0, 28.0, 34.0, 30.0, 14.0, 22.0, 23.0, 19.0, 26.0, 8.0, 12.0, 5.0, 9.0, 3.0, 5.0, 2.0, 7.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.10766315460205, -7.854564189910889, -7.601465225219727, -7.348365783691406, -7.095266819000244, -6.842167854309082, -6.589068412780762, -6.3359694480896, -6.0828704833984375, -5.829771518707275, -5.576672554016113, -5.323573112487793, -5.070474147796631, -4.817375183105469, -4.564275741577148, -4.311176776885986, -4.058077812194824, -3.804978847503662, -3.551879644393921, -3.2987804412841797, -3.0456814765930176, -2.7925825119018555, -2.5394833087921143, -2.286384105682373, -2.033285140991211, -1.7801860570907593, -1.5270869731903076, -1.273987889289856, -1.0208888053894043, -0.7677897214889526, -0.514690637588501, -0.2615915536880493, -0.008492469787597656, 0.244606614112854, 0.49770569801330566, 0.7508047819137573, 1.003903865814209, 1.2570029497146606, 1.5101020336151123, 1.763201117515564, 2.0163002014160156, 2.2693991661071777, 2.522498369216919, 2.77559757232666, 3.0286965370178223, 3.2817955017089844, 3.5348947048187256, 3.787993907928467, 4.041092872619629, 4.294191837310791, 4.547290802001953, 4.800390243530273, 5.0534892082214355, 5.306588172912598, 5.559687614440918, 5.81278657913208, 6.065885543823242, 6.318984508514404, 6.572083473205566, 6.825182914733887, 7.078281879425049, 7.331380844116211, 7.584480285644531, 7.837579250335693, 8.090678215026855]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 21.0, 26.0, 51.0, 62.0, 103.0, 141.0, 182.0, 295.0, 486.0, 781.0, 1134.0, 1729.0, 2781.0, 4426.0, 7093.0, 11553.0, 19474.0, 32856.0, 55720.0, 92138.0, 141781.0, 180612.0, 171667.0, 126202.0, 79115.0, 47143.0, 27895.0, 16493.0, 9803.0, 6201.0, 3749.0, 2390.0, 1577.0, 979.0, 645.0, 425.0, 238.0, 174.0, 151.0, 83.0, 46.0, 46.0, 25.0, 18.0, 10.0, 5.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.91015625, -5.72454833984375, -5.5389404296875, -5.35333251953125, -5.167724609375, -4.98211669921875, -4.7965087890625, -4.61090087890625, -4.42529296875, -4.23968505859375, -4.0540771484375, -3.86846923828125, -3.682861328125, -3.49725341796875, -3.3116455078125, -3.12603759765625, -2.9404296875, -2.75482177734375, -2.5692138671875, -2.38360595703125, -2.197998046875, -2.01239013671875, -1.8267822265625, -1.64117431640625, -1.45556640625, -1.26995849609375, -1.0843505859375, -0.89874267578125, -0.713134765625, -0.52752685546875, -0.3419189453125, -0.15631103515625, 0.029296875, 0.21490478515625, 0.4005126953125, 0.58612060546875, 0.771728515625, 0.95733642578125, 1.1429443359375, 1.32855224609375, 1.51416015625, 1.69976806640625, 1.8853759765625, 2.07098388671875, 2.256591796875, 2.44219970703125, 2.6278076171875, 2.81341552734375, 2.9990234375, 3.18463134765625, 3.3702392578125, 3.55584716796875, 3.741455078125, 3.92706298828125, 4.1126708984375, 4.29827880859375, 4.48388671875, 4.66949462890625, 4.8551025390625, 5.04071044921875, 5.226318359375, 5.41192626953125, 5.5975341796875, 5.78314208984375, 5.96875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 8.0, 9.0, 6.0, 10.0, 11.0, 8.0, 28.0, 14.0, 24.0, 26.0, 22.0, 40.0, 38.0, 38.0, 44.0, 45.0, 43.0, 31.0, 26.0, 36.0, 41.0, 37.0, 38.0, 42.0, 34.0, 36.0, 34.0, 21.0, 27.0, 25.0, 23.0, 29.0, 17.0, 20.0, 16.0, 8.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.046875, -9.7335205078125, -9.420166015625, -9.1068115234375, -8.79345703125, -8.4801025390625, -8.166748046875, -7.8533935546875, -7.5400390625, -7.2266845703125, -6.913330078125, -6.5999755859375, -6.28662109375, -5.9732666015625, -5.659912109375, -5.3465576171875, -5.033203125, -4.7198486328125, -4.406494140625, -4.0931396484375, -3.77978515625, -3.4664306640625, -3.153076171875, -2.8397216796875, -2.5263671875, -2.2130126953125, -1.899658203125, -1.5863037109375, -1.27294921875, -0.9595947265625, -0.646240234375, -0.3328857421875, -0.01953125, 0.2938232421875, 0.607177734375, 0.9205322265625, 1.23388671875, 1.5472412109375, 1.860595703125, 2.1739501953125, 2.4873046875, 2.8006591796875, 3.114013671875, 3.4273681640625, 3.74072265625, 4.0540771484375, 4.367431640625, 4.6807861328125, 4.994140625, 5.3074951171875, 5.620849609375, 5.9342041015625, 6.24755859375, 6.5609130859375, 6.874267578125, 7.1876220703125, 7.5009765625, 7.8143310546875, 8.127685546875, 8.4410400390625, 8.75439453125, 9.0677490234375, 9.381103515625, 9.6944580078125, 10.0078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 11.0, 20.0, 27.0, 36.0, 47.0, 85.0, 107.0, 194.0, 266.0, 464.0, 722.0, 1240.0, 2097.0, 3438.0, 6419.0, 12125.0, 23300.0, 47875.0, 101407.0, 203506.0, 278494.0, 186119.0, 91192.0, 43290.0, 21175.0, 10827.0, 5720.0, 3352.0, 1948.0, 1162.0, 702.0, 403.0, 283.0, 181.0, 123.0, 52.0, 40.0, 23.0, 22.0, 18.0, 11.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.875, -9.560791015625, -9.24658203125, -8.932373046875, -8.6181640625, -8.303955078125, -7.98974609375, -7.675537109375, -7.361328125, -7.047119140625, -6.73291015625, -6.418701171875, -6.1044921875, -5.790283203125, -5.47607421875, -5.161865234375, -4.84765625, -4.533447265625, -4.21923828125, -3.905029296875, -3.5908203125, -3.276611328125, -2.96240234375, -2.648193359375, -2.333984375, -2.019775390625, -1.70556640625, -1.391357421875, -1.0771484375, -0.762939453125, -0.44873046875, -0.134521484375, 0.1796875, 0.493896484375, 0.80810546875, 1.122314453125, 1.4365234375, 1.750732421875, 2.06494140625, 2.379150390625, 2.693359375, 3.007568359375, 3.32177734375, 3.635986328125, 3.9501953125, 4.264404296875, 4.57861328125, 4.892822265625, 5.20703125, 5.521240234375, 5.83544921875, 6.149658203125, 6.4638671875, 6.778076171875, 7.09228515625, 7.406494140625, 7.720703125, 8.034912109375, 8.34912109375, 8.663330078125, 8.9775390625, 9.291748046875, 9.60595703125, 9.920166015625, 10.234375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 12.0, 9.0, 14.0, 13.0, 14.0, 16.0, 14.0, 23.0, 29.0, 29.0, 41.0, 38.0, 31.0, 37.0, 56.0, 39.0, 49.0, 41.0, 33.0, 46.0, 43.0, 36.0, 46.0, 28.0, 27.0, 39.0, 27.0, 20.0, 13.0, 18.0, 11.0, 17.0, 11.0, 15.0, 8.0, 8.0, 10.0, 5.0, 1.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.974853515625, -5.78955078125, -5.604248046875, -5.4189453125, -5.233642578125, -5.04833984375, -4.863037109375, -4.677734375, -4.492431640625, -4.30712890625, -4.121826171875, -3.9365234375, -3.751220703125, -3.56591796875, -3.380615234375, -3.1953125, -3.010009765625, -2.82470703125, -2.639404296875, -2.4541015625, -2.268798828125, -2.08349609375, -1.898193359375, -1.712890625, -1.527587890625, -1.34228515625, -1.156982421875, -0.9716796875, -0.786376953125, -0.60107421875, -0.415771484375, -0.23046875, -0.045166015625, 0.14013671875, 0.325439453125, 0.5107421875, 0.696044921875, 0.88134765625, 1.066650390625, 1.251953125, 1.437255859375, 1.62255859375, 1.807861328125, 1.9931640625, 2.178466796875, 2.36376953125, 2.549072265625, 2.734375, 2.919677734375, 3.10498046875, 3.290283203125, 3.4755859375, 3.660888671875, 3.84619140625, 4.031494140625, 4.216796875, 4.402099609375, 4.58740234375, 4.772705078125, 4.9580078125, 5.143310546875, 5.32861328125, 5.513916015625, 5.69921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 9.0, 19.0, 23.0, 29.0, 42.0, 74.0, 92.0, 133.0, 213.0, 321.0, 412.0, 631.0, 961.0, 1430.0, 2341.0, 3672.0, 6003.0, 10150.0, 17903.0, 32789.0, 61919.0, 119947.0, 220980.0, 249909.0, 148595.0, 77352.0, 39928.0, 21342.0, 12052.0, 7231.0, 4227.0, 2669.0, 1773.0, 1096.0, 716.0, 468.0, 330.0, 235.0, 156.0, 107.0, 75.0, 59.0, 45.0, 30.0, 18.0, 18.0, 6.0, 9.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -3.0126953125, -2.916015625, -2.8193359375, -2.72265625, -2.6259765625, -2.529296875, -2.4326171875, -2.3359375, -2.2392578125, -2.142578125, -2.0458984375, -1.94921875, -1.8525390625, -1.755859375, -1.6591796875, -1.5625, -1.4658203125, -1.369140625, -1.2724609375, -1.17578125, -1.0791015625, -0.982421875, -0.8857421875, -0.7890625, -0.6923828125, -0.595703125, -0.4990234375, -0.40234375, -0.3056640625, -0.208984375, -0.1123046875, -0.015625, 0.0810546875, 0.177734375, 0.2744140625, 0.37109375, 0.4677734375, 0.564453125, 0.6611328125, 0.7578125, 0.8544921875, 0.951171875, 1.0478515625, 1.14453125, 1.2412109375, 1.337890625, 1.4345703125, 1.53125, 1.6279296875, 1.724609375, 1.8212890625, 1.91796875, 2.0146484375, 2.111328125, 2.2080078125, 2.3046875, 2.4013671875, 2.498046875, 2.5947265625, 2.69140625, 2.7880859375, 2.884765625, 2.9814453125, 3.078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0, 8.0, 9.0, 10.0, 18.0, 22.0, 33.0, 32.0, 50.0, 69.0, 60.0, 69.0, 73.0, 75.0, 64.0, 77.0, 65.0, 61.0, 38.0, 45.0, 29.0, 23.0, 18.0, 10.0, 11.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000278472900390625, -0.0002697482705116272, -0.0002610236406326294, -0.0002522990107536316, -0.0002435743808746338, -0.00023484975099563599, -0.00022612512111663818, -0.00021740049123764038, -0.00020867586135864258, -0.00019995123147964478, -0.00019122660160064697, -0.00018250197172164917, -0.00017377734184265137, -0.00016505271196365356, -0.00015632808208465576, -0.00014760345220565796, -0.00013887882232666016, -0.00013015419244766235, -0.00012142956256866455, -0.00011270493268966675, -0.00010398030281066895, -9.525567293167114e-05, -8.653104305267334e-05, -7.780641317367554e-05, -6.908178329467773e-05, -6.035715341567993e-05, -5.163252353668213e-05, -4.2907893657684326e-05, -3.4183263778686523e-05, -2.545863389968872e-05, -1.6734004020690918e-05, -8.009374141693115e-06, 7.152557373046875e-07, 9.43988561630249e-06, 1.8164515495300293e-05, 2.6889145374298096e-05, 3.56137752532959e-05, 4.43384051322937e-05, 5.3063035011291504e-05, 6.17876648902893e-05, 7.051229476928711e-05, 7.923692464828491e-05, 8.796155452728271e-05, 9.668618440628052e-05, 0.00010541081428527832, 0.00011413544416427612, 0.00012286007404327393, 0.00013158470392227173, 0.00014030933380126953, 0.00014903396368026733, 0.00015775859355926514, 0.00016648322343826294, 0.00017520785331726074, 0.00018393248319625854, 0.00019265711307525635, 0.00020138174295425415, 0.00021010637283325195, 0.00021883100271224976, 0.00022755563259124756, 0.00023628026247024536, 0.00024500489234924316, 0.00025372952222824097, 0.00026245415210723877, 0.00027117878198623657, 0.0002799034118652344]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 8.0, 5.0, 14.0, 21.0, 23.0, 30.0, 47.0, 57.0, 104.0, 126.0, 216.0, 307.0, 492.0, 785.0, 1245.0, 2107.0, 3465.0, 5825.0, 10613.0, 19238.0, 36080.0, 71083.0, 134953.0, 216855.0, 226758.0, 148628.0, 79693.0, 40688.0, 21390.0, 11546.0, 6403.0, 3732.0, 2300.0, 1314.0, 806.0, 542.0, 338.0, 268.0, 150.0, 90.0, 56.0, 48.0, 42.0, 23.0, 15.0, 15.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.73828125, -2.63330078125, -2.5283203125, -2.42333984375, -2.318359375, -2.21337890625, -2.1083984375, -2.00341796875, -1.8984375, -1.79345703125, -1.6884765625, -1.58349609375, -1.478515625, -1.37353515625, -1.2685546875, -1.16357421875, -1.05859375, -0.95361328125, -0.8486328125, -0.74365234375, -0.638671875, -0.53369140625, -0.4287109375, -0.32373046875, -0.21875, -0.11376953125, -0.0087890625, 0.09619140625, 0.201171875, 0.30615234375, 0.4111328125, 0.51611328125, 0.62109375, 0.72607421875, 0.8310546875, 0.93603515625, 1.041015625, 1.14599609375, 1.2509765625, 1.35595703125, 1.4609375, 1.56591796875, 1.6708984375, 1.77587890625, 1.880859375, 1.98583984375, 2.0908203125, 2.19580078125, 2.30078125, 2.40576171875, 2.5107421875, 2.61572265625, 2.720703125, 2.82568359375, 2.9306640625, 3.03564453125, 3.140625, 3.24560546875, 3.3505859375, 3.45556640625, 3.560546875, 3.66552734375, 3.7705078125, 3.87548828125, 3.98046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 6.0, 9.0, 11.0, 18.0, 14.0, 27.0, 30.0, 27.0, 31.0, 38.0, 49.0, 49.0, 68.0, 69.0, 53.0, 50.0, 67.0, 60.0, 38.0, 48.0, 39.0, 35.0, 28.0, 30.0, 25.0, 15.0, 10.0, 13.0, 14.0, 8.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86572265625, -0.8377761840820312, -0.8098297119140625, -0.7818832397460938, -0.753936767578125, -0.7259902954101562, -0.6980438232421875, -0.6700973510742188, -0.64215087890625, -0.6142044067382812, -0.5862579345703125, -0.5583114624023438, -0.530364990234375, -0.5024185180664062, -0.4744720458984375, -0.44652557373046875, -0.4185791015625, -0.39063262939453125, -0.3626861572265625, -0.33473968505859375, -0.306793212890625, -0.27884674072265625, -0.2509002685546875, -0.22295379638671875, -0.19500732421875, -0.16706085205078125, -0.1391143798828125, -0.11116790771484375, -0.083221435546875, -0.05527496337890625, -0.0273284912109375, 0.00061798095703125, 0.028564453125, 0.05651092529296875, 0.0844573974609375, 0.11240386962890625, 0.140350341796875, 0.16829681396484375, 0.1962432861328125, 0.22418975830078125, 0.25213623046875, 0.28008270263671875, 0.3080291748046875, 0.33597564697265625, 0.363922119140625, 0.39186859130859375, 0.4198150634765625, 0.44776153564453125, 0.4757080078125, 0.5036544799804688, 0.5316009521484375, 0.5595474243164062, 0.587493896484375, 0.6154403686523438, 0.6433868408203125, 0.6713333129882812, 0.69927978515625, 0.7272262573242188, 0.7551727294921875, 0.7831192016601562, 0.811065673828125, 0.8390121459960938, 0.8669586181640625, 0.8949050903320312, 0.9228515625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 17.0, 15.0, 27.0, 28.0, 60.0, 88.0, 67.0, 104.0, 84.0, 109.0, 94.0, 89.0, 45.0, 32.0, 26.0, 24.0, 15.0, 11.0, 11.0, 12.0, 1.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.42422866821289, -30.589895248413086, -29.75556182861328, -28.92123031616211, -28.086896896362305, -27.2525634765625, -26.418231964111328, -25.583898544311523, -24.74956512451172, -23.915231704711914, -23.08089828491211, -22.246566772460938, -21.412233352661133, -20.577899932861328, -19.743568420410156, -18.90923500061035, -18.074901580810547, -17.240568161010742, -16.406234741210938, -15.571903228759766, -14.737569808959961, -13.903236389160156, -13.068903923034668, -12.23457145690918, -11.400238037109375, -10.56590461730957, -9.731572151184082, -8.897239685058594, -8.062906265258789, -7.228573322296143, -6.394240379333496, -5.55990743637085, -4.72557258605957, -3.891239643096924, -3.0569067001342773, -2.222573757171631, -1.3882408142089844, -0.5539078712463379, 0.2804250717163086, 1.114758014678955, 1.9490909576416016, 2.783423900604248, 3.6177568435668945, 4.452089786529541, 5.2864227294921875, 6.120755672454834, 6.9550886154174805, 7.789421558380127, 8.623754501342773, 9.458087921142578, 10.292420387268066, 11.126752853393555, 11.96108627319336, 12.795419692993164, 13.629752159118652, 14.46408462524414, 15.298418045043945, 16.13275146484375, 16.967082977294922, 17.801416397094727, 18.63574981689453, 19.470083236694336, 20.30441665649414, 21.138748168945312, 21.973081588745117]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 3.0, 10.0, 13.0, 4.0, 12.0, 7.0, 19.0, 14.0, 22.0, 23.0, 19.0, 23.0, 28.0, 36.0, 37.0, 29.0, 34.0, 44.0, 34.0, 38.0, 38.0, 24.0, 32.0, 27.0, 35.0, 28.0, 35.0, 35.0, 39.0, 25.0, 21.0, 36.0, 26.0, 17.0, 23.0, 20.0, 20.0, 15.0, 9.0, 9.0, 10.0, 1.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.997335910797119, -7.750179767608643, -7.503023147583008, -7.255867004394531, -7.008710861206055, -6.761554718017578, -6.514398097991943, -6.267241954803467, -6.020085334777832, -5.7729291915893555, -5.525772571563721, -5.278616428375244, -5.031460285186768, -4.784303665161133, -4.537147521972656, -4.28999137878418, -4.042835235595703, -3.7956788539886475, -3.548522710800171, -3.3013663291931152, -3.0542101860046387, -2.807053804397583, -2.5598974227905273, -2.312741279602051, -2.065584897994995, -1.818428635597229, -1.571272373199463, -1.3241159915924072, -1.0769597291946411, -0.829803466796875, -0.5826470851898193, -0.3354908227920532, -0.08833456039428711, 0.1588217318058014, 0.4059780240058899, 0.6531343460083008, 0.9002906084060669, 1.147446870803833, 1.3946032524108887, 1.6417595148086548, 1.888915777206421, 2.1360721588134766, 2.383228302001953, 2.630384683609009, 2.8775410652160645, 3.124697208404541, 3.3718535900115967, 3.6190099716186523, 3.866166114807129, 4.1133222579956055, 4.36047887802124, 4.607635021209717, 4.854791164398193, 5.101947784423828, 5.349103927612305, 5.596260070800781, 5.843416213989258, 6.090572357177734, 6.337728977203369, 6.584885120391846, 6.832041263580322, 7.079197883605957, 7.326354026794434, 7.57351016998291, 7.820666790008545]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 17.0, 19.0, 26.0, 33.0, 55.0, 76.0, 111.0, 206.0, 324.0, 469.0, 701.0, 1165.0, 1713.0, 2808.0, 4503.0, 7167.0, 11349.0, 17982.0, 28399.0, 44252.0, 68793.0, 100597.0, 133880.0, 152438.0, 142701.0, 110873.0, 77604.0, 51172.0, 32874.0, 20778.0, 12954.0, 8541.0, 5189.0, 3104.0, 2076.0, 1320.0, 778.0, 524.0, 349.0, 225.0, 137.0, 102.0, 45.0, 42.0, 19.0, 19.0, 18.0, 15.0, 6.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.625, -11.26904296875, -10.9130859375, -10.55712890625, -10.201171875, -9.84521484375, -9.4892578125, -9.13330078125, -8.77734375, -8.42138671875, -8.0654296875, -7.70947265625, -7.353515625, -6.99755859375, -6.6416015625, -6.28564453125, -5.9296875, -5.57373046875, -5.2177734375, -4.86181640625, -4.505859375, -4.14990234375, -3.7939453125, -3.43798828125, -3.08203125, -2.72607421875, -2.3701171875, -2.01416015625, -1.658203125, -1.30224609375, -0.9462890625, -0.59033203125, -0.234375, 0.12158203125, 0.4775390625, 0.83349609375, 1.189453125, 1.54541015625, 1.9013671875, 2.25732421875, 2.61328125, 2.96923828125, 3.3251953125, 3.68115234375, 4.037109375, 4.39306640625, 4.7490234375, 5.10498046875, 5.4609375, 5.81689453125, 6.1728515625, 6.52880859375, 6.884765625, 7.24072265625, 7.5966796875, 7.95263671875, 8.30859375, 8.66455078125, 9.0205078125, 9.37646484375, 9.732421875, 10.08837890625, 10.4443359375, 10.80029296875, 11.15625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 4.0, 9.0, 11.0, 23.0, 13.0, 12.0, 20.0, 14.0, 31.0, 15.0, 26.0, 26.0, 38.0, 38.0, 44.0, 42.0, 41.0, 31.0, 36.0, 46.0, 32.0, 25.0, 36.0, 34.0, 35.0, 38.0, 29.0, 28.0, 30.0, 30.0, 25.0, 21.0, 22.0, 15.0, 19.0, 9.0, 12.0, 9.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.916015625, -9.62109375, -9.326171875, -9.03125, -8.736328125, -8.44140625, -8.146484375, -7.8515625, -7.556640625, -7.26171875, -6.966796875, -6.671875, -6.376953125, -6.08203125, -5.787109375, -5.4921875, -5.197265625, -4.90234375, -4.607421875, -4.3125, -4.017578125, -3.72265625, -3.427734375, -3.1328125, -2.837890625, -2.54296875, -2.248046875, -1.953125, -1.658203125, -1.36328125, -1.068359375, -0.7734375, -0.478515625, -0.18359375, 0.111328125, 0.40625, 0.701171875, 0.99609375, 1.291015625, 1.5859375, 1.880859375, 2.17578125, 2.470703125, 2.765625, 3.060546875, 3.35546875, 3.650390625, 3.9453125, 4.240234375, 4.53515625, 4.830078125, 5.125, 5.419921875, 5.71484375, 6.009765625, 6.3046875, 6.599609375, 6.89453125, 7.189453125, 7.484375, 7.779296875, 8.07421875, 8.369140625, 8.6640625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 14.0, 22.0, 28.0, 45.0, 63.0, 116.0, 157.0, 270.0, 403.0, 620.0, 993.0, 1535.0, 2505.0, 4017.0, 6493.0, 10540.0, 17329.0, 28287.0, 46008.0, 72705.0, 108436.0, 144506.0, 159874.0, 144256.0, 108111.0, 72303.0, 45800.0, 28284.0, 17109.0, 10625.0, 6595.0, 3843.0, 2488.0, 1487.0, 940.0, 655.0, 367.0, 243.0, 164.0, 113.0, 63.0, 33.0, 36.0, 23.0, 10.0, 11.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.748291015625, -12.35595703125, -11.963623046875, -11.5712890625, -11.178955078125, -10.78662109375, -10.394287109375, -10.001953125, -9.609619140625, -9.21728515625, -8.824951171875, -8.4326171875, -8.040283203125, -7.64794921875, -7.255615234375, -6.86328125, -6.470947265625, -6.07861328125, -5.686279296875, -5.2939453125, -4.901611328125, -4.50927734375, -4.116943359375, -3.724609375, -3.332275390625, -2.93994140625, -2.547607421875, -2.1552734375, -1.762939453125, -1.37060546875, -0.978271484375, -0.5859375, -0.193603515625, 0.19873046875, 0.591064453125, 0.9833984375, 1.375732421875, 1.76806640625, 2.160400390625, 2.552734375, 2.945068359375, 3.33740234375, 3.729736328125, 4.1220703125, 4.514404296875, 4.90673828125, 5.299072265625, 5.69140625, 6.083740234375, 6.47607421875, 6.868408203125, 7.2607421875, 7.653076171875, 8.04541015625, 8.437744140625, 8.830078125, 9.222412109375, 9.61474609375, 10.007080078125, 10.3994140625, 10.791748046875, 11.18408203125, 11.576416015625, 11.96875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 9.0, 4.0, 9.0, 8.0, 10.0, 9.0, 10.0, 14.0, 18.0, 19.0, 23.0, 25.0, 25.0, 25.0, 35.0, 44.0, 35.0, 29.0, 23.0, 42.0, 27.0, 24.0, 37.0, 49.0, 40.0, 44.0, 30.0, 37.0, 35.0, 33.0, 42.0, 24.0, 18.0, 23.0, 17.0, 22.0, 13.0, 13.0, 9.0, 13.0, 9.0, 4.0, 8.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.48828125, -5.31610107421875, -5.1439208984375, -4.97174072265625, -4.799560546875, -4.62738037109375, -4.4552001953125, -4.28302001953125, -4.11083984375, -3.93865966796875, -3.7664794921875, -3.59429931640625, -3.422119140625, -3.24993896484375, -3.0777587890625, -2.90557861328125, -2.7333984375, -2.56121826171875, -2.3890380859375, -2.21685791015625, -2.044677734375, -1.87249755859375, -1.7003173828125, -1.52813720703125, -1.35595703125, -1.18377685546875, -1.0115966796875, -0.83941650390625, -0.667236328125, -0.49505615234375, -0.3228759765625, -0.15069580078125, 0.021484375, 0.19366455078125, 0.3658447265625, 0.53802490234375, 0.710205078125, 0.88238525390625, 1.0545654296875, 1.22674560546875, 1.39892578125, 1.57110595703125, 1.7432861328125, 1.91546630859375, 2.087646484375, 2.25982666015625, 2.4320068359375, 2.60418701171875, 2.7763671875, 2.94854736328125, 3.1207275390625, 3.29290771484375, 3.465087890625, 3.63726806640625, 3.8094482421875, 3.98162841796875, 4.15380859375, 4.32598876953125, 4.4981689453125, 4.67034912109375, 4.842529296875, 5.01470947265625, 5.1868896484375, 5.35906982421875, 5.53125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 15.0, 32.0, 34.0, 53.0, 73.0, 101.0, 168.0, 223.0, 321.0, 495.0, 752.0, 1168.0, 1743.0, 2909.0, 4825.0, 8403.0, 14833.0, 29136.0, 60990.0, 132857.0, 253592.0, 261777.0, 140906.0, 64245.0, 30869.0, 15810.0, 8692.0, 4863.0, 3030.0, 1919.0, 1231.0, 839.0, 515.0, 332.0, 250.0, 155.0, 101.0, 77.0, 64.0, 46.0, 34.0, 11.0, 17.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-8.1953125, -7.947265625, -7.69921875, -7.451171875, -7.203125, -6.955078125, -6.70703125, -6.458984375, -6.2109375, -5.962890625, -5.71484375, -5.466796875, -5.21875, -4.970703125, -4.72265625, -4.474609375, -4.2265625, -3.978515625, -3.73046875, -3.482421875, -3.234375, -2.986328125, -2.73828125, -2.490234375, -2.2421875, -1.994140625, -1.74609375, -1.498046875, -1.25, -1.001953125, -0.75390625, -0.505859375, -0.2578125, -0.009765625, 0.23828125, 0.486328125, 0.734375, 0.982421875, 1.23046875, 1.478515625, 1.7265625, 1.974609375, 2.22265625, 2.470703125, 2.71875, 2.966796875, 3.21484375, 3.462890625, 3.7109375, 3.958984375, 4.20703125, 4.455078125, 4.703125, 4.951171875, 5.19921875, 5.447265625, 5.6953125, 5.943359375, 6.19140625, 6.439453125, 6.6875, 6.935546875, 7.18359375, 7.431640625, 7.6796875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 7.0, 5.0, 6.0, 11.0, 17.0, 15.0, 19.0, 29.0, 41.0, 41.0, 55.0, 52.0, 71.0, 77.0, 92.0, 72.0, 63.0, 75.0, 55.0, 42.0, 21.0, 23.0, 22.0, 11.0, 11.0, 13.0, 8.0, 5.0, 4.0, 3.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008358955383300781, -0.0008091703057289124, -0.0007824450731277466, -0.0007557198405265808, -0.000728994607925415, -0.0007022693753242493, -0.0006755441427230835, -0.0006488189101219177, -0.000622093677520752, -0.0005953684449195862, -0.0005686432123184204, -0.0005419179797172546, -0.0005151927471160889, -0.0004884675145149231, -0.0004617422819137573, -0.00043501704931259155, -0.0004082918167114258, -0.00038156658411026, -0.00035484135150909424, -0.00032811611890792847, -0.0003013908863067627, -0.0002746656537055969, -0.00024794042110443115, -0.00022121518850326538, -0.0001944899559020996, -0.00016776472330093384, -0.00014103949069976807, -0.0001143142580986023, -8.758902549743652e-05, -6.086379289627075e-05, -3.413856029510498e-05, -7.413327693939209e-06, 1.9311904907226562e-05, 4.6037137508392334e-05, 7.27623701095581e-05, 9.948760271072388e-05, 0.00012621283531188965, 0.00015293806791305542, 0.0001796633005142212, 0.00020638853311538696, 0.00023311376571655273, 0.0002598389983177185, 0.0002865642309188843, 0.00031328946352005005, 0.0003400146961212158, 0.0003667399287223816, 0.00039346516132354736, 0.00042019039392471313, 0.0004469156265258789, 0.0004736408591270447, 0.0005003660917282104, 0.0005270913243293762, 0.000553816556930542, 0.0005805417895317078, 0.0006072670221328735, 0.0006339922547340393, 0.0006607174873352051, 0.0006874427199363708, 0.0007141679525375366, 0.0007408931851387024, 0.0007676184177398682, 0.0007943436503410339, 0.0008210688829421997, 0.0008477941155433655, 0.0008745193481445312]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 10.0, 1.0, 3.0, 5.0, 10.0, 13.0, 19.0, 27.0, 46.0, 74.0, 105.0, 152.0, 242.0, 344.0, 589.0, 962.0, 1662.0, 2916.0, 5205.0, 10340.0, 20061.0, 42869.0, 91711.0, 194056.0, 286068.0, 203508.0, 97601.0, 44991.0, 21436.0, 10477.0, 5523.0, 3042.0, 1690.0, 1030.0, 688.0, 373.0, 247.0, 140.0, 80.0, 80.0, 55.0, 36.0, 24.0, 19.0, 14.0, 5.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.54296875, -7.29595947265625, -7.0489501953125, -6.80194091796875, -6.554931640625, -6.30792236328125, -6.0609130859375, -5.81390380859375, -5.56689453125, -5.31988525390625, -5.0728759765625, -4.82586669921875, -4.578857421875, -4.33184814453125, -4.0848388671875, -3.83782958984375, -3.5908203125, -3.34381103515625, -3.0968017578125, -2.84979248046875, -2.602783203125, -2.35577392578125, -2.1087646484375, -1.86175537109375, -1.61474609375, -1.36773681640625, -1.1207275390625, -0.87371826171875, -0.626708984375, -0.37969970703125, -0.1326904296875, 0.11431884765625, 0.361328125, 0.60833740234375, 0.8553466796875, 1.10235595703125, 1.349365234375, 1.59637451171875, 1.8433837890625, 2.09039306640625, 2.33740234375, 2.58441162109375, 2.8314208984375, 3.07843017578125, 3.325439453125, 3.57244873046875, 3.8194580078125, 4.06646728515625, 4.3134765625, 4.56048583984375, 4.8074951171875, 5.05450439453125, 5.301513671875, 5.54852294921875, 5.7955322265625, 6.04254150390625, 6.28955078125, 6.53656005859375, 6.7835693359375, 7.03057861328125, 7.277587890625, 7.52459716796875, 7.7716064453125, 8.01861572265625, 8.265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 5.0, 6.0, 11.0, 13.0, 15.0, 15.0, 18.0, 11.0, 23.0, 26.0, 31.0, 44.0, 36.0, 45.0, 35.0, 47.0, 52.0, 56.0, 49.0, 43.0, 46.0, 50.0, 40.0, 37.0, 39.0, 25.0, 18.0, 26.0, 18.0, 8.0, 21.0, 20.0, 12.0, 6.0, 10.0, 7.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3056640625, -1.2625885009765625, -1.219512939453125, -1.1764373779296875, -1.13336181640625, -1.0902862548828125, -1.047210693359375, -1.0041351318359375, -0.9610595703125, -0.9179840087890625, -0.874908447265625, -0.8318328857421875, -0.78875732421875, -0.7456817626953125, -0.702606201171875, -0.6595306396484375, -0.616455078125, -0.5733795166015625, -0.530303955078125, -0.4872283935546875, -0.44415283203125, -0.4010772705078125, -0.358001708984375, -0.3149261474609375, -0.2718505859375, -0.2287750244140625, -0.185699462890625, -0.1426239013671875, -0.09954833984375, -0.0564727783203125, -0.013397216796875, 0.0296783447265625, 0.07275390625, 0.1158294677734375, 0.158905029296875, 0.2019805908203125, 0.24505615234375, 0.2881317138671875, 0.331207275390625, 0.3742828369140625, 0.4173583984375, 0.4604339599609375, 0.503509521484375, 0.5465850830078125, 0.58966064453125, 0.6327362060546875, 0.675811767578125, 0.7188873291015625, 0.761962890625, 0.8050384521484375, 0.848114013671875, 0.8911895751953125, 0.93426513671875, 0.9773406982421875, 1.020416259765625, 1.0634918212890625, 1.1065673828125, 1.1496429443359375, 1.192718505859375, 1.2357940673828125, 1.27886962890625, 1.3219451904296875, 1.365020751953125, 1.4080963134765625, 1.451171875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 8.0, 10.0, 18.0, 33.0, 45.0, 83.0, 89.0, 125.0, 118.0, 125.0, 105.0, 70.0, 44.0, 31.0, 20.0, 18.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-41.80689239501953, -40.80168533325195, -39.796478271484375, -38.7912712097168, -37.78606414794922, -36.78085708618164, -35.77565002441406, -34.77044677734375, -33.765235900878906, -32.76002883911133, -31.75482177734375, -30.749614715576172, -29.744407653808594, -28.739200592041016, -27.73399543762207, -26.728788375854492, -25.723583221435547, -24.71837615966797, -23.71316909790039, -22.707962036132812, -21.702754974365234, -20.697547912597656, -19.69234275817871, -18.687135696411133, -17.681928634643555, -16.676721572875977, -15.671514511108398, -14.666308403015137, -13.661101341247559, -12.65589427947998, -11.650688171386719, -10.64548110961914, -9.640270233154297, -8.635063171386719, -7.629856586456299, -6.624650001525879, -5.619442939758301, -4.614235877990723, -3.6090292930603027, -2.603822708129883, -1.5986156463623047, -0.5934088230133057, 0.41179800033569336, 1.4170048236846924, 2.4222116470336914, 3.4274187088012695, 4.4326252937316895, 5.437831878662109, 6.4430389404296875, 7.448246002197266, 8.453453063964844, 9.458659172058105, 10.463866233825684, 11.469073295593262, 12.474279403686523, 13.479486465454102, 14.48469352722168, 15.489900588989258, 16.495107650756836, 17.500314712524414, 18.50551986694336, 19.510726928710938, 20.515933990478516, 21.521141052246094, 22.526348114013672]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0, 6.0, 13.0, 8.0, 14.0, 13.0, 20.0, 18.0, 20.0, 18.0, 27.0, 31.0, 30.0, 32.0, 32.0, 45.0, 36.0, 48.0, 49.0, 44.0, 33.0, 43.0, 36.0, 35.0, 38.0, 36.0, 29.0, 33.0, 24.0, 30.0, 25.0, 19.0, 17.0, 17.0, 19.0, 18.0, 11.0, 14.0, 7.0, 4.0, 5.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.87194538116455, -9.583544731140137, -9.295143127441406, -9.006742477416992, -8.718341827392578, -8.429941177368164, -8.141539573669434, -7.8531389236450195, -7.5647382736206055, -7.276337146759033, -6.987936496734619, -6.699535369873047, -6.411134719848633, -6.1227335929870605, -5.834332466125488, -5.545931816101074, -5.257530689239502, -4.96912956237793, -4.680728912353516, -4.392327785491943, -4.103927135467529, -3.815526008605957, -3.527125120162964, -3.2387242317199707, -2.9503233432769775, -2.6619224548339844, -2.373521566390991, -2.085120677947998, -1.7967196702957153, -1.5083187818527222, -1.2199177742004395, -0.9315168857574463, -0.6431159973144531, -0.3547150790691376, -0.06631416082382202, 0.22208678722381592, 0.5104876756668091, 0.7988885641098022, 1.087289571762085, 1.3756904602050781, 1.6640913486480713, 1.9524922370910645, 2.2408931255340576, 2.529294013977051, 2.817695140838623, 3.106095790863037, 3.3944969177246094, 3.6828978061676025, 3.9712986946105957, 4.259699821472168, 4.548100471496582, 4.836501598358154, 5.124902248382568, 5.413303375244141, 5.701704025268555, 5.990105152130127, 6.278506278991699, 6.5669074058532715, 6.8553080558776855, 7.143709182739258, 7.432109832763672, 7.720510959625244, 8.008912086486816, 8.29731273651123, 8.585713386535645]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 9.0, 8.0, 12.0, 20.0, 33.0, 38.0, 65.0, 100.0, 155.0, 257.0, 371.0, 628.0, 1013.0, 1666.0, 2971.0, 5443.0, 10076.0, 19378.0, 39645.0, 85456.0, 206799.0, 583575.0, 1424364.0, 1137368.0, 399460.0, 148983.0, 63446.0, 29864.0, 14972.0, 7753.0, 4247.0, 2438.0, 1439.0, 821.0, 527.0, 317.0, 214.0, 116.0, 86.0, 44.0, 30.0, 25.0, 18.0, 13.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.860107421875, -20.20458984375, -19.549072265625, -18.8935546875, -18.238037109375, -17.58251953125, -16.927001953125, -16.271484375, -15.615966796875, -14.96044921875, -14.304931640625, -13.6494140625, -12.993896484375, -12.33837890625, -11.682861328125, -11.02734375, -10.371826171875, -9.71630859375, -9.060791015625, -8.4052734375, -7.749755859375, -7.09423828125, -6.438720703125, -5.783203125, -5.127685546875, -4.47216796875, -3.816650390625, -3.1611328125, -2.505615234375, -1.85009765625, -1.194580078125, -0.5390625, 0.116455078125, 0.77197265625, 1.427490234375, 2.0830078125, 2.738525390625, 3.39404296875, 4.049560546875, 4.705078125, 5.360595703125, 6.01611328125, 6.671630859375, 7.3271484375, 7.982666015625, 8.63818359375, 9.293701171875, 9.94921875, 10.604736328125, 11.26025390625, 11.915771484375, 12.5712890625, 13.226806640625, 13.88232421875, 14.537841796875, 15.193359375, 15.848876953125, 16.50439453125, 17.159912109375, 17.8154296875, 18.470947265625, 19.12646484375, 19.781982421875, 20.4375]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 11.0, 12.0, 10.0, 21.0, 20.0, 24.0, 30.0, 16.0, 29.0, 25.0, 28.0, 41.0, 42.0, 42.0, 37.0, 38.0, 39.0, 36.0, 50.0, 42.0, 38.0, 29.0, 29.0, 30.0, 31.0, 24.0, 23.0, 26.0, 22.0, 23.0, 14.0, 19.0, 14.0, 19.0, 11.0, 8.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.52734375, -7.30157470703125, -7.0758056640625, -6.85003662109375, -6.624267578125, -6.39849853515625, -6.1727294921875, -5.94696044921875, -5.72119140625, -5.49542236328125, -5.2696533203125, -5.04388427734375, -4.818115234375, -4.59234619140625, -4.3665771484375, -4.14080810546875, -3.9150390625, -3.68927001953125, -3.4635009765625, -3.23773193359375, -3.011962890625, -2.78619384765625, -2.5604248046875, -2.33465576171875, -2.10888671875, -1.88311767578125, -1.6573486328125, -1.43157958984375, -1.205810546875, -0.98004150390625, -0.7542724609375, -0.52850341796875, -0.302734375, -0.07696533203125, 0.1488037109375, 0.37457275390625, 0.600341796875, 0.82611083984375, 1.0518798828125, 1.27764892578125, 1.50341796875, 1.72918701171875, 1.9549560546875, 2.18072509765625, 2.406494140625, 2.63226318359375, 2.8580322265625, 3.08380126953125, 3.3095703125, 3.53533935546875, 3.7611083984375, 3.98687744140625, 4.212646484375, 4.43841552734375, 4.6641845703125, 4.88995361328125, 5.11572265625, 5.34149169921875, 5.5672607421875, 5.79302978515625, 6.018798828125, 6.24456787109375, 6.4703369140625, 6.69610595703125, 6.921875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 10.0, 10.0, 12.0, 17.0, 21.0, 32.0, 43.0, 68.0, 89.0, 136.0, 199.0, 272.0, 428.0, 654.0, 955.0, 1425.0, 2128.0, 3377.0, 5258.0, 8381.0, 14030.0, 24099.0, 42622.0, 79368.0, 154592.0, 316321.0, 658469.0, 1134154.0, 874204.0, 430051.0, 206840.0, 103619.0, 55543.0, 30258.0, 17527.0, 10656.0, 6453.0, 4048.0, 2611.0, 1755.0, 1117.0, 756.0, 558.0, 406.0, 250.0, 152.0, 112.0, 72.0, 53.0, 35.0, 13.0, 10.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-17.90625, -17.341552734375, -16.77685546875, -16.212158203125, -15.6474609375, -15.082763671875, -14.51806640625, -13.953369140625, -13.388671875, -12.823974609375, -12.25927734375, -11.694580078125, -11.1298828125, -10.565185546875, -10.00048828125, -9.435791015625, -8.87109375, -8.306396484375, -7.74169921875, -7.177001953125, -6.6123046875, -6.047607421875, -5.48291015625, -4.918212890625, -4.353515625, -3.788818359375, -3.22412109375, -2.659423828125, -2.0947265625, -1.530029296875, -0.96533203125, -0.400634765625, 0.1640625, 0.728759765625, 1.29345703125, 1.858154296875, 2.4228515625, 2.987548828125, 3.55224609375, 4.116943359375, 4.681640625, 5.246337890625, 5.81103515625, 6.375732421875, 6.9404296875, 7.505126953125, 8.06982421875, 8.634521484375, 9.19921875, 9.763916015625, 10.32861328125, 10.893310546875, 11.4580078125, 12.022705078125, 12.58740234375, 13.152099609375, 13.716796875, 14.281494140625, 14.84619140625, 15.410888671875, 15.9755859375, 16.540283203125, 17.10498046875, 17.669677734375, 18.234375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 7.0, 8.0, 11.0, 13.0, 16.0, 27.0, 42.0, 40.0, 59.0, 77.0, 93.0, 123.0, 158.0, 170.0, 238.0, 276.0, 320.0, 351.0, 382.0, 321.0, 279.0, 211.0, 179.0, 148.0, 114.0, 93.0, 100.0, 50.0, 47.0, 31.0, 14.0, 15.0, 12.0, 8.0, 9.0, 10.0, 3.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.7998046875, -4.615234375, -4.4306640625, -4.24609375, -4.0615234375, -3.876953125, -3.6923828125, -3.5078125, -3.3232421875, -3.138671875, -2.9541015625, -2.76953125, -2.5849609375, -2.400390625, -2.2158203125, -2.03125, -1.8466796875, -1.662109375, -1.4775390625, -1.29296875, -1.1083984375, -0.923828125, -0.7392578125, -0.5546875, -0.3701171875, -0.185546875, -0.0009765625, 0.18359375, 0.3681640625, 0.552734375, 0.7373046875, 0.921875, 1.1064453125, 1.291015625, 1.4755859375, 1.66015625, 1.8447265625, 2.029296875, 2.2138671875, 2.3984375, 2.5830078125, 2.767578125, 2.9521484375, 3.13671875, 3.3212890625, 3.505859375, 3.6904296875, 3.875, 4.0595703125, 4.244140625, 4.4287109375, 4.61328125, 4.7978515625, 4.982421875, 5.1669921875, 5.3515625, 5.5361328125, 5.720703125, 5.9052734375, 6.08984375, 6.2744140625, 6.458984375, 6.6435546875, 6.828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 11.0, 10.0, 25.0, 22.0, 32.0, 55.0, 66.0, 81.0, 104.0, 109.0, 105.0, 86.0, 64.0, 48.0, 39.0, 36.0, 27.0, 17.0, 17.0, 4.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.340173721313477, -29.491859436035156, -28.64354705810547, -27.79523277282715, -26.946918487548828, -26.09860610961914, -25.25029182434082, -24.4019775390625, -23.553665161132812, -22.705350875854492, -21.857038497924805, -21.008724212646484, -20.160409927368164, -19.312097549438477, -18.463783264160156, -17.61547088623047, -16.767154693603516, -15.918841361999512, -15.070527076721191, -14.222213745117188, -13.373900413513184, -12.52558708190918, -11.67727279663086, -10.828959465026855, -9.980646133422852, -9.132332801818848, -8.284018516540527, -7.435705184936523, -6.5873918533325195, -5.739078044891357, -4.890764236450195, -4.042450904846191, -3.1941375732421875, -2.3458240032196045, -1.497510313987732, -0.6491966247558594, 0.19911694526672363, 1.0474305152893066, 1.8957443237304688, 2.7440576553344727, 3.5923714637756348, 4.440685272216797, 5.288998603820801, 6.137312412261963, 6.985626220703125, 7.833939552307129, 8.682252883911133, 9.530567169189453, 10.378880500793457, 11.227193832397461, 12.075508117675781, 12.923821449279785, 13.772134780883789, 14.62044906616211, 15.468762397766113, 16.317075729370117, 17.165390014648438, 18.013704299926758, 18.862016677856445, 19.710330963134766, 20.558645248413086, 21.406957626342773, 22.255271911621094, 23.10358428955078, 23.9518985748291]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 9.0, 7.0, 7.0, 7.0, 9.0, 14.0, 13.0, 28.0, 18.0, 17.0, 21.0, 28.0, 28.0, 38.0, 33.0, 31.0, 34.0, 42.0, 42.0, 34.0, 38.0, 33.0, 52.0, 23.0, 29.0, 35.0, 35.0, 38.0, 17.0, 30.0, 38.0, 23.0, 24.0, 13.0, 20.0, 20.0, 18.0, 11.0, 11.0, 9.0, 6.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.113921165466309, -9.834427833557129, -9.55493450164795, -9.27544116973877, -8.99594783782959, -8.71645450592041, -8.43696117401123, -8.157466888427734, -7.877974033355713, -7.598480701446533, -7.3189873695373535, -7.039494037628174, -6.760000228881836, -6.480506896972656, -6.201013565063477, -5.921520233154297, -5.642026901245117, -5.3625335693359375, -5.083040237426758, -4.803546905517578, -4.524053573608398, -4.244560241699219, -3.965066432952881, -3.685573101043701, -3.4060797691345215, -3.126586437225342, -2.847093105316162, -2.5675995349884033, -2.2881062030792236, -2.008612871170044, -1.7291194200515747, -1.4496259689331055, -1.1701335906982422, -0.8906401991844177, -0.6111468076705933, -0.3316534161567688, -0.052160024642944336, 0.22733330726623535, 0.5068267583847046, 0.7863202095031738, 1.0658135414123535, 1.3453068733215332, 1.6248003244400024, 1.9042937755584717, 2.1837871074676514, 2.463280439376831, 2.74277400970459, 3.0222673416137695, 3.301760673522949, 3.581254005432129, 3.8607473373413086, 4.140240669250488, 4.419734001159668, 4.699227333068848, 4.9787211418151855, 5.258214473724365, 5.537707805633545, 5.817201137542725, 6.096694469451904, 6.376187801361084, 6.655681610107422, 6.935174942016602, 7.214668273925781, 7.494161605834961, 7.773654937744141]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 16.0, 24.0, 19.0, 33.0, 35.0, 57.0, 80.0, 121.0, 217.0, 307.0, 459.0, 718.0, 1131.0, 2037.0, 3921.0, 8432.0, 20570.0, 55689.0, 161836.0, 354161.0, 274708.0, 101690.0, 35527.0, 13694.0, 5890.0, 2883.0, 1568.0, 935.0, 630.0, 371.0, 214.0, 182.0, 129.0, 66.0, 59.0, 44.0, 25.0, 21.0, 11.0, 12.0, 13.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.46630859375, -14.9638671875, -14.46142578125, -13.958984375, -13.45654296875, -12.9541015625, -12.45166015625, -11.94921875, -11.44677734375, -10.9443359375, -10.44189453125, -9.939453125, -9.43701171875, -8.9345703125, -8.43212890625, -7.9296875, -7.42724609375, -6.9248046875, -6.42236328125, -5.919921875, -5.41748046875, -4.9150390625, -4.41259765625, -3.91015625, -3.40771484375, -2.9052734375, -2.40283203125, -1.900390625, -1.39794921875, -0.8955078125, -0.39306640625, 0.109375, 0.61181640625, 1.1142578125, 1.61669921875, 2.119140625, 2.62158203125, 3.1240234375, 3.62646484375, 4.12890625, 4.63134765625, 5.1337890625, 5.63623046875, 6.138671875, 6.64111328125, 7.1435546875, 7.64599609375, 8.1484375, 8.65087890625, 9.1533203125, 9.65576171875, 10.158203125, 10.66064453125, 11.1630859375, 11.66552734375, 12.16796875, 12.67041015625, 13.1728515625, 13.67529296875, 14.177734375, 14.68017578125, 15.1826171875, 15.68505859375, 16.1875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 4.0, 7.0, 3.0, 8.0, 13.0, 17.0, 18.0, 12.0, 13.0, 21.0, 27.0, 28.0, 27.0, 33.0, 28.0, 38.0, 43.0, 39.0, 39.0, 34.0, 30.0, 32.0, 35.0, 40.0, 31.0, 44.0, 31.0, 32.0, 36.0, 28.0, 37.0, 19.0, 18.0, 24.0, 16.0, 18.0, 18.0, 11.0, 11.0, 7.0, 2.0, 6.0, 4.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.5625, -10.2435302734375, -9.924560546875, -9.6055908203125, -9.28662109375, -8.9676513671875, -8.648681640625, -8.3297119140625, -8.0107421875, -7.6917724609375, -7.372802734375, -7.0538330078125, -6.73486328125, -6.4158935546875, -6.096923828125, -5.7779541015625, -5.458984375, -5.1400146484375, -4.821044921875, -4.5020751953125, -4.18310546875, -3.8641357421875, -3.545166015625, -3.2261962890625, -2.9072265625, -2.5882568359375, -2.269287109375, -1.9503173828125, -1.63134765625, -1.3123779296875, -0.993408203125, -0.6744384765625, -0.35546875, -0.0364990234375, 0.282470703125, 0.6014404296875, 0.92041015625, 1.2393798828125, 1.558349609375, 1.8773193359375, 2.1962890625, 2.5152587890625, 2.834228515625, 3.1531982421875, 3.47216796875, 3.7911376953125, 4.110107421875, 4.4290771484375, 4.748046875, 5.0670166015625, 5.385986328125, 5.7049560546875, 6.02392578125, 6.3428955078125, 6.661865234375, 6.9808349609375, 7.2998046875, 7.6187744140625, 7.937744140625, 8.2567138671875, 8.57568359375, 8.8946533203125, 9.213623046875, 9.5325927734375, 9.8515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 11.0, 15.0, 19.0, 29.0, 28.0, 35.0, 41.0, 79.0, 84.0, 129.0, 199.0, 263.0, 428.0, 720.0, 1245.0, 2476.0, 4868.0, 11569.0, 32223.0, 112125.0, 389216.0, 348207.0, 96300.0, 28030.0, 10347.0, 4429.0, 2203.0, 1209.0, 663.0, 418.0, 275.0, 178.0, 135.0, 76.0, 78.0, 49.0, 44.0, 25.0, 13.0, 13.0, 13.0, 11.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.796875, -21.114501953125, -20.43212890625, -19.749755859375, -19.0673828125, -18.385009765625, -17.70263671875, -17.020263671875, -16.337890625, -15.655517578125, -14.97314453125, -14.290771484375, -13.6083984375, -12.926025390625, -12.24365234375, -11.561279296875, -10.87890625, -10.196533203125, -9.51416015625, -8.831787109375, -8.1494140625, -7.467041015625, -6.78466796875, -6.102294921875, -5.419921875, -4.737548828125, -4.05517578125, -3.372802734375, -2.6904296875, -2.008056640625, -1.32568359375, -0.643310546875, 0.0390625, 0.721435546875, 1.40380859375, 2.086181640625, 2.7685546875, 3.450927734375, 4.13330078125, 4.815673828125, 5.498046875, 6.180419921875, 6.86279296875, 7.545166015625, 8.2275390625, 8.909912109375, 9.59228515625, 10.274658203125, 10.95703125, 11.639404296875, 12.32177734375, 13.004150390625, 13.6865234375, 14.368896484375, 15.05126953125, 15.733642578125, 16.416015625, 17.098388671875, 17.78076171875, 18.463134765625, 19.1455078125, 19.827880859375, 20.51025390625, 21.192626953125, 21.875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 3.0, 2.0, 8.0, 5.0, 8.0, 12.0, 14.0, 13.0, 18.0, 20.0, 25.0, 29.0, 20.0, 28.0, 35.0, 32.0, 37.0, 31.0, 42.0, 42.0, 41.0, 36.0, 38.0, 36.0, 35.0, 29.0, 42.0, 42.0, 30.0, 33.0, 34.0, 28.0, 23.0, 18.0, 15.0, 17.0, 13.0, 9.0, 10.0, 6.0, 6.0, 7.0, 4.0, 10.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.703125, -6.50433349609375, -6.3055419921875, -6.10675048828125, -5.907958984375, -5.70916748046875, -5.5103759765625, -5.31158447265625, -5.11279296875, -4.91400146484375, -4.7152099609375, -4.51641845703125, -4.317626953125, -4.11883544921875, -3.9200439453125, -3.72125244140625, -3.5224609375, -3.32366943359375, -3.1248779296875, -2.92608642578125, -2.727294921875, -2.52850341796875, -2.3297119140625, -2.13092041015625, -1.93212890625, -1.73333740234375, -1.5345458984375, -1.33575439453125, -1.136962890625, -0.93817138671875, -0.7393798828125, -0.54058837890625, -0.341796875, -0.14300537109375, 0.0557861328125, 0.25457763671875, 0.453369140625, 0.65216064453125, 0.8509521484375, 1.04974365234375, 1.24853515625, 1.44732666015625, 1.6461181640625, 1.84490966796875, 2.043701171875, 2.24249267578125, 2.4412841796875, 2.64007568359375, 2.8388671875, 3.03765869140625, 3.2364501953125, 3.43524169921875, 3.634033203125, 3.83282470703125, 4.0316162109375, 4.23040771484375, 4.42919921875, 4.62799072265625, 4.8267822265625, 5.02557373046875, 5.224365234375, 5.42315673828125, 5.6219482421875, 5.82073974609375, 6.01953125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 11.0, 25.0, 19.0, 28.0, 31.0, 47.0, 72.0, 109.0, 131.0, 196.0, 245.0, 357.0, 489.0, 776.0, 1097.0, 1628.0, 2517.0, 4584.0, 12430.0, 135020.0, 801301.0, 67327.0, 8963.0, 3882.0, 2328.0, 1481.0, 1022.0, 667.0, 482.0, 366.0, 255.0, 158.0, 140.0, 91.0, 75.0, 61.0, 34.0, 27.0, 9.0, 18.0, 4.0, 8.0, 10.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.296875, -19.670166015625, -19.04345703125, -18.416748046875, -17.7900390625, -17.163330078125, -16.53662109375, -15.909912109375, -15.283203125, -14.656494140625, -14.02978515625, -13.403076171875, -12.7763671875, -12.149658203125, -11.52294921875, -10.896240234375, -10.26953125, -9.642822265625, -9.01611328125, -8.389404296875, -7.7626953125, -7.135986328125, -6.50927734375, -5.882568359375, -5.255859375, -4.629150390625, -4.00244140625, -3.375732421875, -2.7490234375, -2.122314453125, -1.49560546875, -0.868896484375, -0.2421875, 0.384521484375, 1.01123046875, 1.637939453125, 2.2646484375, 2.891357421875, 3.51806640625, 4.144775390625, 4.771484375, 5.398193359375, 6.02490234375, 6.651611328125, 7.2783203125, 7.905029296875, 8.53173828125, 9.158447265625, 9.78515625, 10.411865234375, 11.03857421875, 11.665283203125, 12.2919921875, 12.918701171875, 13.54541015625, 14.172119140625, 14.798828125, 15.425537109375, 16.05224609375, 16.678955078125, 17.3056640625, 17.932373046875, 18.55908203125, 19.185791015625, 19.8125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 8.0, 35.0, 82.0, 229.0, 343.0, 174.0, 75.0, 20.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016126632690429688, -0.0015612393617630005, -0.0015098154544830322, -0.001458391547203064, -0.0014069676399230957, -0.0013555437326431274, -0.0013041198253631592, -0.001252695918083191, -0.0012012720108032227, -0.0011498481035232544, -0.0010984241962432861, -0.0010470002889633179, -0.0009955763816833496, -0.0009441524744033813, -0.0008927285671234131, -0.0008413046598434448, -0.0007898807525634766, -0.0007384568452835083, -0.00068703293800354, -0.0006356090307235718, -0.0005841851234436035, -0.0005327612161636353, -0.000481337308883667, -0.00042991340160369873, -0.00037848949432373047, -0.0003270655870437622, -0.00027564167976379395, -0.00022421777248382568, -0.00017279386520385742, -0.00012136995792388916, -6.99460506439209e-05, -1.8522143363952637e-05, 3.2901763916015625e-05, 8.432567119598389e-05, 0.00013574957847595215, 0.0001871734857559204, 0.00023859739303588867, 0.00029002130031585693, 0.0003414452075958252, 0.00039286911487579346, 0.0004442930221557617, 0.00049571692943573, 0.0005471408367156982, 0.0005985647439956665, 0.0006499886512756348, 0.000701412558555603, 0.0007528364658355713, 0.0008042603731155396, 0.0008556842803955078, 0.0009071081876754761, 0.0009585320949554443, 0.0010099560022354126, 0.0010613799095153809, 0.0011128038167953491, 0.0011642277240753174, 0.0012156516313552856, 0.001267075538635254, 0.0013184994459152222, 0.0013699233531951904, 0.0014213472604751587, 0.001472771167755127, 0.0015241950750350952, 0.0015756189823150635, 0.0016270428895950317, 0.001678466796875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 15.0, 24.0, 30.0, 34.0, 48.0, 67.0, 76.0, 147.0, 151.0, 218.0, 289.0, 387.0, 522.0, 686.0, 996.0, 1255.0, 1918.0, 2628.0, 3989.0, 7384.0, 25360.0, 162974.0, 598512.0, 190508.0, 28448.0, 7939.0, 4161.0, 2720.0, 1862.0, 1417.0, 1004.0, 687.0, 567.0, 412.0, 259.0, 234.0, 169.0, 123.0, 75.0, 66.0, 68.0, 30.0, 24.0, 24.0, 16.0, 6.0, 7.0, 9.0, 2.0, 1.0, 2.0, 1.0], "bins": [-13.765625, -13.3670654296875, -12.968505859375, -12.5699462890625, -12.17138671875, -11.7728271484375, -11.374267578125, -10.9757080078125, -10.5771484375, -10.1785888671875, -9.780029296875, -9.3814697265625, -8.98291015625, -8.5843505859375, -8.185791015625, -7.7872314453125, -7.388671875, -6.9901123046875, -6.591552734375, -6.1929931640625, -5.79443359375, -5.3958740234375, -4.997314453125, -4.5987548828125, -4.2001953125, -3.8016357421875, -3.403076171875, -3.0045166015625, -2.60595703125, -2.2073974609375, -1.808837890625, -1.4102783203125, -1.01171875, -0.6131591796875, -0.214599609375, 0.1839599609375, 0.58251953125, 0.9810791015625, 1.379638671875, 1.7781982421875, 2.1767578125, 2.5753173828125, 2.973876953125, 3.3724365234375, 3.77099609375, 4.1695556640625, 4.568115234375, 4.9666748046875, 5.365234375, 5.7637939453125, 6.162353515625, 6.5609130859375, 6.95947265625, 7.3580322265625, 7.756591796875, 8.1551513671875, 8.5537109375, 8.9522705078125, 9.350830078125, 9.7493896484375, 10.14794921875, 10.5465087890625, 10.945068359375, 11.3436279296875, 11.7421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 10.0, 14.0, 27.0, 39.0, 88.0, 101.0, 159.0, 154.0, 151.0, 90.0, 55.0, 41.0, 24.0, 14.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.73046875, -2.645843505859375, -2.56121826171875, -2.476593017578125, -2.3919677734375, -2.307342529296875, -2.22271728515625, -2.138092041015625, -2.053466796875, -1.968841552734375, -1.88421630859375, -1.799591064453125, -1.7149658203125, -1.630340576171875, -1.54571533203125, -1.461090087890625, -1.37646484375, -1.291839599609375, -1.20721435546875, -1.122589111328125, -1.0379638671875, -0.953338623046875, -0.86871337890625, -0.784088134765625, -0.699462890625, -0.614837646484375, -0.53021240234375, -0.445587158203125, -0.3609619140625, -0.276336669921875, -0.19171142578125, -0.107086181640625, -0.0224609375, 0.062164306640625, 0.14678955078125, 0.231414794921875, 0.3160400390625, 0.400665283203125, 0.48529052734375, 0.569915771484375, 0.654541015625, 0.739166259765625, 0.82379150390625, 0.908416748046875, 0.9930419921875, 1.077667236328125, 1.16229248046875, 1.246917724609375, 1.33154296875, 1.416168212890625, 1.50079345703125, 1.585418701171875, 1.6700439453125, 1.754669189453125, 1.83929443359375, 1.923919677734375, 2.008544921875, 2.093170166015625, 2.17779541015625, 2.262420654296875, 2.3470458984375, 2.431671142578125, 2.51629638671875, 2.600921630859375, 2.685546875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 6.0, 8.0, 8.0, 15.0, 9.0, 33.0, 32.0, 46.0, 77.0, 73.0, 104.0, 115.0, 108.0, 81.0, 62.0, 52.0, 34.0, 33.0, 32.0, 17.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.375194549560547, -29.5250244140625, -28.674854278564453, -27.824682235717773, -26.974512100219727, -26.12434196472168, -25.274169921875, -24.423999786376953, -23.573829650878906, -22.72365951538086, -21.873489379882812, -21.023317337036133, -20.173147201538086, -19.32297706604004, -18.47280502319336, -17.622634887695312, -16.772464752197266, -15.922294616699219, -15.072123527526855, -14.221952438354492, -13.371782302856445, -12.521612167358398, -11.671441078186035, -10.821269989013672, -9.971099853515625, -9.120929718017578, -8.270758628845215, -7.42058801651001, -6.570417404174805, -5.7202467918396, -4.8700761795043945, -4.0199055671691895, -3.1697330474853516, -2.3195624351501465, -1.4693918228149414, -0.6192212104797363, 0.23094940185546875, 1.0811200141906738, 1.931290626525879, 2.781461238861084, 3.631631851196289, 4.481802463531494, 5.331973075866699, 6.182143688201904, 7.032314300537109, 7.8824849128723145, 8.73265552520752, 9.582826614379883, 10.43299674987793, 11.283166885375977, 12.13333797454834, 12.983509063720703, 13.83367919921875, 14.683849334716797, 15.53402042388916, 16.384191513061523, 17.23436164855957, 18.084531784057617, 18.934703826904297, 19.784873962402344, 20.63504409790039, 21.485214233398438, 22.335384368896484, 23.185556411743164, 24.03572654724121]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 10.0, 9.0, 7.0, 7.0, 8.0, 11.0, 19.0, 18.0, 23.0, 24.0, 17.0, 19.0, 25.0, 39.0, 39.0, 36.0, 39.0, 37.0, 35.0, 38.0, 33.0, 48.0, 32.0, 39.0, 24.0, 29.0, 34.0, 36.0, 27.0, 33.0, 23.0, 28.0, 30.0, 14.0, 18.0, 16.0, 19.0, 15.0, 10.0, 7.0, 9.0, 8.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.759055137634277, -9.482192039489746, -9.205327987670898, -8.928464889526367, -8.651601791381836, -8.374738693237305, -8.097875595092773, -7.821011543273926, -7.5441484451293945, -7.267285346984863, -6.990421772003174, -6.713558197021484, -6.436695098876953, -6.159832000732422, -5.882968425750732, -5.606104850769043, -5.329241752624512, -5.0523786544799805, -4.775515079498291, -4.498651504516602, -4.22178840637207, -3.94492506980896, -3.6680617332458496, -3.3911983966827393, -3.114335060119629, -2.8374717235565186, -2.560608386993408, -2.283745050430298, -2.0068817138671875, -1.7300183773040771, -1.4531550407409668, -1.1762917041778564, -0.8994288444519043, -0.622565507888794, -0.3457021713256836, -0.06883883476257324, 0.2080245018005371, 0.48488783836364746, 0.7617511749267578, 1.0386145114898682, 1.3154778480529785, 1.5923411846160889, 1.8692045211791992, 2.1460678577423096, 2.42293119430542, 2.6997945308685303, 2.9766578674316406, 3.253521203994751, 3.5303845405578613, 3.8072478771209717, 4.084111213684082, 4.360974311828613, 4.637837886810303, 4.914701461791992, 5.191564559936523, 5.468427658081055, 5.745291233062744, 6.022154808044434, 6.299017906188965, 6.575881004333496, 6.8527445793151855, 7.129608154296875, 7.406471252441406, 7.6833343505859375, 7.960197925567627]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 4.0, 4.0, 13.0, 16.0, 23.0, 46.0, 47.0, 77.0, 122.0, 192.0, 324.0, 530.0, 827.0, 1321.0, 2094.0, 3631.0, 5817.0, 9615.0, 16236.0, 26571.0, 42992.0, 68960.0, 104640.0, 143871.0, 164709.0, 149578.0, 111097.0, 74558.0, 46901.0, 29212.0, 17540.0, 10652.0, 6355.0, 3863.0, 2361.0, 1460.0, 864.0, 520.0, 340.0, 223.0, 130.0, 75.0, 37.0, 38.0, 27.0, 21.0, 9.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8671875, -11.43701171875, -11.0068359375, -10.57666015625, -10.146484375, -9.71630859375, -9.2861328125, -8.85595703125, -8.42578125, -7.99560546875, -7.5654296875, -7.13525390625, -6.705078125, -6.27490234375, -5.8447265625, -5.41455078125, -4.984375, -4.55419921875, -4.1240234375, -3.69384765625, -3.263671875, -2.83349609375, -2.4033203125, -1.97314453125, -1.54296875, -1.11279296875, -0.6826171875, -0.25244140625, 0.177734375, 0.60791015625, 1.0380859375, 1.46826171875, 1.8984375, 2.32861328125, 2.7587890625, 3.18896484375, 3.619140625, 4.04931640625, 4.4794921875, 4.90966796875, 5.33984375, 5.77001953125, 6.2001953125, 6.63037109375, 7.060546875, 7.49072265625, 7.9208984375, 8.35107421875, 8.78125, 9.21142578125, 9.6416015625, 10.07177734375, 10.501953125, 10.93212890625, 11.3623046875, 11.79248046875, 12.22265625, 12.65283203125, 13.0830078125, 13.51318359375, 13.943359375, 14.37353515625, 14.8037109375, 15.23388671875, 15.6640625]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 10.0, 9.0, 4.0, 9.0, 14.0, 15.0, 18.0, 23.0, 20.0, 25.0, 41.0, 31.0, 35.0, 44.0, 34.0, 32.0, 40.0, 61.0, 54.0, 38.0, 38.0, 49.0, 32.0, 42.0, 36.0, 33.0, 26.0, 27.0, 34.0, 20.0, 18.0, 18.0, 13.0, 15.0, 14.0, 9.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.2109375, -12.8529052734375, -12.494873046875, -12.1368408203125, -11.77880859375, -11.4207763671875, -11.062744140625, -10.7047119140625, -10.3466796875, -9.9886474609375, -9.630615234375, -9.2725830078125, -8.91455078125, -8.5565185546875, -8.198486328125, -7.8404541015625, -7.482421875, -7.1243896484375, -6.766357421875, -6.4083251953125, -6.05029296875, -5.6922607421875, -5.334228515625, -4.9761962890625, -4.6181640625, -4.2601318359375, -3.902099609375, -3.5440673828125, -3.18603515625, -2.8280029296875, -2.469970703125, -2.1119384765625, -1.75390625, -1.3958740234375, -1.037841796875, -0.6798095703125, -0.32177734375, 0.0362548828125, 0.394287109375, 0.7523193359375, 1.1103515625, 1.4683837890625, 1.826416015625, 2.1844482421875, 2.54248046875, 2.9005126953125, 3.258544921875, 3.6165771484375, 3.974609375, 4.3326416015625, 4.690673828125, 5.0487060546875, 5.40673828125, 5.7647705078125, 6.122802734375, 6.4808349609375, 6.8388671875, 7.1968994140625, 7.554931640625, 7.9129638671875, 8.27099609375, 8.6290283203125, 8.987060546875, 9.3450927734375, 9.703125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 12.0, 29.0, 38.0, 51.0, 88.0, 119.0, 161.0, 266.0, 425.0, 674.0, 1095.0, 1707.0, 2715.0, 4535.0, 7550.0, 12685.0, 21700.0, 37079.0, 63363.0, 103041.0, 150483.0, 179358.0, 162906.0, 116654.0, 73974.0, 43786.0, 26189.0, 15249.0, 8697.0, 5255.0, 3184.0, 1981.0, 1297.0, 756.0, 536.0, 319.0, 224.0, 134.0, 75.0, 62.0, 34.0, 19.0, 15.0, 14.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.625, -14.1318359375, -13.638671875, -13.1455078125, -12.65234375, -12.1591796875, -11.666015625, -11.1728515625, -10.6796875, -10.1865234375, -9.693359375, -9.2001953125, -8.70703125, -8.2138671875, -7.720703125, -7.2275390625, -6.734375, -6.2412109375, -5.748046875, -5.2548828125, -4.76171875, -4.2685546875, -3.775390625, -3.2822265625, -2.7890625, -2.2958984375, -1.802734375, -1.3095703125, -0.81640625, -0.3232421875, 0.169921875, 0.6630859375, 1.15625, 1.6494140625, 2.142578125, 2.6357421875, 3.12890625, 3.6220703125, 4.115234375, 4.6083984375, 5.1015625, 5.5947265625, 6.087890625, 6.5810546875, 7.07421875, 7.5673828125, 8.060546875, 8.5537109375, 9.046875, 9.5400390625, 10.033203125, 10.5263671875, 11.01953125, 11.5126953125, 12.005859375, 12.4990234375, 12.9921875, 13.4853515625, 13.978515625, 14.4716796875, 14.96484375, 15.4580078125, 15.951171875, 16.4443359375, 16.9375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 3.0, 8.0, 8.0, 7.0, 9.0, 12.0, 17.0, 13.0, 22.0, 17.0, 29.0, 43.0, 35.0, 24.0, 32.0, 39.0, 37.0, 52.0, 50.0, 34.0, 34.0, 46.0, 35.0, 44.0, 31.0, 45.0, 42.0, 28.0, 18.0, 26.0, 29.0, 24.0, 14.0, 23.0, 13.0, 10.0, 8.0, 6.0, 7.0, 7.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.4296875, -7.21636962890625, -7.0030517578125, -6.78973388671875, -6.576416015625, -6.36309814453125, -6.1497802734375, -5.93646240234375, -5.72314453125, -5.50982666015625, -5.2965087890625, -5.08319091796875, -4.869873046875, -4.65655517578125, -4.4432373046875, -4.22991943359375, -4.0166015625, -3.80328369140625, -3.5899658203125, -3.37664794921875, -3.163330078125, -2.95001220703125, -2.7366943359375, -2.52337646484375, -2.31005859375, -2.09674072265625, -1.8834228515625, -1.67010498046875, -1.456787109375, -1.24346923828125, -1.0301513671875, -0.81683349609375, -0.603515625, -0.39019775390625, -0.1768798828125, 0.03643798828125, 0.249755859375, 0.46307373046875, 0.6763916015625, 0.88970947265625, 1.10302734375, 1.31634521484375, 1.5296630859375, 1.74298095703125, 1.956298828125, 2.16961669921875, 2.3829345703125, 2.59625244140625, 2.8095703125, 3.02288818359375, 3.2362060546875, 3.44952392578125, 3.662841796875, 3.87615966796875, 4.0894775390625, 4.30279541015625, 4.51611328125, 4.72943115234375, 4.9427490234375, 5.15606689453125, 5.369384765625, 5.58270263671875, 5.7960205078125, 6.00933837890625, 6.22265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 11.0, 12.0, 23.0, 27.0, 37.0, 81.0, 88.0, 112.0, 152.0, 241.0, 401.0, 594.0, 812.0, 1250.0, 1949.0, 3089.0, 5005.0, 8278.0, 13986.0, 24963.0, 45288.0, 86016.0, 158884.0, 236117.0, 203224.0, 116700.0, 61830.0, 33101.0, 18418.0, 10615.0, 6238.0, 3775.0, 2400.0, 1580.0, 1029.0, 708.0, 475.0, 311.0, 227.0, 139.0, 102.0, 61.0, 58.0, 43.0, 35.0, 23.0, 14.0, 6.0, 7.0, 9.0, 5.0, 0.0, 5.0], "bins": [-8.4140625, -8.171875, -7.9296875, -7.6875, -7.4453125, -7.203125, -6.9609375, -6.71875, -6.4765625, -6.234375, -5.9921875, -5.75, -5.5078125, -5.265625, -5.0234375, -4.78125, -4.5390625, -4.296875, -4.0546875, -3.8125, -3.5703125, -3.328125, -3.0859375, -2.84375, -2.6015625, -2.359375, -2.1171875, -1.875, -1.6328125, -1.390625, -1.1484375, -0.90625, -0.6640625, -0.421875, -0.1796875, 0.0625, 0.3046875, 0.546875, 0.7890625, 1.03125, 1.2734375, 1.515625, 1.7578125, 2.0, 2.2421875, 2.484375, 2.7265625, 2.96875, 3.2109375, 3.453125, 3.6953125, 3.9375, 4.1796875, 4.421875, 4.6640625, 4.90625, 5.1484375, 5.390625, 5.6328125, 5.875, 6.1171875, 6.359375, 6.6015625, 6.84375, 7.0859375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 6.0, 9.0, 10.0, 9.0, 12.0, 15.0, 30.0, 26.0, 43.0, 39.0, 61.0, 108.0, 98.0, 82.0, 87.0, 95.0, 56.0, 49.0, 28.0, 34.0, 16.0, 13.0, 15.0, 12.0, 8.0, 10.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011739730834960938, -0.0011376142501831055, -0.0011012554168701172, -0.001064896583557129, -0.0010285377502441406, -0.0009921789169311523, -0.0009558200836181641, -0.0009194612503051758, -0.0008831024169921875, -0.0008467435836791992, -0.0008103847503662109, -0.0007740259170532227, -0.0007376670837402344, -0.0007013082504272461, -0.0006649494171142578, -0.0006285905838012695, -0.0005922317504882812, -0.000555872917175293, -0.0005195140838623047, -0.0004831552505493164, -0.0004467964172363281, -0.00041043758392333984, -0.00037407875061035156, -0.0003377199172973633, -0.000301361083984375, -0.0002650022506713867, -0.00022864341735839844, -0.00019228458404541016, -0.00015592575073242188, -0.0001195669174194336, -8.320808410644531e-05, -4.684925079345703e-05, -1.049041748046875e-05, 2.586841583251953e-05, 6.222724914550781e-05, 9.85860824584961e-05, 0.00013494491577148438, 0.00017130374908447266, 0.00020766258239746094, 0.00024402141571044922, 0.0002803802490234375, 0.0003167390823364258, 0.00035309791564941406, 0.00038945674896240234, 0.0004258155822753906, 0.0004621744155883789, 0.0004985332489013672, 0.0005348920822143555, 0.0005712509155273438, 0.000607609748840332, 0.0006439685821533203, 0.0006803274154663086, 0.0007166862487792969, 0.0007530450820922852, 0.0007894039154052734, 0.0008257627487182617, 0.00086212158203125, 0.0008984804153442383, 0.0009348392486572266, 0.0009711980819702148, 0.0010075569152832031, 0.0010439157485961914, 0.0010802745819091797, 0.001116633415222168, 0.0011529922485351562]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 8.0, 14.0, 12.0, 19.0, 34.0, 49.0, 44.0, 89.0, 131.0, 185.0, 284.0, 390.0, 599.0, 916.0, 1365.0, 2172.0, 3535.0, 5761.0, 9520.0, 16469.0, 28703.0, 52877.0, 96932.0, 168115.0, 223623.0, 185713.0, 110796.0, 60528.0, 32963.0, 18608.0, 10828.0, 6411.0, 3904.0, 2446.0, 1571.0, 974.0, 647.0, 422.0, 286.0, 195.0, 137.0, 105.0, 51.0, 48.0, 25.0, 18.0, 19.0, 10.0, 4.0, 5.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39453125, -6.1785888671875, -5.962646484375, -5.7467041015625, -5.53076171875, -5.3148193359375, -5.098876953125, -4.8829345703125, -4.6669921875, -4.4510498046875, -4.235107421875, -4.0191650390625, -3.80322265625, -3.5872802734375, -3.371337890625, -3.1553955078125, -2.939453125, -2.7235107421875, -2.507568359375, -2.2916259765625, -2.07568359375, -1.8597412109375, -1.643798828125, -1.4278564453125, -1.2119140625, -0.9959716796875, -0.780029296875, -0.5640869140625, -0.34814453125, -0.1322021484375, 0.083740234375, 0.2996826171875, 0.515625, 0.7315673828125, 0.947509765625, 1.1634521484375, 1.37939453125, 1.5953369140625, 1.811279296875, 2.0272216796875, 2.2431640625, 2.4591064453125, 2.675048828125, 2.8909912109375, 3.10693359375, 3.3228759765625, 3.538818359375, 3.7547607421875, 3.970703125, 4.1866455078125, 4.402587890625, 4.6185302734375, 4.83447265625, 5.0504150390625, 5.266357421875, 5.4822998046875, 5.6982421875, 5.9141845703125, 6.130126953125, 6.3460693359375, 6.56201171875, 6.7779541015625, 6.993896484375, 7.2098388671875, 7.42578125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 9.0, 3.0, 5.0, 8.0, 7.0, 12.0, 7.0, 15.0, 15.0, 26.0, 35.0, 35.0, 29.0, 55.0, 47.0, 57.0, 85.0, 68.0, 73.0, 73.0, 63.0, 49.0, 34.0, 36.0, 36.0, 26.0, 20.0, 10.0, 13.0, 12.0, 14.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6025390625, -1.5393218994140625, -1.476104736328125, -1.4128875732421875, -1.34967041015625, -1.2864532470703125, -1.223236083984375, -1.1600189208984375, -1.0968017578125, -1.0335845947265625, -0.970367431640625, -0.9071502685546875, -0.84393310546875, -0.7807159423828125, -0.717498779296875, -0.6542816162109375, -0.591064453125, -0.5278472900390625, -0.464630126953125, -0.4014129638671875, -0.33819580078125, -0.2749786376953125, -0.211761474609375, -0.1485443115234375, -0.0853271484375, -0.0221099853515625, 0.041107177734375, 0.1043243408203125, 0.16754150390625, 0.2307586669921875, 0.293975830078125, 0.3571929931640625, 0.42041015625, 0.4836273193359375, 0.546844482421875, 0.6100616455078125, 0.67327880859375, 0.7364959716796875, 0.799713134765625, 0.8629302978515625, 0.9261474609375, 0.9893646240234375, 1.052581787109375, 1.1157989501953125, 1.17901611328125, 1.2422332763671875, 1.305450439453125, 1.3686676025390625, 1.431884765625, 1.4951019287109375, 1.558319091796875, 1.6215362548828125, 1.68475341796875, 1.7479705810546875, 1.811187744140625, 1.8744049072265625, 1.9376220703125, 2.0008392333984375, 2.064056396484375, 2.1272735595703125, 2.19049072265625, 2.2537078857421875, 2.316925048828125, 2.3801422119140625, 2.443359375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 11.0, 12.0, 10.0, 13.0, 16.0, 32.0, 43.0, 50.0, 62.0, 76.0, 79.0, 76.0, 91.0, 76.0, 58.0, 60.0, 47.0, 45.0, 23.0, 30.0, 19.0, 13.0, 7.0, 9.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.13949203491211, -24.40159797668457, -23.66370391845703, -22.925809860229492, -22.187915802001953, -21.45001983642578, -20.712125778198242, -19.974231719970703, -19.236337661743164, -18.498443603515625, -17.760549545288086, -17.022655487060547, -16.284759521484375, -15.546866416931152, -14.808971405029297, -14.071077346801758, -13.333183288574219, -12.59528923034668, -11.85739517211914, -11.119500160217285, -10.381606101989746, -9.643712043762207, -8.905817031860352, -8.167922973632812, -7.430028915405273, -6.692134857177734, -5.954240322113037, -5.21634578704834, -4.478451728820801, -3.7405574321746826, -3.0026631355285645, -2.264768600463867, -1.526876449584961, -0.7889821529388428, -0.05108785629272461, 0.6868064403533936, 1.4247007369995117, 2.16259503364563, 2.900489330291748, 3.6383838653564453, 4.376277923583984, 5.114171981811523, 5.852066516876221, 6.589961051940918, 7.327855110168457, 8.065749168395996, 8.803644180297852, 9.54153823852539, 10.27943229675293, 11.017326354980469, 11.755220413208008, 12.493115425109863, 13.231009483337402, 13.968903541564941, 14.706798553466797, 15.444692611694336, 16.182586669921875, 16.920480728149414, 17.658374786376953, 18.396268844604492, 19.13416290283203, 19.872058868408203, 20.609952926635742, 21.34784698486328, 22.08574104309082]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 9.0, 5.0, 14.0, 9.0, 10.0, 15.0, 17.0, 14.0, 21.0, 23.0, 23.0, 26.0, 39.0, 20.0, 37.0, 38.0, 28.0, 38.0, 46.0, 36.0, 37.0, 36.0, 31.0, 24.0, 44.0, 33.0, 34.0, 38.0, 26.0, 26.0, 30.0, 28.0, 22.0, 23.0, 20.0, 16.0, 12.0, 14.0, 10.0, 5.0, 11.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.364797592163086, -8.079201698303223, -7.793605804443359, -7.508009910583496, -7.222414016723633, -6.9368181228637695, -6.651222229003906, -6.365626335144043, -6.08003044128418, -5.794434547424316, -5.508838653564453, -5.22324275970459, -4.937646865844727, -4.652050971984863, -4.366455078125, -4.080859184265137, -3.7952632904052734, -3.50966739654541, -3.224071502685547, -2.9384756088256836, -2.6528797149658203, -2.367283821105957, -2.0816879272460938, -1.7960920333862305, -1.5104961395263672, -1.224900245666504, -0.9393043518066406, -0.6537084579467773, -0.36811256408691406, -0.08251667022705078, 0.2030792236328125, 0.4886751174926758, 0.7742719650268555, 1.0598678588867188, 1.345463752746582, 1.6310596466064453, 1.9166555404663086, 2.202251434326172, 2.487847328186035, 2.7734432220458984, 3.0590391159057617, 3.344635009765625, 3.6302309036254883, 3.9158267974853516, 4.201422691345215, 4.487018585205078, 4.772614479064941, 5.058210372924805, 5.343806266784668, 5.629402160644531, 5.9149980545043945, 6.200593948364258, 6.486189842224121, 6.771785736083984, 7.057381629943848, 7.342977523803711, 7.628573417663574, 7.9141693115234375, 8.1997652053833, 8.485361099243164, 8.770956993103027, 9.05655288696289, 9.342148780822754, 9.627744674682617, 9.91334056854248]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 10.0, 12.0, 21.0, 28.0, 46.0, 59.0, 81.0, 140.0, 235.0, 319.0, 467.0, 846.0, 1245.0, 2060.0, 3485.0, 5831.0, 10521.0, 19676.0, 38580.0, 82272.0, 194879.0, 524960.0, 1326373.0, 1221086.0, 448406.0, 167891.0, 71534.0, 33666.0, 17124.0, 9360.0, 5170.0, 2984.0, 1772.0, 1121.0, 676.0, 434.0, 300.0, 165.0, 127.0, 93.0, 56.0, 46.0, 36.0, 25.0, 7.0, 21.0, 13.0, 9.0, 10.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-20.65625, -19.966064453125, -19.27587890625, -18.585693359375, -17.8955078125, -17.205322265625, -16.51513671875, -15.824951171875, -15.134765625, -14.444580078125, -13.75439453125, -13.064208984375, -12.3740234375, -11.683837890625, -10.99365234375, -10.303466796875, -9.61328125, -8.923095703125, -8.23291015625, -7.542724609375, -6.8525390625, -6.162353515625, -5.47216796875, -4.781982421875, -4.091796875, -3.401611328125, -2.71142578125, -2.021240234375, -1.3310546875, -0.640869140625, 0.04931640625, 0.739501953125, 1.4296875, 2.119873046875, 2.81005859375, 3.500244140625, 4.1904296875, 4.880615234375, 5.57080078125, 6.260986328125, 6.951171875, 7.641357421875, 8.33154296875, 9.021728515625, 9.7119140625, 10.402099609375, 11.09228515625, 11.782470703125, 12.47265625, 13.162841796875, 13.85302734375, 14.543212890625, 15.2333984375, 15.923583984375, 16.61376953125, 17.303955078125, 17.994140625, 18.684326171875, 19.37451171875, 20.064697265625, 20.7548828125, 21.445068359375, 22.13525390625, 22.825439453125, 23.515625]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 13.0, 4.0, 7.0, 13.0, 19.0, 15.0, 18.0, 25.0, 23.0, 25.0, 29.0, 37.0, 42.0, 36.0, 36.0, 35.0, 53.0, 44.0, 38.0, 37.0, 36.0, 40.0, 27.0, 31.0, 36.0, 38.0, 39.0, 25.0, 20.0, 26.0, 16.0, 17.0, 21.0, 14.0, 14.0, 10.0, 8.0, 3.0, 4.0, 6.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.6953125, -7.4495849609375, -7.203857421875, -6.9581298828125, -6.71240234375, -6.4666748046875, -6.220947265625, -5.9752197265625, -5.7294921875, -5.4837646484375, -5.238037109375, -4.9923095703125, -4.74658203125, -4.5008544921875, -4.255126953125, -4.0093994140625, -3.763671875, -3.5179443359375, -3.272216796875, -3.0264892578125, -2.78076171875, -2.5350341796875, -2.289306640625, -2.0435791015625, -1.7978515625, -1.5521240234375, -1.306396484375, -1.0606689453125, -0.81494140625, -0.5692138671875, -0.323486328125, -0.0777587890625, 0.16796875, 0.4136962890625, 0.659423828125, 0.9051513671875, 1.15087890625, 1.3966064453125, 1.642333984375, 1.8880615234375, 2.1337890625, 2.3795166015625, 2.625244140625, 2.8709716796875, 3.11669921875, 3.3624267578125, 3.608154296875, 3.8538818359375, 4.099609375, 4.3453369140625, 4.591064453125, 4.8367919921875, 5.08251953125, 5.3282470703125, 5.573974609375, 5.8197021484375, 6.0654296875, 6.3111572265625, 6.556884765625, 6.8026123046875, 7.04833984375, 7.2940673828125, 7.539794921875, 7.7855224609375, 8.03125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 10.0, 15.0, 22.0, 23.0, 63.0, 74.0, 109.0, 156.0, 218.0, 349.0, 537.0, 817.0, 1272.0, 1946.0, 3092.0, 5046.0, 8097.0, 13708.0, 24096.0, 43745.0, 84309.0, 172522.0, 372771.0, 821839.0, 1243017.0, 736677.0, 331985.0, 154697.0, 76242.0, 40362.0, 22616.0, 12940.0, 7781.0, 4844.0, 2927.0, 1906.0, 1231.0, 762.0, 527.0, 327.0, 215.0, 125.0, 87.0, 58.0, 45.0, 24.0, 15.0, 7.0, 8.0, 4.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -19.9990234375, -19.341796875, -18.6845703125, -18.02734375, -17.3701171875, -16.712890625, -16.0556640625, -15.3984375, -14.7412109375, -14.083984375, -13.4267578125, -12.76953125, -12.1123046875, -11.455078125, -10.7978515625, -10.140625, -9.4833984375, -8.826171875, -8.1689453125, -7.51171875, -6.8544921875, -6.197265625, -5.5400390625, -4.8828125, -4.2255859375, -3.568359375, -2.9111328125, -2.25390625, -1.5966796875, -0.939453125, -0.2822265625, 0.375, 1.0322265625, 1.689453125, 2.3466796875, 3.00390625, 3.6611328125, 4.318359375, 4.9755859375, 5.6328125, 6.2900390625, 6.947265625, 7.6044921875, 8.26171875, 8.9189453125, 9.576171875, 10.2333984375, 10.890625, 11.5478515625, 12.205078125, 12.8623046875, 13.51953125, 14.1767578125, 14.833984375, 15.4912109375, 16.1484375, 16.8056640625, 17.462890625, 18.1201171875, 18.77734375, 19.4345703125, 20.091796875, 20.7490234375, 21.40625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 7.0, 6.0, 3.0, 11.0, 15.0, 25.0, 37.0, 46.0, 53.0, 67.0, 103.0, 126.0, 159.0, 196.0, 247.0, 321.0, 337.0, 385.0, 347.0, 337.0, 257.0, 222.0, 151.0, 149.0, 100.0, 83.0, 62.0, 47.0, 43.0, 37.0, 23.0, 8.0, 13.0, 13.0, 5.0, 9.0, 6.0, 6.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.203125, -5.0020751953125, -4.801025390625, -4.5999755859375, -4.39892578125, -4.1978759765625, -3.996826171875, -3.7957763671875, -3.5947265625, -3.3936767578125, -3.192626953125, -2.9915771484375, -2.79052734375, -2.5894775390625, -2.388427734375, -2.1873779296875, -1.986328125, -1.7852783203125, -1.584228515625, -1.3831787109375, -1.18212890625, -0.9810791015625, -0.780029296875, -0.5789794921875, -0.3779296875, -0.1768798828125, 0.024169921875, 0.2252197265625, 0.42626953125, 0.6273193359375, 0.828369140625, 1.0294189453125, 1.23046875, 1.4315185546875, 1.632568359375, 1.8336181640625, 2.03466796875, 2.2357177734375, 2.436767578125, 2.6378173828125, 2.8388671875, 3.0399169921875, 3.240966796875, 3.4420166015625, 3.64306640625, 3.8441162109375, 4.045166015625, 4.2462158203125, 4.447265625, 4.6483154296875, 4.849365234375, 5.0504150390625, 5.25146484375, 5.4525146484375, 5.653564453125, 5.8546142578125, 6.0556640625, 6.2567138671875, 6.457763671875, 6.6588134765625, 6.85986328125, 7.0609130859375, 7.261962890625, 7.4630126953125, 7.6640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 13.0, 11.0, 14.0, 28.0, 36.0, 40.0, 52.0, 79.0, 95.0, 96.0, 81.0, 93.0, 74.0, 67.0, 43.0, 43.0, 28.0, 22.0, 11.0, 16.0, 9.0, 9.0, 2.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.252614974975586, -27.404245376586914, -26.555875778198242, -25.707504272460938, -24.859134674072266, -24.010765075683594, -23.162395477294922, -22.31402587890625, -21.465654373168945, -20.617284774780273, -19.7689151763916, -18.920543670654297, -18.072174072265625, -17.223804473876953, -16.37543487548828, -15.527064323425293, -14.678694725036621, -13.83032512664795, -12.981954574584961, -12.133584976196289, -11.2852144241333, -10.436844825744629, -9.58847427368164, -8.740104675292969, -7.891734600067139, -7.043364524841309, -6.1949944496154785, -5.346624374389648, -4.498254776000977, -3.6498847007751465, -2.8015146255493164, -1.9531445503234863, -1.1047744750976562, -0.25640445947647095, 0.5919655561447144, 1.4403355121612549, 2.288705587387085, 3.137075424194336, 3.985445499420166, 4.833815574645996, 5.682185649871826, 6.530555725097656, 7.378925800323486, 8.227295875549316, 9.075665473937988, 9.924036026000977, 10.772405624389648, 11.62077522277832, 12.469145774841309, 13.31751537322998, 14.165885925292969, 15.01425552368164, 15.862626075744629, 16.710994720458984, 17.55936622619629, 18.40773582458496, 19.256105422973633, 20.104475021362305, 20.952844619750977, 21.80121612548828, 22.649585723876953, 23.497955322265625, 24.346324920654297, 25.19469451904297, 26.043066024780273]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 9.0, 7.0, 5.0, 11.0, 10.0, 9.0, 20.0, 23.0, 13.0, 21.0, 21.0, 23.0, 38.0, 18.0, 39.0, 28.0, 33.0, 40.0, 46.0, 36.0, 25.0, 33.0, 35.0, 38.0, 36.0, 43.0, 25.0, 34.0, 30.0, 23.0, 23.0, 29.0, 25.0, 31.0, 14.0, 25.0, 12.0, 15.0, 5.0, 15.0, 8.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-8.791970252990723, -8.51536750793457, -8.238763809204102, -7.962160587310791, -7.6855573654174805, -7.408954620361328, -7.132351398468018, -6.855748176574707, -6.5791449546813965, -6.302541732788086, -6.025938510894775, -5.749335289001465, -5.4727325439453125, -5.196128845214844, -4.919526100158691, -4.642922878265381, -4.36631965637207, -4.08971643447876, -3.813113212585449, -3.5365102291107178, -3.2599070072174072, -2.9833037853240967, -2.7067008018493652, -2.4300975799560547, -2.153494358062744, -1.8768911361694336, -1.6002880334854126, -1.3236849308013916, -1.047081708908081, -0.7704784870147705, -0.4938753843307495, -0.21727228164672852, 0.059329986572265625, 0.3359331488609314, 0.6125363111495972, 0.8891394734382629, 1.1657426357269287, 1.4423458576202393, 1.7189489603042603, 1.9955520629882812, 2.272155284881592, 2.5487585067749023, 2.825361728668213, 3.1019647121429443, 3.378567934036255, 3.6551711559295654, 3.931774139404297, 4.208377361297607, 4.484980583190918, 4.7615838050842285, 5.038187026977539, 5.31479024887085, 5.59139347076416, 5.8679962158203125, 6.144599437713623, 6.421202659606934, 6.697805881500244, 6.974409103393555, 7.251012325286865, 7.527615547180176, 7.804218292236328, 8.080821990966797, 8.35742473602295, 8.634027481079102, 8.91063117980957]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 13.0, 32.0, 44.0, 63.0, 83.0, 117.0, 238.0, 375.0, 668.0, 1017.0, 1761.0, 3090.0, 5106.0, 8611.0, 14774.0, 24693.0, 41915.0, 68403.0, 106949.0, 153944.0, 179201.0, 155385.0, 108779.0, 69215.0, 42275.0, 25237.0, 14744.0, 8855.0, 5311.0, 3102.0, 1787.0, 1074.0, 631.0, 445.0, 222.0, 130.0, 84.0, 57.0, 33.0, 28.0, 16.0, 9.0, 15.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.98046875, -6.75897216796875, -6.5374755859375, -6.31597900390625, -6.094482421875, -5.87298583984375, -5.6514892578125, -5.42999267578125, -5.20849609375, -4.98699951171875, -4.7655029296875, -4.54400634765625, -4.322509765625, -4.10101318359375, -3.8795166015625, -3.65802001953125, -3.4365234375, -3.21502685546875, -2.9935302734375, -2.77203369140625, -2.550537109375, -2.32904052734375, -2.1075439453125, -1.88604736328125, -1.66455078125, -1.44305419921875, -1.2215576171875, -1.00006103515625, -0.778564453125, -0.55706787109375, -0.3355712890625, -0.11407470703125, 0.107421875, 0.32891845703125, 0.5504150390625, 0.77191162109375, 0.993408203125, 1.21490478515625, 1.4364013671875, 1.65789794921875, 1.87939453125, 2.10089111328125, 2.3223876953125, 2.54388427734375, 2.765380859375, 2.98687744140625, 3.2083740234375, 3.42987060546875, 3.6513671875, 3.87286376953125, 4.0943603515625, 4.31585693359375, 4.537353515625, 4.75885009765625, 4.9803466796875, 5.20184326171875, 5.42333984375, 5.64483642578125, 5.8663330078125, 6.08782958984375, 6.309326171875, 6.53082275390625, 6.7523193359375, 6.97381591796875, 7.1953125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 15.0, 16.0, 8.0, 12.0, 20.0, 24.0, 23.0, 20.0, 23.0, 38.0, 44.0, 38.0, 39.0, 34.0, 39.0, 39.0, 45.0, 50.0, 45.0, 47.0, 35.0, 34.0, 33.0, 33.0, 40.0, 28.0, 21.0, 21.0, 21.0, 22.0, 16.0, 16.0, 12.0, 10.0, 12.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.6796875, -11.3138427734375, -10.947998046875, -10.5821533203125, -10.21630859375, -9.8504638671875, -9.484619140625, -9.1187744140625, -8.7529296875, -8.3870849609375, -8.021240234375, -7.6553955078125, -7.28955078125, -6.9237060546875, -6.557861328125, -6.1920166015625, -5.826171875, -5.4603271484375, -5.094482421875, -4.7286376953125, -4.36279296875, -3.9969482421875, -3.631103515625, -3.2652587890625, -2.8994140625, -2.5335693359375, -2.167724609375, -1.8018798828125, -1.43603515625, -1.0701904296875, -0.704345703125, -0.3385009765625, 0.02734375, 0.3931884765625, 0.759033203125, 1.1248779296875, 1.49072265625, 1.8565673828125, 2.222412109375, 2.5882568359375, 2.9541015625, 3.3199462890625, 3.685791015625, 4.0516357421875, 4.41748046875, 4.7833251953125, 5.149169921875, 5.5150146484375, 5.880859375, 6.2467041015625, 6.612548828125, 6.9783935546875, 7.34423828125, 7.7100830078125, 8.075927734375, 8.4417724609375, 8.8076171875, 9.1734619140625, 9.539306640625, 9.9051513671875, 10.27099609375, 10.6368408203125, 11.002685546875, 11.3685302734375, 11.734375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 17.0, 15.0, 29.0, 26.0, 45.0, 61.0, 115.0, 154.0, 200.0, 301.0, 446.0, 665.0, 993.0, 1484.0, 2397.0, 3864.0, 6316.0, 10354.0, 17940.0, 31295.0, 57085.0, 103949.0, 178029.0, 229826.0, 172972.0, 100428.0, 55448.0, 30256.0, 17329.0, 9937.0, 6095.0, 3660.0, 2371.0, 1445.0, 937.0, 648.0, 455.0, 277.0, 217.0, 138.0, 102.0, 74.0, 51.0, 42.0, 14.0, 16.0, 10.0, 6.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.8828125, -9.5875244140625, -9.292236328125, -8.9969482421875, -8.70166015625, -8.4063720703125, -8.111083984375, -7.8157958984375, -7.5205078125, -7.2252197265625, -6.929931640625, -6.6346435546875, -6.33935546875, -6.0440673828125, -5.748779296875, -5.4534912109375, -5.158203125, -4.8629150390625, -4.567626953125, -4.2723388671875, -3.97705078125, -3.6817626953125, -3.386474609375, -3.0911865234375, -2.7958984375, -2.5006103515625, -2.205322265625, -1.9100341796875, -1.61474609375, -1.3194580078125, -1.024169921875, -0.7288818359375, -0.43359375, -0.1383056640625, 0.156982421875, 0.4522705078125, 0.74755859375, 1.0428466796875, 1.338134765625, 1.6334228515625, 1.9287109375, 2.2239990234375, 2.519287109375, 2.8145751953125, 3.10986328125, 3.4051513671875, 3.700439453125, 3.9957275390625, 4.291015625, 4.5863037109375, 4.881591796875, 5.1768798828125, 5.47216796875, 5.7674560546875, 6.062744140625, 6.3580322265625, 6.6533203125, 6.9486083984375, 7.243896484375, 7.5391845703125, 7.83447265625, 8.1297607421875, 8.425048828125, 8.7203369140625, 9.015625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 8.0, 6.0, 6.0, 11.0, 12.0, 16.0, 10.0, 9.0, 23.0, 19.0, 36.0, 31.0, 27.0, 35.0, 44.0, 40.0, 36.0, 39.0, 38.0, 35.0, 47.0, 39.0, 37.0, 37.0, 29.0, 32.0, 44.0, 27.0, 28.0, 34.0, 29.0, 22.0, 13.0, 14.0, 15.0, 16.0, 5.0, 10.0, 6.0, 6.0, 7.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.7191162109375, -5.516357421875, -5.3135986328125, -5.11083984375, -4.9080810546875, -4.705322265625, -4.5025634765625, -4.2998046875, -4.0970458984375, -3.894287109375, -3.6915283203125, -3.48876953125, -3.2860107421875, -3.083251953125, -2.8804931640625, -2.677734375, -2.4749755859375, -2.272216796875, -2.0694580078125, -1.86669921875, -1.6639404296875, -1.461181640625, -1.2584228515625, -1.0556640625, -0.8529052734375, -0.650146484375, -0.4473876953125, -0.24462890625, -0.0418701171875, 0.160888671875, 0.3636474609375, 0.56640625, 0.7691650390625, 0.971923828125, 1.1746826171875, 1.37744140625, 1.5802001953125, 1.782958984375, 1.9857177734375, 2.1884765625, 2.3912353515625, 2.593994140625, 2.7967529296875, 2.99951171875, 3.2022705078125, 3.405029296875, 3.6077880859375, 3.810546875, 4.0133056640625, 4.216064453125, 4.4188232421875, 4.62158203125, 4.8243408203125, 5.027099609375, 5.2298583984375, 5.4326171875, 5.6353759765625, 5.838134765625, 6.0408935546875, 6.24365234375, 6.4464111328125, 6.649169921875, 6.8519287109375, 7.0546875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 3.0, 6.0, 2.0, 5.0, 4.0, 6.0, 3.0, 27.0, 28.0, 37.0, 62.0, 59.0, 89.0, 169.0, 266.0, 405.0, 662.0, 1122.0, 2003.0, 3427.0, 6216.0, 11959.0, 23636.0, 49967.0, 107142.0, 223667.0, 292169.0, 171176.0, 78856.0, 36782.0, 17859.0, 8974.0, 4806.0, 2733.0, 1644.0, 947.0, 599.0, 382.0, 220.0, 136.0, 89.0, 72.0, 48.0, 26.0, 22.0, 13.0, 11.0, 13.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.30078125, -4.16339111328125, -4.0260009765625, -3.88861083984375, -3.751220703125, -3.61383056640625, -3.4764404296875, -3.33905029296875, -3.20166015625, -3.06427001953125, -2.9268798828125, -2.78948974609375, -2.652099609375, -2.51470947265625, -2.3773193359375, -2.23992919921875, -2.1025390625, -1.96514892578125, -1.8277587890625, -1.69036865234375, -1.552978515625, -1.41558837890625, -1.2781982421875, -1.14080810546875, -1.00341796875, -0.86602783203125, -0.7286376953125, -0.59124755859375, -0.453857421875, -0.31646728515625, -0.1790771484375, -0.04168701171875, 0.095703125, 0.23309326171875, 0.3704833984375, 0.50787353515625, 0.645263671875, 0.78265380859375, 0.9200439453125, 1.05743408203125, 1.19482421875, 1.33221435546875, 1.4696044921875, 1.60699462890625, 1.744384765625, 1.88177490234375, 2.0191650390625, 2.15655517578125, 2.2939453125, 2.43133544921875, 2.5687255859375, 2.70611572265625, 2.843505859375, 2.98089599609375, 3.1182861328125, 3.25567626953125, 3.39306640625, 3.53045654296875, 3.6678466796875, 3.80523681640625, 3.942626953125, 4.08001708984375, 4.2174072265625, 4.35479736328125, 4.4921875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 9.0, 10.0, 13.0, 21.0, 21.0, 31.0, 48.0, 45.0, 58.0, 68.0, 86.0, 80.0, 93.0, 74.0, 68.0, 54.0, 50.0, 39.0, 39.0, 23.0, 10.0, 17.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002608299255371094, -0.00025025755167007446, -0.00023968517780303955, -0.00022911280393600464, -0.00021854043006896973, -0.00020796805620193481, -0.0001973956823348999, -0.000186823308467865, -0.00017625093460083008, -0.00016567856073379517, -0.00015510618686676025, -0.00014453381299972534, -0.00013396143913269043, -0.00012338906526565552, -0.0001128166913986206, -0.0001022443175315857, -9.167194366455078e-05, -8.109956979751587e-05, -7.052719593048096e-05, -5.9954822063446045e-05, -4.938244819641113e-05, -3.881007432937622e-05, -2.823770046234131e-05, -1.7665326595306396e-05, -7.092952728271484e-06, 3.4794211387634277e-06, 1.405179500579834e-05, 2.4624168872833252e-05, 3.5196542739868164e-05, 4.5768916606903076e-05, 5.634129047393799e-05, 6.69136643409729e-05, 7.748603820800781e-05, 8.805841207504272e-05, 9.863078594207764e-05, 0.00010920315980911255, 0.00011977553367614746, 0.00013034790754318237, 0.00014092028141021729, 0.0001514926552772522, 0.0001620650291442871, 0.00017263740301132202, 0.00018320977687835693, 0.00019378215074539185, 0.00020435452461242676, 0.00021492689847946167, 0.00022549927234649658, 0.0002360716462135315, 0.0002466440200805664, 0.0002572163939476013, 0.00026778876781463623, 0.00027836114168167114, 0.00028893351554870605, 0.00029950588941574097, 0.0003100782632827759, 0.0003206506371498108, 0.0003312230110168457, 0.0003417953848838806, 0.00035236775875091553, 0.00036294013261795044, 0.00037351250648498535, 0.00038408488035202026, 0.0003946572542190552, 0.0004052296280860901, 0.000415802001953125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 11.0, 9.0, 9.0, 19.0, 34.0, 45.0, 67.0, 93.0, 150.0, 218.0, 296.0, 469.0, 738.0, 1142.0, 1804.0, 2941.0, 4760.0, 7826.0, 13271.0, 23021.0, 39977.0, 68289.0, 111571.0, 162614.0, 187564.0, 157966.0, 106632.0, 64817.0, 38351.0, 21838.0, 12479.0, 7270.0, 4467.0, 2783.0, 1786.0, 1122.0, 695.0, 496.0, 296.0, 200.0, 144.0, 83.0, 60.0, 46.0, 29.0, 13.0, 14.0, 13.0, 6.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.373046875, -3.26910400390625, -3.1651611328125, -3.06121826171875, -2.957275390625, -2.85333251953125, -2.7493896484375, -2.64544677734375, -2.54150390625, -2.43756103515625, -2.3336181640625, -2.22967529296875, -2.125732421875, -2.02178955078125, -1.9178466796875, -1.81390380859375, -1.7099609375, -1.60601806640625, -1.5020751953125, -1.39813232421875, -1.294189453125, -1.19024658203125, -1.0863037109375, -0.98236083984375, -0.87841796875, -0.77447509765625, -0.6705322265625, -0.56658935546875, -0.462646484375, -0.35870361328125, -0.2547607421875, -0.15081787109375, -0.046875, 0.05706787109375, 0.1610107421875, 0.26495361328125, 0.368896484375, 0.47283935546875, 0.5767822265625, 0.68072509765625, 0.78466796875, 0.88861083984375, 0.9925537109375, 1.09649658203125, 1.200439453125, 1.30438232421875, 1.4083251953125, 1.51226806640625, 1.6162109375, 1.72015380859375, 1.8240966796875, 1.92803955078125, 2.031982421875, 2.13592529296875, 2.2398681640625, 2.34381103515625, 2.44775390625, 2.55169677734375, 2.6556396484375, 2.75958251953125, 2.863525390625, 2.96746826171875, 3.0714111328125, 3.17535400390625, 3.279296875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 9.0, 10.0, 13.0, 21.0, 22.0, 29.0, 22.0, 38.0, 40.0, 34.0, 53.0, 61.0, 45.0, 38.0, 54.0, 54.0, 49.0, 43.0, 33.0, 43.0, 37.0, 43.0, 28.0, 34.0, 25.0, 18.0, 22.0, 13.0, 10.0, 6.0, 7.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.985137939453125, -0.95758056640625, -0.930023193359375, -0.9024658203125, -0.874908447265625, -0.84735107421875, -0.819793701171875, -0.792236328125, -0.764678955078125, -0.73712158203125, -0.709564208984375, -0.6820068359375, -0.654449462890625, -0.62689208984375, -0.599334716796875, -0.57177734375, -0.544219970703125, -0.51666259765625, -0.489105224609375, -0.4615478515625, -0.433990478515625, -0.40643310546875, -0.378875732421875, -0.351318359375, -0.323760986328125, -0.29620361328125, -0.268646240234375, -0.2410888671875, -0.213531494140625, -0.18597412109375, -0.158416748046875, -0.130859375, -0.103302001953125, -0.07574462890625, -0.048187255859375, -0.0206298828125, 0.006927490234375, 0.03448486328125, 0.062042236328125, 0.089599609375, 0.117156982421875, 0.14471435546875, 0.172271728515625, 0.1998291015625, 0.227386474609375, 0.25494384765625, 0.282501220703125, 0.31005859375, 0.337615966796875, 0.36517333984375, 0.392730712890625, 0.4202880859375, 0.447845458984375, 0.47540283203125, 0.502960205078125, 0.530517578125, 0.558074951171875, 0.58563232421875, 0.613189697265625, 0.6407470703125, 0.668304443359375, 0.69586181640625, 0.723419189453125, 0.7509765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 5.0, 8.0, 7.0, 10.0, 15.0, 26.0, 25.0, 39.0, 47.0, 55.0, 92.0, 89.0, 85.0, 90.0, 85.0, 67.0, 59.0, 46.0, 27.0, 39.0, 18.0, 12.0, 12.0, 9.0, 7.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.385204315185547, -25.559053421020508, -24.73290252685547, -23.90675163269043, -23.08060073852539, -22.25444984436035, -21.428298950195312, -20.602148056030273, -19.775997161865234, -18.949846267700195, -18.123695373535156, -17.297544479370117, -16.471393585205078, -15.645242691040039, -14.819091796875, -13.992940902709961, -13.166790008544922, -12.340639114379883, -11.514488220214844, -10.688337326049805, -9.862186431884766, -9.036035537719727, -8.209884643554688, -7.383733749389648, -6.557582855224609, -5.73143196105957, -4.905281066894531, -4.079130172729492, -3.252979278564453, -2.426828384399414, -1.600677490234375, -0.7745265960693359, 0.051624298095703125, 0.8777751922607422, 1.7039260864257812, 2.5300769805908203, 3.3562278747558594, 4.182378768920898, 5.0085296630859375, 5.834680557250977, 6.660831451416016, 7.486982345581055, 8.313133239746094, 9.139284133911133, 9.965435028076172, 10.791585922241211, 11.61773681640625, 12.443887710571289, 13.270038604736328, 14.096189498901367, 14.922340393066406, 15.748491287231445, 16.574642181396484, 17.400793075561523, 18.226943969726562, 19.0530948638916, 19.87924575805664, 20.70539665222168, 21.53154754638672, 22.357698440551758, 23.183849334716797, 24.010000228881836, 24.836151123046875, 25.662302017211914, 26.488452911376953]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 8.0, 7.0, 3.0, 9.0, 14.0, 12.0, 16.0, 18.0, 18.0, 21.0, 22.0, 24.0, 30.0, 31.0, 34.0, 25.0, 31.0, 46.0, 42.0, 36.0, 26.0, 38.0, 35.0, 36.0, 45.0, 32.0, 27.0, 26.0, 39.0, 22.0, 27.0, 26.0, 28.0, 25.0, 28.0, 9.0, 20.0, 4.0, 15.0, 12.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-8.70146369934082, -8.426247596740723, -8.151031494140625, -7.8758158683776855, -7.600600242614746, -7.325384140014648, -7.050168037414551, -6.774951934814453, -6.499736309051514, -6.224520206451416, -5.949304580688477, -5.674088478088379, -5.398872375488281, -5.123656749725342, -4.848440647125244, -4.573225021362305, -4.298008918762207, -4.022792816162109, -3.74757719039917, -3.4723610877990723, -3.1971452236175537, -2.921929359436035, -2.6467132568359375, -2.371497392654419, -2.0962815284729004, -1.8210656642913818, -1.5458496809005737, -1.2706336975097656, -0.9954178333282471, -0.7202019691467285, -0.4449859857559204, -0.1697700023651123, 0.10544586181640625, 0.3806617856025696, 0.6558777093887329, 0.9310936331748962, 1.2063095569610596, 1.4815254211425781, 1.7567414045333862, 2.0319573879241943, 2.307173252105713, 2.5823891162872314, 2.85760498046875, 3.1328210830688477, 3.408036947250366, 3.6832528114318848, 3.9584689140319824, 4.233684539794922, 4.5089006423950195, 4.784116744995117, 5.059332370758057, 5.334548473358154, 5.609764099121094, 5.884980201721191, 6.160196304321289, 6.435412406921387, 6.710628032684326, 6.985844135284424, 7.261059761047363, 7.536275863647461, 7.811491966247559, 8.086708068847656, 8.361923217773438, 8.637139320373535, 8.912355422973633]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 9.0, 16.0, 18.0, 29.0, 36.0, 51.0, 88.0, 135.0, 167.0, 253.0, 354.0, 560.0, 862.0, 1266.0, 2102.0, 3155.0, 5121.0, 8057.0, 13579.0, 22610.0, 37230.0, 59979.0, 92642.0, 132912.0, 161046.0, 157300.0, 124376.0, 84649.0, 54029.0, 33386.0, 19985.0, 12263.0, 7556.0, 4495.0, 2895.0, 1808.0, 1164.0, 782.0, 494.0, 303.0, 243.0, 197.0, 116.0, 63.0, 47.0, 29.0, 26.0, 24.0, 14.0, 14.0, 10.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-16.03125, -15.528564453125, -15.02587890625, -14.523193359375, -14.0205078125, -13.517822265625, -13.01513671875, -12.512451171875, -12.009765625, -11.507080078125, -11.00439453125, -10.501708984375, -9.9990234375, -9.496337890625, -8.99365234375, -8.490966796875, -7.98828125, -7.485595703125, -6.98291015625, -6.480224609375, -5.9775390625, -5.474853515625, -4.97216796875, -4.469482421875, -3.966796875, -3.464111328125, -2.96142578125, -2.458740234375, -1.9560546875, -1.453369140625, -0.95068359375, -0.447998046875, 0.0546875, 0.557373046875, 1.06005859375, 1.562744140625, 2.0654296875, 2.568115234375, 3.07080078125, 3.573486328125, 4.076171875, 4.578857421875, 5.08154296875, 5.584228515625, 6.0869140625, 6.589599609375, 7.09228515625, 7.594970703125, 8.09765625, 8.600341796875, 9.10302734375, 9.605712890625, 10.1083984375, 10.611083984375, 11.11376953125, 11.616455078125, 12.119140625, 12.621826171875, 13.12451171875, 13.627197265625, 14.1298828125, 14.632568359375, 15.13525390625, 15.637939453125, 16.140625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 9.0, 2.0, 3.0, 7.0, 7.0, 8.0, 15.0, 14.0, 26.0, 40.0, 21.0, 23.0, 22.0, 43.0, 39.0, 46.0, 44.0, 35.0, 41.0, 40.0, 45.0, 33.0, 49.0, 39.0, 34.0, 36.0, 44.0, 31.0, 20.0, 27.0, 33.0, 19.0, 23.0, 17.0, 21.0, 5.0, 11.0, 7.0, 6.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.25, -10.8936767578125, -10.537353515625, -10.1810302734375, -9.82470703125, -9.4683837890625, -9.112060546875, -8.7557373046875, -8.3994140625, -8.0430908203125, -7.686767578125, -7.3304443359375, -6.97412109375, -6.6177978515625, -6.261474609375, -5.9051513671875, -5.548828125, -5.1925048828125, -4.836181640625, -4.4798583984375, -4.12353515625, -3.7672119140625, -3.410888671875, -3.0545654296875, -2.6982421875, -2.3419189453125, -1.985595703125, -1.6292724609375, -1.27294921875, -0.9166259765625, -0.560302734375, -0.2039794921875, 0.15234375, 0.5086669921875, 0.864990234375, 1.2213134765625, 1.57763671875, 1.9339599609375, 2.290283203125, 2.6466064453125, 3.0029296875, 3.3592529296875, 3.715576171875, 4.0718994140625, 4.42822265625, 4.7845458984375, 5.140869140625, 5.4971923828125, 5.853515625, 6.2098388671875, 6.566162109375, 6.9224853515625, 7.27880859375, 7.6351318359375, 7.991455078125, 8.3477783203125, 8.7041015625, 9.0604248046875, 9.416748046875, 9.7730712890625, 10.12939453125, 10.4857177734375, 10.842041015625, 11.1983642578125, 11.5546875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 9.0, 19.0, 19.0, 43.0, 65.0, 91.0, 162.0, 258.0, 376.0, 590.0, 950.0, 1481.0, 2292.0, 3628.0, 5818.0, 9440.0, 15508.0, 24817.0, 39823.0, 62589.0, 93942.0, 129140.0, 153775.0, 148700.0, 120342.0, 84889.0, 56430.0, 35428.0, 22085.0, 13467.0, 8423.0, 5079.0, 3224.0, 2068.0, 1243.0, 843.0, 536.0, 346.0, 217.0, 156.0, 86.0, 61.0, 40.0, 24.0, 14.0, 10.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6640625, -13.1907958984375, -12.717529296875, -12.2442626953125, -11.77099609375, -11.2977294921875, -10.824462890625, -10.3511962890625, -9.8779296875, -9.4046630859375, -8.931396484375, -8.4581298828125, -7.98486328125, -7.5115966796875, -7.038330078125, -6.5650634765625, -6.091796875, -5.6185302734375, -5.145263671875, -4.6719970703125, -4.19873046875, -3.7254638671875, -3.252197265625, -2.7789306640625, -2.3056640625, -1.8323974609375, -1.359130859375, -0.8858642578125, -0.41259765625, 0.0606689453125, 0.533935546875, 1.0072021484375, 1.48046875, 1.9537353515625, 2.427001953125, 2.9002685546875, 3.37353515625, 3.8468017578125, 4.320068359375, 4.7933349609375, 5.2666015625, 5.7398681640625, 6.213134765625, 6.6864013671875, 7.15966796875, 7.6329345703125, 8.106201171875, 8.5794677734375, 9.052734375, 9.5260009765625, 9.999267578125, 10.4725341796875, 10.94580078125, 11.4190673828125, 11.892333984375, 12.3656005859375, 12.8388671875, 13.3121337890625, 13.785400390625, 14.2586669921875, 14.73193359375, 15.2052001953125, 15.678466796875, 16.1517333984375, 16.625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 13.0, 14.0, 11.0, 14.0, 15.0, 21.0, 24.0, 31.0, 26.0, 35.0, 29.0, 37.0, 43.0, 39.0, 49.0, 39.0, 52.0, 37.0, 37.0, 34.0, 53.0, 44.0, 44.0, 29.0, 37.0, 26.0, 18.0, 25.0, 11.0, 19.0, 11.0, 15.0, 7.0, 5.0, 8.0, 4.0, 9.0, 3.0, 7.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-7.00390625, -6.78948974609375, -6.5750732421875, -6.36065673828125, -6.146240234375, -5.93182373046875, -5.7174072265625, -5.50299072265625, -5.28857421875, -5.07415771484375, -4.8597412109375, -4.64532470703125, -4.430908203125, -4.21649169921875, -4.0020751953125, -3.78765869140625, -3.5732421875, -3.35882568359375, -3.1444091796875, -2.92999267578125, -2.715576171875, -2.50115966796875, -2.2867431640625, -2.07232666015625, -1.85791015625, -1.64349365234375, -1.4290771484375, -1.21466064453125, -1.000244140625, -0.78582763671875, -0.5714111328125, -0.35699462890625, -0.142578125, 0.07183837890625, 0.2862548828125, 0.50067138671875, 0.715087890625, 0.92950439453125, 1.1439208984375, 1.35833740234375, 1.57275390625, 1.78717041015625, 2.0015869140625, 2.21600341796875, 2.430419921875, 2.64483642578125, 2.8592529296875, 3.07366943359375, 3.2880859375, 3.50250244140625, 3.7169189453125, 3.93133544921875, 4.145751953125, 4.36016845703125, 4.5745849609375, 4.78900146484375, 5.00341796875, 5.21783447265625, 5.4322509765625, 5.64666748046875, 5.861083984375, 6.07550048828125, 6.2899169921875, 6.50433349609375, 6.71875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 3.0, 8.0, 7.0, 12.0, 17.0, 24.0, 31.0, 34.0, 56.0, 74.0, 92.0, 132.0, 199.0, 287.0, 382.0, 618.0, 876.0, 1355.0, 2068.0, 3110.0, 5130.0, 8509.0, 15021.0, 28799.0, 58497.0, 124026.0, 234504.0, 260313.0, 152877.0, 72181.0, 35021.0, 17925.0, 10075.0, 5653.0, 3709.0, 2291.0, 1507.0, 945.0, 657.0, 486.0, 282.0, 219.0, 152.0, 122.0, 62.0, 65.0, 38.0, 28.0, 23.0, 20.0, 13.0, 11.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-9.78125, -9.4671630859375, -9.153076171875, -8.8389892578125, -8.52490234375, -8.2108154296875, -7.896728515625, -7.5826416015625, -7.2685546875, -6.9544677734375, -6.640380859375, -6.3262939453125, -6.01220703125, -5.6981201171875, -5.384033203125, -5.0699462890625, -4.755859375, -4.4417724609375, -4.127685546875, -3.8135986328125, -3.49951171875, -3.1854248046875, -2.871337890625, -2.5572509765625, -2.2431640625, -1.9290771484375, -1.614990234375, -1.3009033203125, -0.98681640625, -0.6727294921875, -0.358642578125, -0.0445556640625, 0.26953125, 0.5836181640625, 0.897705078125, 1.2117919921875, 1.52587890625, 1.8399658203125, 2.154052734375, 2.4681396484375, 2.7822265625, 3.0963134765625, 3.410400390625, 3.7244873046875, 4.03857421875, 4.3526611328125, 4.666748046875, 4.9808349609375, 5.294921875, 5.6090087890625, 5.923095703125, 6.2371826171875, 6.55126953125, 6.8653564453125, 7.179443359375, 7.4935302734375, 7.8076171875, 8.1217041015625, 8.435791015625, 8.7498779296875, 9.06396484375, 9.3780517578125, 9.692138671875, 10.0062255859375, 10.3203125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 3.0, 11.0, 12.0, 18.0, 19.0, 31.0, 31.0, 36.0, 53.0, 62.0, 106.0, 88.0, 101.0, 86.0, 61.0, 63.0, 35.0, 42.0, 22.0, 18.0, 16.0, 7.0, 16.0, 16.0, 4.0, 6.0, 3.0, 6.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.001407623291015625, -0.001367717981338501, -0.001327812671661377, -0.001287907361984253, -0.001248002052307129, -0.0012080967426300049, -0.0011681914329528809, -0.0011282861232757568, -0.0010883808135986328, -0.0010484755039215088, -0.0010085701942443848, -0.0009686648845672607, -0.0009287595748901367, -0.0008888542652130127, -0.0008489489555358887, -0.0008090436458587646, -0.0007691383361816406, -0.0007292330265045166, -0.0006893277168273926, -0.0006494224071502686, -0.0006095170974731445, -0.0005696117877960205, -0.0005297064781188965, -0.0004898011684417725, -0.00044989585876464844, -0.0004099905490875244, -0.0003700852394104004, -0.00033017992973327637, -0.00029027462005615234, -0.0002503693103790283, -0.0002104640007019043, -0.00017055869102478027, -0.00013065338134765625, -9.074807167053223e-05, -5.08427619934082e-05, -1.093745231628418e-05, 2.8967857360839844e-05, 6.887316703796387e-05, 0.00010877847671508789, 0.00014868378639221191, 0.00018858909606933594, 0.00022849440574645996, 0.000268399715423584, 0.000308305025100708, 0.00034821033477783203, 0.00038811564445495605, 0.0004280209541320801, 0.0004679262638092041, 0.0005078315734863281, 0.0005477368831634521, 0.0005876421928405762, 0.0006275475025177002, 0.0006674528121948242, 0.0007073581218719482, 0.0007472634315490723, 0.0007871687412261963, 0.0008270740509033203, 0.0008669793605804443, 0.0009068846702575684, 0.0009467899799346924, 0.0009866952896118164, 0.0010266005992889404, 0.0010665059089660645, 0.0011064112186431885, 0.0011463165283203125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [7.0, 3.0, 4.0, 6.0, 13.0, 16.0, 17.0, 26.0, 32.0, 65.0, 63.0, 106.0, 133.0, 169.0, 236.0, 285.0, 400.0, 537.0, 762.0, 1105.0, 1519.0, 2216.0, 3246.0, 5296.0, 8239.0, 13630.0, 23263.0, 41848.0, 77628.0, 142420.0, 217717.0, 209067.0, 132262.0, 71007.0, 38428.0, 21280.0, 12490.0, 7674.0, 4861.0, 3190.0, 2161.0, 1425.0, 1000.0, 725.0, 556.0, 389.0, 261.0, 187.0, 147.0, 117.0, 87.0, 55.0, 63.0, 39.0, 29.0, 27.0, 14.0, 13.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0], "bins": [-7.7734375, -7.5220947265625, -7.270751953125, -7.0194091796875, -6.76806640625, -6.5167236328125, -6.265380859375, -6.0140380859375, -5.7626953125, -5.5113525390625, -5.260009765625, -5.0086669921875, -4.75732421875, -4.5059814453125, -4.254638671875, -4.0032958984375, -3.751953125, -3.5006103515625, -3.249267578125, -2.9979248046875, -2.74658203125, -2.4952392578125, -2.243896484375, -1.9925537109375, -1.7412109375, -1.4898681640625, -1.238525390625, -0.9871826171875, -0.73583984375, -0.4844970703125, -0.233154296875, 0.0181884765625, 0.26953125, 0.5208740234375, 0.772216796875, 1.0235595703125, 1.27490234375, 1.5262451171875, 1.777587890625, 2.0289306640625, 2.2802734375, 2.5316162109375, 2.782958984375, 3.0343017578125, 3.28564453125, 3.5369873046875, 3.788330078125, 4.0396728515625, 4.291015625, 4.5423583984375, 4.793701171875, 5.0450439453125, 5.29638671875, 5.5477294921875, 5.799072265625, 6.0504150390625, 6.3017578125, 6.5531005859375, 6.804443359375, 7.0557861328125, 7.30712890625, 7.5584716796875, 7.809814453125, 8.0611572265625, 8.3125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 12.0, 14.0, 17.0, 16.0, 25.0, 29.0, 42.0, 42.0, 55.0, 60.0, 72.0, 78.0, 73.0, 74.0, 75.0, 64.0, 46.0, 40.0, 25.0, 22.0, 19.0, 24.0, 7.0, 13.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.91015625, -2.823394775390625, -2.73663330078125, -2.649871826171875, -2.5631103515625, -2.476348876953125, -2.38958740234375, -2.302825927734375, -2.216064453125, -2.129302978515625, -2.04254150390625, -1.955780029296875, -1.8690185546875, -1.782257080078125, -1.69549560546875, -1.608734130859375, -1.52197265625, -1.435211181640625, -1.34844970703125, -1.261688232421875, -1.1749267578125, -1.088165283203125, -1.00140380859375, -0.914642333984375, -0.827880859375, -0.741119384765625, -0.65435791015625, -0.567596435546875, -0.4808349609375, -0.394073486328125, -0.30731201171875, -0.220550537109375, -0.1337890625, -0.047027587890625, 0.03973388671875, 0.126495361328125, 0.2132568359375, 0.300018310546875, 0.38677978515625, 0.473541259765625, 0.560302734375, 0.647064208984375, 0.73382568359375, 0.820587158203125, 0.9073486328125, 0.994110107421875, 1.08087158203125, 1.167633056640625, 1.25439453125, 1.341156005859375, 1.42791748046875, 1.514678955078125, 1.6014404296875, 1.688201904296875, 1.77496337890625, 1.861724853515625, 1.948486328125, 2.035247802734375, 2.12200927734375, 2.208770751953125, 2.2955322265625, 2.382293701171875, 2.46905517578125, 2.555816650390625, 2.642578125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 2.0, 5.0, 8.0, 12.0, 18.0, 14.0, 23.0, 26.0, 42.0, 50.0, 57.0, 88.0, 71.0, 91.0, 87.0, 79.0, 62.0, 53.0, 50.0, 38.0, 24.0, 25.0, 14.0, 14.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.215232849121094, -21.419559478759766, -20.623886108398438, -19.82821273803711, -19.032541275024414, -18.236867904663086, -17.441194534301758, -16.64552116394043, -15.849847793579102, -15.054174423217773, -14.258502006530762, -13.462828636169434, -12.667155265808105, -11.871482849121094, -11.075809478759766, -10.280136108398438, -9.484463691711426, -8.688790321350098, -7.893117427825928, -7.097444534301758, -6.30177116394043, -5.50609827041626, -4.71042537689209, -3.9147520065307617, -3.119079113006592, -2.3234059810638428, -1.5277329683303833, -0.7320599555969238, 0.0636131763458252, 0.8592863082885742, 1.6549592018127441, 2.4506325721740723, 3.246305465698242, 4.041978359222412, 4.83765172958374, 5.63332462310791, 6.428997993469238, 7.224670886993408, 8.020343780517578, 8.816017150878906, 9.611690521240234, 10.407363891601562, 11.203036308288574, 11.998709678649902, 12.79438304901123, 13.590055465698242, 14.38572883605957, 15.181402206420898, 15.97707462310791, 16.772747039794922, 17.56842041015625, 18.364093780517578, 19.159767150878906, 19.955440521240234, 20.751113891601562, 21.54678726196289, 22.342458724975586, 23.138132095336914, 23.933805465698242, 24.729476928710938, 25.525150299072266, 26.320823669433594, 27.116497039794922, 27.91217041015625, 28.707843780517578]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 9.0, 12.0, 11.0, 11.0, 20.0, 16.0, 18.0, 17.0, 24.0, 37.0, 31.0, 31.0, 30.0, 35.0, 41.0, 46.0, 41.0, 27.0, 44.0, 35.0, 41.0, 30.0, 35.0, 51.0, 32.0, 35.0, 29.0, 28.0, 30.0, 28.0, 14.0, 23.0, 14.0, 12.0, 14.0, 4.0, 7.0, 5.0, 8.0, 3.0, 4.0, 0.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.837150573730469, -9.527704238891602, -9.218257904052734, -8.90881061553955, -8.599364280700684, -8.289917945861816, -7.980471611022949, -7.671024799346924, -7.361577987670898, -7.052131652832031, -6.742684841156006, -6.433238506317139, -6.123791694641113, -5.814345359802246, -5.504899024963379, -5.1954522132873535, -4.886005878448486, -4.576559543609619, -4.267112731933594, -3.9576663970947266, -3.648219585418701, -3.338773250579834, -3.0293266773223877, -2.7198801040649414, -2.410433530807495, -2.100986957550049, -1.7915403842926025, -1.4820939302444458, -1.1726473569869995, -0.8632007837295532, -0.5537543296813965, -0.2443077564239502, 0.0651388168334961, 0.37458536028862, 0.6840319037437439, 0.9934784173965454, 1.3029249906539917, 1.612371563911438, 1.9218180179595947, 2.231264591217041, 2.5407111644744873, 2.8501577377319336, 3.15960431098938, 3.469050884246826, 3.7784972190856934, 4.087944030761719, 4.397390365600586, 4.706836700439453, 5.0162835121154785, 5.325729846954346, 5.635176658630371, 5.944622993469238, 6.254069805145264, 6.563516139984131, 6.872962951660156, 7.182409286499023, 7.491855621337891, 7.801301956176758, 8.110748291015625, 8.420195579528809, 8.729641914367676, 9.039088249206543, 9.34853458404541, 9.657981872558594, 9.967428207397461]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 13.0, 15.0, 21.0, 28.0, 56.0, 55.0, 93.0, 137.0, 185.0, 274.0, 383.0, 599.0, 900.0, 1304.0, 2167.0, 3492.0, 5621.0, 10378.0, 19156.0, 38941.0, 87611.0, 217238.0, 607038.0, 1418050.0, 1100973.0, 401109.0, 150834.0, 63747.0, 29385.0, 14743.0, 7934.0, 4601.0, 2689.0, 1623.0, 982.0, 682.0, 404.0, 246.0, 162.0, 112.0, 85.0, 71.0, 45.0, 26.0, 30.0, 15.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.9375, -23.160400390625, -22.38330078125, -21.606201171875, -20.8291015625, -20.052001953125, -19.27490234375, -18.497802734375, -17.720703125, -16.943603515625, -16.16650390625, -15.389404296875, -14.6123046875, -13.835205078125, -13.05810546875, -12.281005859375, -11.50390625, -10.726806640625, -9.94970703125, -9.172607421875, -8.3955078125, -7.618408203125, -6.84130859375, -6.064208984375, -5.287109375, -4.510009765625, -3.73291015625, -2.955810546875, -2.1787109375, -1.401611328125, -0.62451171875, 0.152587890625, 0.9296875, 1.706787109375, 2.48388671875, 3.260986328125, 4.0380859375, 4.815185546875, 5.59228515625, 6.369384765625, 7.146484375, 7.923583984375, 8.70068359375, 9.477783203125, 10.2548828125, 11.031982421875, 11.80908203125, 12.586181640625, 13.36328125, 14.140380859375, 14.91748046875, 15.694580078125, 16.4716796875, 17.248779296875, 18.02587890625, 18.802978515625, 19.580078125, 20.357177734375, 21.13427734375, 21.911376953125, 22.6884765625, 23.465576171875, 24.24267578125, 25.019775390625, 25.796875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 8.0, 14.0, 17.0, 16.0, 15.0, 22.0, 13.0, 34.0, 26.0, 33.0, 31.0, 36.0, 46.0, 45.0, 47.0, 37.0, 50.0, 50.0, 44.0, 36.0, 40.0, 32.0, 33.0, 43.0, 33.0, 39.0, 29.0, 28.0, 20.0, 12.0, 15.0, 8.0, 6.0, 7.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.171875, -8.8851318359375, -8.598388671875, -8.3116455078125, -8.02490234375, -7.7381591796875, -7.451416015625, -7.1646728515625, -6.8779296875, -6.5911865234375, -6.304443359375, -6.0177001953125, -5.73095703125, -5.4442138671875, -5.157470703125, -4.8707275390625, -4.583984375, -4.2972412109375, -4.010498046875, -3.7237548828125, -3.43701171875, -3.1502685546875, -2.863525390625, -2.5767822265625, -2.2900390625, -2.0032958984375, -1.716552734375, -1.4298095703125, -1.14306640625, -0.8563232421875, -0.569580078125, -0.2828369140625, 0.00390625, 0.2906494140625, 0.577392578125, 0.8641357421875, 1.15087890625, 1.4376220703125, 1.724365234375, 2.0111083984375, 2.2978515625, 2.5845947265625, 2.871337890625, 3.1580810546875, 3.44482421875, 3.7315673828125, 4.018310546875, 4.3050537109375, 4.591796875, 4.8785400390625, 5.165283203125, 5.4520263671875, 5.73876953125, 6.0255126953125, 6.312255859375, 6.5989990234375, 6.8857421875, 7.1724853515625, 7.459228515625, 7.7459716796875, 8.03271484375, 8.3194580078125, 8.606201171875, 8.8929443359375, 9.1796875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 3.0, 6.0, 11.0, 16.0, 27.0, 29.0, 66.0, 82.0, 124.0, 182.0, 320.0, 525.0, 780.0, 1232.0, 2117.0, 3602.0, 6873.0, 13220.0, 26876.0, 59489.0, 145020.0, 392073.0, 1085628.0, 1458504.0, 615320.0, 219290.0, 86389.0, 37562.0, 17827.0, 9117.0, 4944.0, 2826.0, 1634.0, 969.0, 596.0, 371.0, 211.0, 143.0, 85.0, 58.0, 46.0, 36.0, 17.0, 15.0, 10.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.953125, -26.996337890625, -26.03955078125, -25.082763671875, -24.1259765625, -23.169189453125, -22.21240234375, -21.255615234375, -20.298828125, -19.342041015625, -18.38525390625, -17.428466796875, -16.4716796875, -15.514892578125, -14.55810546875, -13.601318359375, -12.64453125, -11.687744140625, -10.73095703125, -9.774169921875, -8.8173828125, -7.860595703125, -6.90380859375, -5.947021484375, -4.990234375, -4.033447265625, -3.07666015625, -2.119873046875, -1.1630859375, -0.206298828125, 0.75048828125, 1.707275390625, 2.6640625, 3.620849609375, 4.57763671875, 5.534423828125, 6.4912109375, 7.447998046875, 8.40478515625, 9.361572265625, 10.318359375, 11.275146484375, 12.23193359375, 13.188720703125, 14.1455078125, 15.102294921875, 16.05908203125, 17.015869140625, 17.97265625, 18.929443359375, 19.88623046875, 20.843017578125, 21.7998046875, 22.756591796875, 23.71337890625, 24.670166015625, 25.626953125, 26.583740234375, 27.54052734375, 28.497314453125, 29.4541015625, 30.410888671875, 31.36767578125, 32.324462890625, 33.28125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 9.0, 6.0, 13.0, 13.0, 22.0, 19.0, 35.0, 41.0, 55.0, 74.0, 100.0, 135.0, 151.0, 214.0, 234.0, 306.0, 311.0, 333.0, 315.0, 326.0, 310.0, 238.0, 199.0, 159.0, 113.0, 76.0, 68.0, 47.0, 40.0, 28.0, 17.0, 14.0, 12.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.0, -5.7857666015625, -5.571533203125, -5.3572998046875, -5.14306640625, -4.9288330078125, -4.714599609375, -4.5003662109375, -4.2861328125, -4.0718994140625, -3.857666015625, -3.6434326171875, -3.42919921875, -3.2149658203125, -3.000732421875, -2.7864990234375, -2.572265625, -2.3580322265625, -2.143798828125, -1.9295654296875, -1.71533203125, -1.5010986328125, -1.286865234375, -1.0726318359375, -0.8583984375, -0.6441650390625, -0.429931640625, -0.2156982421875, -0.00146484375, 0.2127685546875, 0.427001953125, 0.6412353515625, 0.85546875, 1.0697021484375, 1.283935546875, 1.4981689453125, 1.71240234375, 1.9266357421875, 2.140869140625, 2.3551025390625, 2.5693359375, 2.7835693359375, 2.997802734375, 3.2120361328125, 3.42626953125, 3.6405029296875, 3.854736328125, 4.0689697265625, 4.283203125, 4.4974365234375, 4.711669921875, 4.9259033203125, 5.14013671875, 5.3543701171875, 5.568603515625, 5.7828369140625, 5.9970703125, 6.2113037109375, 6.425537109375, 6.6397705078125, 6.85400390625, 7.0682373046875, 7.282470703125, 7.4967041015625, 7.7109375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 12.0, 12.0, 20.0, 21.0, 35.0, 45.0, 59.0, 63.0, 101.0, 82.0, 92.0, 99.0, 77.0, 67.0, 44.0, 36.0, 32.0, 21.0, 18.0, 11.0, 9.0, 7.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.593488693237305, -22.65788459777832, -21.722280502319336, -20.78667640686035, -19.851070404052734, -18.91546630859375, -17.979862213134766, -17.04425811767578, -16.108654022216797, -15.173049926757812, -14.237445831298828, -13.301840782165527, -12.366236686706543, -11.430632591247559, -10.495027542114258, -9.559423446655273, -8.623819351196289, -7.688215255737305, -6.752610683441162, -5.8170061111450195, -4.881402015686035, -3.945797920227051, -3.010193347930908, -2.0745887756347656, -1.1389846801757812, -0.20338034629821777, 0.7322239875793457, 1.6678283214569092, 2.6034326553344727, 3.539036750793457, 4.4746413230896, 5.410245895385742, 6.345848083496094, 7.281452178955078, 8.217056274414062, 9.152661323547363, 10.088265419006348, 11.023869514465332, 11.959474563598633, 12.895078659057617, 13.830682754516602, 14.766286849975586, 15.70189094543457, 16.637495040893555, 17.573101043701172, 18.508705139160156, 19.44430923461914, 20.379913330078125, 21.31551742553711, 22.251121520996094, 23.186725616455078, 24.122329711914062, 25.057933807373047, 25.99353790283203, 26.92914390563965, 27.864748001098633, 28.800352096557617, 29.7359561920166, 30.671560287475586, 31.60716438293457, 32.54277038574219, 33.47837448120117, 34.413978576660156, 35.34958267211914, 36.285186767578125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 10.0, 0.0, 14.0, 11.0, 13.0, 6.0, 7.0, 20.0, 21.0, 27.0, 20.0, 26.0, 38.0, 27.0, 35.0, 28.0, 38.0, 45.0, 36.0, 32.0, 27.0, 37.0, 32.0, 40.0, 40.0, 25.0, 34.0, 38.0, 38.0, 22.0, 27.0, 15.0, 21.0, 19.0, 16.0, 14.0, 15.0, 16.0, 13.0, 8.0, 12.0, 5.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.33753490447998, -8.042204856872559, -7.746875762939453, -7.451545715332031, -7.156216144561768, -6.860886573791504, -6.56555700302124, -6.270227432250977, -5.974897384643555, -5.679567813873291, -5.384238243103027, -5.0889081954956055, -4.793578624725342, -4.498249053955078, -4.2029194831848145, -3.9075896739959717, -3.612260341644287, -3.3169307708740234, -3.0216009616851807, -2.726271390914917, -2.430941581726074, -2.1356120109558105, -1.8402824401855469, -1.544952630996704, -1.2496230602264404, -0.9542933702468872, -0.6589637398719788, -0.3636341094970703, -0.06830441951751709, 0.22702527046203613, 0.5223548412322998, 0.8176846504211426, 1.1130142211914062, 1.4083439111709595, 1.7036736011505127, 1.9990031719207764, 2.294332981109619, 2.589662551879883, 2.8849921226501465, 3.1803219318389893, 3.475651502609253, 3.7709810733795166, 4.066310882568359, 4.361640453338623, 4.656970024108887, 4.952300071716309, 5.247629165649414, 5.542959213256836, 5.8382887840271, 6.133618354797363, 6.428947925567627, 6.724277496337891, 7.0196075439453125, 7.314937114715576, 7.61026668548584, 7.905596733093262, 8.200925827026367, 8.496255874633789, 8.791584968566895, 9.086915016174316, 9.382244110107422, 9.677574157714844, 9.972904205322266, 10.268233299255371, 10.563563346862793]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 12.0, 7.0, 23.0, 22.0, 45.0, 55.0, 98.0, 119.0, 177.0, 268.0, 362.0, 559.0, 935.0, 1365.0, 2168.0, 3465.0, 5754.0, 10048.0, 17828.0, 33429.0, 62296.0, 115703.0, 191448.0, 226868.0, 165526.0, 94625.0, 51273.0, 27331.0, 15011.0, 8480.0, 4962.0, 2910.0, 1871.0, 1241.0, 761.0, 502.0, 311.0, 217.0, 162.0, 91.0, 76.0, 38.0, 26.0, 28.0, 25.0, 7.0, 10.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.4765625, -11.1103515625, -10.744140625, -10.3779296875, -10.01171875, -9.6455078125, -9.279296875, -8.9130859375, -8.546875, -8.1806640625, -7.814453125, -7.4482421875, -7.08203125, -6.7158203125, -6.349609375, -5.9833984375, -5.6171875, -5.2509765625, -4.884765625, -4.5185546875, -4.15234375, -3.7861328125, -3.419921875, -3.0537109375, -2.6875, -2.3212890625, -1.955078125, -1.5888671875, -1.22265625, -0.8564453125, -0.490234375, -0.1240234375, 0.2421875, 0.6083984375, 0.974609375, 1.3408203125, 1.70703125, 2.0732421875, 2.439453125, 2.8056640625, 3.171875, 3.5380859375, 3.904296875, 4.2705078125, 4.63671875, 5.0029296875, 5.369140625, 5.7353515625, 6.1015625, 6.4677734375, 6.833984375, 7.2001953125, 7.56640625, 7.9326171875, 8.298828125, 8.6650390625, 9.03125, 9.3974609375, 9.763671875, 10.1298828125, 10.49609375, 10.8623046875, 11.228515625, 11.5947265625, 11.9609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 2.0, 10.0, 6.0, 11.0, 13.0, 13.0, 21.0, 18.0, 30.0, 23.0, 35.0, 27.0, 45.0, 48.0, 36.0, 38.0, 57.0, 33.0, 43.0, 41.0, 34.0, 48.0, 37.0, 41.0, 41.0, 24.0, 30.0, 33.0, 18.0, 24.0, 19.0, 15.0, 14.0, 12.0, 12.0, 12.0, 4.0, 7.0, 9.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.46875, -13.068359375, -12.66796875, -12.267578125, -11.8671875, -11.466796875, -11.06640625, -10.666015625, -10.265625, -9.865234375, -9.46484375, -9.064453125, -8.6640625, -8.263671875, -7.86328125, -7.462890625, -7.0625, -6.662109375, -6.26171875, -5.861328125, -5.4609375, -5.060546875, -4.66015625, -4.259765625, -3.859375, -3.458984375, -3.05859375, -2.658203125, -2.2578125, -1.857421875, -1.45703125, -1.056640625, -0.65625, -0.255859375, 0.14453125, 0.544921875, 0.9453125, 1.345703125, 1.74609375, 2.146484375, 2.546875, 2.947265625, 3.34765625, 3.748046875, 4.1484375, 4.548828125, 4.94921875, 5.349609375, 5.75, 6.150390625, 6.55078125, 6.951171875, 7.3515625, 7.751953125, 8.15234375, 8.552734375, 8.953125, 9.353515625, 9.75390625, 10.154296875, 10.5546875, 10.955078125, 11.35546875, 11.755859375, 12.15625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 12.0, 13.0, 23.0, 23.0, 23.0, 39.0, 49.0, 76.0, 116.0, 147.0, 217.0, 290.0, 432.0, 549.0, 811.0, 1273.0, 1933.0, 3152.0, 5155.0, 9127.0, 17017.0, 34499.0, 72511.0, 157662.0, 279769.0, 235762.0, 116378.0, 53464.0, 25808.0, 13111.0, 7212.0, 4217.0, 2511.0, 1722.0, 1021.0, 683.0, 489.0, 348.0, 247.0, 183.0, 122.0, 92.0, 72.0, 56.0, 39.0, 35.0, 19.0, 9.0, 15.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0], "bins": [-15.8046875, -15.3228759765625, -14.841064453125, -14.3592529296875, -13.87744140625, -13.3956298828125, -12.913818359375, -12.4320068359375, -11.9501953125, -11.4683837890625, -10.986572265625, -10.5047607421875, -10.02294921875, -9.5411376953125, -9.059326171875, -8.5775146484375, -8.095703125, -7.6138916015625, -7.132080078125, -6.6502685546875, -6.16845703125, -5.6866455078125, -5.204833984375, -4.7230224609375, -4.2412109375, -3.7593994140625, -3.277587890625, -2.7957763671875, -2.31396484375, -1.8321533203125, -1.350341796875, -0.8685302734375, -0.38671875, 0.0950927734375, 0.576904296875, 1.0587158203125, 1.54052734375, 2.0223388671875, 2.504150390625, 2.9859619140625, 3.4677734375, 3.9495849609375, 4.431396484375, 4.9132080078125, 5.39501953125, 5.8768310546875, 6.358642578125, 6.8404541015625, 7.322265625, 7.8040771484375, 8.285888671875, 8.7677001953125, 9.24951171875, 9.7313232421875, 10.213134765625, 10.6949462890625, 11.1767578125, 11.6585693359375, 12.140380859375, 12.6221923828125, 13.10400390625, 13.5858154296875, 14.067626953125, 14.5494384765625, 15.03125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 8.0, 9.0, 10.0, 14.0, 16.0, 15.0, 16.0, 27.0, 20.0, 33.0, 32.0, 32.0, 37.0, 39.0, 25.0, 42.0, 30.0, 38.0, 44.0, 40.0, 45.0, 40.0, 41.0, 39.0, 30.0, 41.0, 23.0, 26.0, 35.0, 25.0, 13.0, 14.0, 14.0, 16.0, 11.0, 9.0, 9.0, 4.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.76171875, -7.53497314453125, -7.3082275390625, -7.08148193359375, -6.854736328125, -6.62799072265625, -6.4012451171875, -6.17449951171875, -5.94775390625, -5.72100830078125, -5.4942626953125, -5.26751708984375, -5.040771484375, -4.81402587890625, -4.5872802734375, -4.36053466796875, -4.1337890625, -3.90704345703125, -3.6802978515625, -3.45355224609375, -3.226806640625, -3.00006103515625, -2.7733154296875, -2.54656982421875, -2.31982421875, -2.09307861328125, -1.8663330078125, -1.63958740234375, -1.412841796875, -1.18609619140625, -0.9593505859375, -0.73260498046875, -0.505859375, -0.27911376953125, -0.0523681640625, 0.17437744140625, 0.401123046875, 0.62786865234375, 0.8546142578125, 1.08135986328125, 1.30810546875, 1.53485107421875, 1.7615966796875, 1.98834228515625, 2.215087890625, 2.44183349609375, 2.6685791015625, 2.89532470703125, 3.1220703125, 3.34881591796875, 3.5755615234375, 3.80230712890625, 4.029052734375, 4.25579833984375, 4.4825439453125, 4.70928955078125, 4.93603515625, 5.16278076171875, 5.3895263671875, 5.61627197265625, 5.843017578125, 6.06976318359375, 6.2965087890625, 6.52325439453125, 6.75]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 5.0, 6.0, 3.0, 2.0, 4.0, 10.0, 19.0, 22.0, 18.0, 22.0, 35.0, 40.0, 58.0, 85.0, 101.0, 147.0, 220.0, 345.0, 419.0, 562.0, 948.0, 1412.0, 2501.0, 4712.0, 11178.0, 33009.0, 136622.0, 541273.0, 235715.0, 49768.0, 14882.0, 6213.0, 3049.0, 1746.0, 1079.0, 675.0, 438.0, 353.0, 255.0, 148.0, 123.0, 93.0, 63.0, 55.0, 36.0, 30.0, 21.0, 12.0, 13.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.676513671875, -10.29052734375, -9.904541015625, -9.5185546875, -9.132568359375, -8.74658203125, -8.360595703125, -7.974609375, -7.588623046875, -7.20263671875, -6.816650390625, -6.4306640625, -6.044677734375, -5.65869140625, -5.272705078125, -4.88671875, -4.500732421875, -4.11474609375, -3.728759765625, -3.3427734375, -2.956787109375, -2.57080078125, -2.184814453125, -1.798828125, -1.412841796875, -1.02685546875, -0.640869140625, -0.2548828125, 0.131103515625, 0.51708984375, 0.903076171875, 1.2890625, 1.675048828125, 2.06103515625, 2.447021484375, 2.8330078125, 3.218994140625, 3.60498046875, 3.990966796875, 4.376953125, 4.762939453125, 5.14892578125, 5.534912109375, 5.9208984375, 6.306884765625, 6.69287109375, 7.078857421875, 7.46484375, 7.850830078125, 8.23681640625, 8.622802734375, 9.0087890625, 9.394775390625, 9.78076171875, 10.166748046875, 10.552734375, 10.938720703125, 11.32470703125, 11.710693359375, 12.0966796875, 12.482666015625, 12.86865234375, 13.254638671875, 13.640625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 9.0, 9.0, 20.0, 25.0, 52.0, 99.0, 153.0, 185.0, 158.0, 121.0, 63.0, 44.0, 18.0, 15.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007781982421875, -0.0007500648498535156, -0.0007219314575195312, -0.0006937980651855469, -0.0006656646728515625, -0.0006375312805175781, -0.0006093978881835938, -0.0005812644958496094, -0.000553131103515625, -0.0005249977111816406, -0.0004968643188476562, -0.0004687309265136719, -0.0004405975341796875, -0.0004124641418457031, -0.00038433074951171875, -0.0003561973571777344, -0.00032806396484375, -0.0002999305725097656, -0.00027179718017578125, -0.00024366378784179688, -0.0002155303955078125, -0.00018739700317382812, -0.00015926361083984375, -0.00013113021850585938, -0.000102996826171875, -7.486343383789062e-05, -4.673004150390625e-05, -1.8596649169921875e-05, 9.5367431640625e-06, 3.7670135498046875e-05, 6.580352783203125e-05, 9.393692016601562e-05, 0.0001220703125, 0.00015020370483398438, 0.00017833709716796875, 0.00020647048950195312, 0.0002346038818359375, 0.0002627372741699219, 0.00029087066650390625, 0.0003190040588378906, 0.000347137451171875, 0.0003752708435058594, 0.00040340423583984375, 0.0004315376281738281, 0.0004596710205078125, 0.0004878044128417969, 0.0005159378051757812, 0.0005440711975097656, 0.00057220458984375, 0.0006003379821777344, 0.0006284713745117188, 0.0006566047668457031, 0.0006847381591796875, 0.0007128715515136719, 0.0007410049438476562, 0.0007691383361816406, 0.000797271728515625, 0.0008254051208496094, 0.0008535385131835938, 0.0008816719055175781, 0.0009098052978515625, 0.0009379386901855469, 0.0009660720825195312, 0.0009942054748535156, 0.0010223388671875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 17.0, 28.0, 36.0, 39.0, 55.0, 70.0, 111.0, 149.0, 207.0, 252.0, 349.0, 447.0, 581.0, 817.0, 1037.0, 1553.0, 2237.0, 3440.0, 6096.0, 13101.0, 34543.0, 109532.0, 329728.0, 351845.0, 121925.0, 37982.0, 14064.0, 6461.0, 3563.0, 2220.0, 1595.0, 1158.0, 875.0, 620.0, 456.0, 338.0, 291.0, 192.0, 137.0, 114.0, 75.0, 68.0, 42.0, 28.0, 18.0, 20.0, 12.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0], "bins": [-10.7578125, -10.4322509765625, -10.106689453125, -9.7811279296875, -9.45556640625, -9.1300048828125, -8.804443359375, -8.4788818359375, -8.1533203125, -7.8277587890625, -7.502197265625, -7.1766357421875, -6.85107421875, -6.5255126953125, -6.199951171875, -5.8743896484375, -5.548828125, -5.2232666015625, -4.897705078125, -4.5721435546875, -4.24658203125, -3.9210205078125, -3.595458984375, -3.2698974609375, -2.9443359375, -2.6187744140625, -2.293212890625, -1.9676513671875, -1.64208984375, -1.3165283203125, -0.990966796875, -0.6654052734375, -0.33984375, -0.0142822265625, 0.311279296875, 0.6368408203125, 0.96240234375, 1.2879638671875, 1.613525390625, 1.9390869140625, 2.2646484375, 2.5902099609375, 2.915771484375, 3.2413330078125, 3.56689453125, 3.8924560546875, 4.218017578125, 4.5435791015625, 4.869140625, 5.1947021484375, 5.520263671875, 5.8458251953125, 6.17138671875, 6.4969482421875, 6.822509765625, 7.1480712890625, 7.4736328125, 7.7991943359375, 8.124755859375, 8.4503173828125, 8.77587890625, 9.1014404296875, 9.427001953125, 9.7525634765625, 10.078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 11.0, 8.0, 15.0, 11.0, 18.0, 23.0, 31.0, 27.0, 54.0, 58.0, 75.0, 86.0, 108.0, 91.0, 82.0, 65.0, 55.0, 49.0, 29.0, 24.0, 14.0, 18.0, 10.0, 5.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.8064422607421875, -1.738861083984375, -1.6712799072265625, -1.60369873046875, -1.5361175537109375, -1.468536376953125, -1.4009552001953125, -1.3333740234375, -1.2657928466796875, -1.198211669921875, -1.1306304931640625, -1.06304931640625, -0.9954681396484375, -0.927886962890625, -0.8603057861328125, -0.792724609375, -0.7251434326171875, -0.657562255859375, -0.5899810791015625, -0.52239990234375, -0.4548187255859375, -0.387237548828125, -0.3196563720703125, -0.2520751953125, -0.1844940185546875, -0.116912841796875, -0.0493316650390625, 0.01824951171875, 0.0858306884765625, 0.153411865234375, 0.2209930419921875, 0.28857421875, 0.3561553955078125, 0.423736572265625, 0.4913177490234375, 0.55889892578125, 0.6264801025390625, 0.694061279296875, 0.7616424560546875, 0.8292236328125, 0.8968048095703125, 0.964385986328125, 1.0319671630859375, 1.09954833984375, 1.1671295166015625, 1.234710693359375, 1.3022918701171875, 1.369873046875, 1.4374542236328125, 1.505035400390625, 1.5726165771484375, 1.64019775390625, 1.7077789306640625, 1.775360107421875, 1.8429412841796875, 1.9105224609375, 1.9781036376953125, 2.045684814453125, 2.1132659912109375, 2.18084716796875, 2.2484283447265625, 2.316009521484375, 2.3835906982421875, 2.451171875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 11.0, 11.0, 12.0, 25.0, 24.0, 35.0, 40.0, 68.0, 77.0, 86.0, 88.0, 95.0, 80.0, 84.0, 61.0, 52.0, 25.0, 26.0, 20.0, 17.0, 14.0, 11.0, 3.0, 4.0, 4.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.817096710205078, -21.90509605407715, -20.99309539794922, -20.08109474182129, -19.16909408569336, -18.25709342956543, -17.3450927734375, -16.433090209960938, -15.521090507507324, -14.609089851379395, -13.697089195251465, -12.785087585449219, -11.873086929321289, -10.96108627319336, -10.04908561706543, -9.1370849609375, -8.22508430480957, -7.313083648681641, -6.401082992553711, -5.489081859588623, -4.577081203460693, -3.6650805473327637, -2.753079414367676, -1.841078758239746, -0.9290781021118164, -0.017077326774597168, 0.8949234485626221, 1.8069243431091309, 2.7189249992370605, 3.6309256553649902, 4.542926788330078, 5.454927444458008, 6.3669281005859375, 7.278928756713867, 8.190929412841797, 9.102930068969727, 10.014930725097656, 10.926931381225586, 11.838932991027832, 12.750933647155762, 13.662934303283691, 14.574934959411621, 15.48693561553955, 16.398937225341797, 17.310937881469727, 18.222938537597656, 19.134939193725586, 20.046939849853516, 20.958940505981445, 21.870941162109375, 22.782941818237305, 23.694942474365234, 24.606943130493164, 25.518943786621094, 26.430946350097656, 27.342945098876953, 28.254947662353516, 29.166948318481445, 30.078948974609375, 30.990949630737305, 31.902950286865234, 32.8149528503418, 33.726951599121094, 34.638954162597656, 35.55095291137695]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 8.0, 11.0, 11.0, 9.0, 11.0, 9.0, 17.0, 19.0, 22.0, 22.0, 26.0, 28.0, 38.0, 31.0, 27.0, 39.0, 43.0, 25.0, 44.0, 36.0, 32.0, 26.0, 39.0, 34.0, 34.0, 31.0, 37.0, 26.0, 34.0, 24.0, 25.0, 25.0, 17.0, 11.0, 15.0, 16.0, 18.0, 13.0, 13.0, 7.0, 8.0, 6.0, 6.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.32688045501709, -8.037407875061035, -7.747934341430664, -7.458461284637451, -7.168988227844238, -6.879515171051025, -6.5900421142578125, -6.300569534301758, -6.011096000671387, -5.721622943878174, -5.432149887084961, -5.142676830291748, -4.853203773498535, -4.563730716705322, -4.274257659912109, -3.9847848415374756, -3.695312023162842, -3.405838966369629, -3.116365909576416, -2.826892852783203, -2.5374197959899902, -2.2479467391967773, -1.9584739208221436, -1.6690008640289307, -1.3795278072357178, -1.0900547504425049, -0.8005817532539368, -0.5111087560653687, -0.22163569927215576, 0.06783735752105713, 0.35731029510498047, 0.6467833518981934, 0.9362564086914062, 1.2257294654846191, 1.515202522277832, 1.8046754598617554, 2.094148635864258, 2.3836216926574707, 2.6730945110321045, 2.9625675678253174, 3.2520406246185303, 3.541513681411743, 3.830986738204956, 4.12045955657959, 4.409932613372803, 4.699405670166016, 4.9888787269592285, 5.278351783752441, 5.567824840545654, 5.857297897338867, 6.14677095413208, 6.436244010925293, 6.725717067718506, 7.015190124511719, 7.304662704467773, 7.5941362380981445, 7.883608818054199, 8.173081398010254, 8.462554931640625, 8.75202751159668, 9.04150104522705, 9.330973625183105, 9.620447158813477, 9.909919738769531, 10.199393272399902]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 13.0, 14.0, 35.0, 47.0, 61.0, 114.0, 194.0, 343.0, 581.0, 1097.0, 1918.0, 3510.0, 6753.0, 12366.0, 23467.0, 43282.0, 79113.0, 131211.0, 187697.0, 197319.0, 150933.0, 94354.0, 52532.0, 28471.0, 15224.0, 8181.0, 4292.0, 2397.0, 1336.0, 707.0, 399.0, 245.0, 133.0, 74.0, 38.0, 25.0, 23.0, 17.0, 6.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-21.46875, -20.858154296875, -20.24755859375, -19.636962890625, -19.0263671875, -18.415771484375, -17.80517578125, -17.194580078125, -16.583984375, -15.973388671875, -15.36279296875, -14.752197265625, -14.1416015625, -13.531005859375, -12.92041015625, -12.309814453125, -11.69921875, -11.088623046875, -10.47802734375, -9.867431640625, -9.2568359375, -8.646240234375, -8.03564453125, -7.425048828125, -6.814453125, -6.203857421875, -5.59326171875, -4.982666015625, -4.3720703125, -3.761474609375, -3.15087890625, -2.540283203125, -1.9296875, -1.319091796875, -0.70849609375, -0.097900390625, 0.5126953125, 1.123291015625, 1.73388671875, 2.344482421875, 2.955078125, 3.565673828125, 4.17626953125, 4.786865234375, 5.3974609375, 6.008056640625, 6.61865234375, 7.229248046875, 7.83984375, 8.450439453125, 9.06103515625, 9.671630859375, 10.2822265625, 10.892822265625, 11.50341796875, 12.114013671875, 12.724609375, 13.335205078125, 13.94580078125, 14.556396484375, 15.1669921875, 15.777587890625, 16.38818359375, 16.998779296875, 17.609375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 7.0, 8.0, 18.0, 12.0, 25.0, 15.0, 24.0, 30.0, 33.0, 49.0, 44.0, 39.0, 58.0, 51.0, 46.0, 59.0, 40.0, 49.0, 52.0, 52.0, 52.0, 31.0, 41.0, 32.0, 20.0, 26.0, 20.0, 13.0, 16.0, 10.0, 13.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.859375, -12.398681640625, -11.93798828125, -11.477294921875, -11.0166015625, -10.555908203125, -10.09521484375, -9.634521484375, -9.173828125, -8.713134765625, -8.25244140625, -7.791748046875, -7.3310546875, -6.870361328125, -6.40966796875, -5.948974609375, -5.48828125, -5.027587890625, -4.56689453125, -4.106201171875, -3.6455078125, -3.184814453125, -2.72412109375, -2.263427734375, -1.802734375, -1.342041015625, -0.88134765625, -0.420654296875, 0.0400390625, 0.500732421875, 0.96142578125, 1.422119140625, 1.8828125, 2.343505859375, 2.80419921875, 3.264892578125, 3.7255859375, 4.186279296875, 4.64697265625, 5.107666015625, 5.568359375, 6.029052734375, 6.48974609375, 6.950439453125, 7.4111328125, 7.871826171875, 8.33251953125, 8.793212890625, 9.25390625, 9.714599609375, 10.17529296875, 10.635986328125, 11.0966796875, 11.557373046875, 12.01806640625, 12.478759765625, 12.939453125, 13.400146484375, 13.86083984375, 14.321533203125, 14.7822265625, 15.242919921875, 15.70361328125, 16.164306640625, 16.625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 7.0, 15.0, 36.0, 40.0, 69.0, 90.0, 166.0, 198.0, 322.0, 491.0, 906.0, 1351.0, 2128.0, 3451.0, 5755.0, 9216.0, 15169.0, 24164.0, 38932.0, 60242.0, 89284.0, 121722.0, 147490.0, 147776.0, 123737.0, 90546.0, 60990.0, 39202.0, 24669.0, 15321.0, 9611.0, 5766.0, 3622.0, 2219.0, 1415.0, 891.0, 556.0, 366.0, 217.0, 134.0, 89.0, 66.0, 40.0, 21.0, 20.0, 9.0, 12.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8515625, -12.4234619140625, -11.995361328125, -11.5672607421875, -11.13916015625, -10.7110595703125, -10.282958984375, -9.8548583984375, -9.4267578125, -8.9986572265625, -8.570556640625, -8.1424560546875, -7.71435546875, -7.2862548828125, -6.858154296875, -6.4300537109375, -6.001953125, -5.5738525390625, -5.145751953125, -4.7176513671875, -4.28955078125, -3.8614501953125, -3.433349609375, -3.0052490234375, -2.5771484375, -2.1490478515625, -1.720947265625, -1.2928466796875, -0.86474609375, -0.4366455078125, -0.008544921875, 0.4195556640625, 0.84765625, 1.2757568359375, 1.703857421875, 2.1319580078125, 2.56005859375, 2.9881591796875, 3.416259765625, 3.8443603515625, 4.2724609375, 4.7005615234375, 5.128662109375, 5.5567626953125, 5.98486328125, 6.4129638671875, 6.841064453125, 7.2691650390625, 7.697265625, 8.1253662109375, 8.553466796875, 8.9815673828125, 9.40966796875, 9.8377685546875, 10.265869140625, 10.6939697265625, 11.1220703125, 11.5501708984375, 11.978271484375, 12.4063720703125, 12.83447265625, 13.2625732421875, 13.690673828125, 14.1187744140625, 14.546875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 1.0, 4.0, 6.0, 9.0, 14.0, 14.0, 27.0, 19.0, 30.0, 34.0, 24.0, 22.0, 46.0, 48.0, 50.0, 41.0, 40.0, 57.0, 40.0, 47.0, 34.0, 42.0, 33.0, 36.0, 27.0, 33.0, 29.0, 32.0, 25.0, 25.0, 23.0, 15.0, 17.0, 9.0, 11.0, 5.0, 7.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.7578125, -6.52874755859375, -6.2996826171875, -6.07061767578125, -5.841552734375, -5.61248779296875, -5.3834228515625, -5.15435791015625, -4.92529296875, -4.69622802734375, -4.4671630859375, -4.23809814453125, -4.009033203125, -3.77996826171875, -3.5509033203125, -3.32183837890625, -3.0927734375, -2.86370849609375, -2.6346435546875, -2.40557861328125, -2.176513671875, -1.94744873046875, -1.7183837890625, -1.48931884765625, -1.26025390625, -1.03118896484375, -0.8021240234375, -0.57305908203125, -0.343994140625, -0.11492919921875, 0.1141357421875, 0.34320068359375, 0.572265625, 0.80133056640625, 1.0303955078125, 1.25946044921875, 1.488525390625, 1.71759033203125, 1.9466552734375, 2.17572021484375, 2.40478515625, 2.63385009765625, 2.8629150390625, 3.09197998046875, 3.321044921875, 3.55010986328125, 3.7791748046875, 4.00823974609375, 4.2373046875, 4.46636962890625, 4.6954345703125, 4.92449951171875, 5.153564453125, 5.38262939453125, 5.6116943359375, 5.84075927734375, 6.06982421875, 6.29888916015625, 6.5279541015625, 6.75701904296875, 6.986083984375, 7.21514892578125, 7.4442138671875, 7.67327880859375, 7.90234375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 25.0, 23.0, 35.0, 54.0, 69.0, 97.0, 136.0, 208.0, 344.0, 452.0, 659.0, 1033.0, 1577.0, 2503.0, 3927.0, 6525.0, 10733.0, 18270.0, 31246.0, 53871.0, 91598.0, 143655.0, 187235.0, 178077.0, 126762.0, 77669.0, 45479.0, 26292.0, 15411.0, 9095.0, 5667.0, 3453.0, 2175.0, 1375.0, 887.0, 568.0, 413.0, 298.0, 200.0, 122.0, 98.0, 61.0, 47.0, 24.0, 29.0, 20.0, 12.0, 11.0, 10.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.81640625, -6.60235595703125, -6.3883056640625, -6.17425537109375, -5.960205078125, -5.74615478515625, -5.5321044921875, -5.31805419921875, -5.10400390625, -4.88995361328125, -4.6759033203125, -4.46185302734375, -4.247802734375, -4.03375244140625, -3.8197021484375, -3.60565185546875, -3.3916015625, -3.17755126953125, -2.9635009765625, -2.74945068359375, -2.535400390625, -2.32135009765625, -2.1072998046875, -1.89324951171875, -1.67919921875, -1.46514892578125, -1.2510986328125, -1.03704833984375, -0.822998046875, -0.60894775390625, -0.3948974609375, -0.18084716796875, 0.033203125, 0.24725341796875, 0.4613037109375, 0.67535400390625, 0.889404296875, 1.10345458984375, 1.3175048828125, 1.53155517578125, 1.74560546875, 1.95965576171875, 2.1737060546875, 2.38775634765625, 2.601806640625, 2.81585693359375, 3.0299072265625, 3.24395751953125, 3.4580078125, 3.67205810546875, 3.8861083984375, 4.10015869140625, 4.314208984375, 4.52825927734375, 4.7423095703125, 4.95635986328125, 5.17041015625, 5.38446044921875, 5.5985107421875, 5.81256103515625, 6.026611328125, 6.24066162109375, 6.4547119140625, 6.66876220703125, 6.8828125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 10.0, 19.0, 13.0, 26.0, 28.0, 37.0, 42.0, 55.0, 66.0, 76.0, 98.0, 87.0, 95.0, 78.0, 66.0, 47.0, 33.0, 26.0, 17.0, 11.0, 11.0, 15.0, 7.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010080337524414062, -0.0009734034538269043, -0.0009387731552124023, -0.0009041428565979004, -0.0008695125579833984, -0.0008348822593688965, -0.0008002519607543945, -0.0007656216621398926, -0.0007309913635253906, -0.0006963610649108887, -0.0006617307662963867, -0.0006271004676818848, -0.0005924701690673828, -0.0005578398704528809, -0.0005232095718383789, -0.000488579273223877, -0.000453948974609375, -0.00041931867599487305, -0.0003846883773803711, -0.00035005807876586914, -0.0003154277801513672, -0.00028079748153686523, -0.0002461671829223633, -0.00021153688430786133, -0.00017690658569335938, -0.00014227628707885742, -0.00010764598846435547, -7.301568984985352e-05, -3.838539123535156e-05, -3.7550926208496094e-06, 3.0875205993652344e-05, 6.55055046081543e-05, 0.00010013580322265625, 0.0001347661018371582, 0.00016939640045166016, 0.0002040266990661621, 0.00023865699768066406, 0.000273287296295166, 0.00030791759490966797, 0.0003425478935241699, 0.0003771781921386719, 0.00041180849075317383, 0.0004464387893676758, 0.00048106908798217773, 0.0005156993865966797, 0.0005503296852111816, 0.0005849599838256836, 0.0006195902824401855, 0.0006542205810546875, 0.0006888508796691895, 0.0007234811782836914, 0.0007581114768981934, 0.0007927417755126953, 0.0008273720741271973, 0.0008620023727416992, 0.0008966326713562012, 0.0009312629699707031, 0.0009658932685852051, 0.001000523567199707, 0.001035153865814209, 0.001069784164428711, 0.0011044144630432129, 0.0011390447616577148, 0.0011736750602722168, 0.0012083053588867188]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 14.0, 5.0, 12.0, 24.0, 44.0, 45.0, 125.0, 156.0, 259.0, 425.0, 690.0, 1103.0, 1941.0, 3354.0, 5920.0, 10659.0, 19632.0, 37116.0, 71023.0, 128020.0, 198449.0, 217044.0, 157031.0, 90380.0, 48526.0, 25189.0, 13611.0, 7529.0, 4221.0, 2491.0, 1452.0, 773.0, 515.0, 305.0, 171.0, 108.0, 81.0, 42.0, 32.0, 15.0, 17.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.82781982421875, -8.5697021484375, -8.31158447265625, -8.053466796875, -7.79534912109375, -7.5372314453125, -7.27911376953125, -7.02099609375, -6.76287841796875, -6.5047607421875, -6.24664306640625, -5.988525390625, -5.73040771484375, -5.4722900390625, -5.21417236328125, -4.9560546875, -4.69793701171875, -4.4398193359375, -4.18170166015625, -3.923583984375, -3.66546630859375, -3.4073486328125, -3.14923095703125, -2.89111328125, -2.63299560546875, -2.3748779296875, -2.11676025390625, -1.858642578125, -1.60052490234375, -1.3424072265625, -1.08428955078125, -0.826171875, -0.56805419921875, -0.3099365234375, -0.05181884765625, 0.206298828125, 0.46441650390625, 0.7225341796875, 0.98065185546875, 1.23876953125, 1.49688720703125, 1.7550048828125, 2.01312255859375, 2.271240234375, 2.52935791015625, 2.7874755859375, 3.04559326171875, 3.3037109375, 3.56182861328125, 3.8199462890625, 4.07806396484375, 4.336181640625, 4.59429931640625, 4.8524169921875, 5.11053466796875, 5.36865234375, 5.62677001953125, 5.8848876953125, 6.14300537109375, 6.401123046875, 6.65924072265625, 6.9173583984375, 7.17547607421875, 7.43359375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 9.0, 7.0, 6.0, 8.0, 18.0, 10.0, 21.0, 17.0, 18.0, 25.0, 25.0, 26.0, 34.0, 36.0, 50.0, 39.0, 72.0, 56.0, 57.0, 40.0, 38.0, 43.0, 60.0, 47.0, 29.0, 27.0, 24.0, 28.0, 17.0, 19.0, 22.0, 10.0, 10.0, 7.0, 7.0, 11.0, 15.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.983001708984375, -1.91912841796875, -1.855255126953125, -1.7913818359375, -1.727508544921875, -1.66363525390625, -1.599761962890625, -1.535888671875, -1.472015380859375, -1.40814208984375, -1.344268798828125, -1.2803955078125, -1.216522216796875, -1.15264892578125, -1.088775634765625, -1.02490234375, -0.961029052734375, -0.89715576171875, -0.833282470703125, -0.7694091796875, -0.705535888671875, -0.64166259765625, -0.577789306640625, -0.513916015625, -0.450042724609375, -0.38616943359375, -0.322296142578125, -0.2584228515625, -0.194549560546875, -0.13067626953125, -0.066802978515625, -0.0029296875, 0.060943603515625, 0.12481689453125, 0.188690185546875, 0.2525634765625, 0.316436767578125, 0.38031005859375, 0.444183349609375, 0.508056640625, 0.571929931640625, 0.63580322265625, 0.699676513671875, 0.7635498046875, 0.827423095703125, 0.89129638671875, 0.955169677734375, 1.01904296875, 1.082916259765625, 1.14678955078125, 1.210662841796875, 1.2745361328125, 1.338409423828125, 1.40228271484375, 1.466156005859375, 1.530029296875, 1.593902587890625, 1.65777587890625, 1.721649169921875, 1.7855224609375, 1.849395751953125, 1.91326904296875, 1.977142333984375, 2.041015625]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 12.0, 8.0, 15.0, 25.0, 22.0, 24.0, 38.0, 49.0, 52.0, 71.0, 85.0, 77.0, 80.0, 79.0, 67.0, 64.0, 50.0, 40.0, 27.0, 17.0, 14.0, 16.0, 8.0, 15.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.304981231689453, -20.486417770385742, -19.66785430908203, -18.84929084777832, -18.03072738647461, -17.2121639251709, -16.393600463867188, -15.575037002563477, -14.756473541259766, -13.937910079956055, -13.119346618652344, -12.300783157348633, -11.482219696044922, -10.663656234741211, -9.8450927734375, -9.026529312133789, -8.207964897155762, -7.389401435852051, -6.57083797454834, -5.752274513244629, -4.933711051940918, -4.115147113800049, -3.296583652496338, -2.478020191192627, -1.659456729888916, -0.8408932089805603, -0.02232968807220459, 0.7962338924407959, 1.6147973537445068, 2.433361053466797, 3.251924514770508, 4.070487976074219, 4.88905143737793, 5.707614898681641, 6.526178359985352, 7.3447418212890625, 8.163305282592773, 8.981868743896484, 9.800432205200195, 10.618995666503906, 11.437559127807617, 12.256122589111328, 13.074686050415039, 13.89324951171875, 14.711812973022461, 15.530376434326172, 16.348939895629883, 17.167503356933594, 17.986068725585938, 18.80463218688965, 19.62319564819336, 20.44175910949707, 21.26032257080078, 22.078886032104492, 22.897449493408203, 23.716012954711914, 24.534576416015625, 25.353139877319336, 26.171703338623047, 26.990266799926758, 27.80883026123047, 28.62739372253418, 29.44595718383789, 30.2645206451416, 31.083084106445312]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 6.0, 9.0, 10.0, 8.0, 15.0, 8.0, 12.0, 17.0, 17.0, 18.0, 21.0, 25.0, 25.0, 26.0, 26.0, 40.0, 40.0, 31.0, 32.0, 39.0, 41.0, 29.0, 34.0, 39.0, 37.0, 25.0, 34.0, 25.0, 31.0, 33.0, 25.0, 30.0, 14.0, 19.0, 15.0, 21.0, 11.0, 14.0, 12.0, 15.0, 9.0, 8.0, 9.0, 5.0, 6.0, 3.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.12578010559082, -7.842883110046387, -7.559986114501953, -7.2770891189575195, -6.994192123413086, -6.711295127868652, -6.428398609161377, -6.145501613616943, -5.86260461807251, -5.579707622528076, -5.296810626983643, -5.013913631439209, -4.731017112731934, -4.4481201171875, -4.165223121643066, -3.882326126098633, -3.599429130554199, -3.3165321350097656, -3.033635139465332, -2.7507383823394775, -2.467841386795044, -2.1849443912506104, -1.9020475149154663, -1.6191506385803223, -1.3362536430358887, -1.053356647491455, -0.770459771156311, -0.4875628352165222, -0.2046658992767334, 0.0782310962677002, 0.36112797260284424, 0.6440248489379883, 0.9269227981567383, 1.2098197937011719, 1.492716670036316, 1.77561354637146, 2.0585105419158936, 2.341407537460327, 2.6243042945861816, 2.9072012901306152, 3.190098285675049, 3.4729952812194824, 3.755892276763916, 4.03878927230835, 4.321685791015625, 4.604582786560059, 4.887479782104492, 5.170376777648926, 5.453273773193359, 5.736170768737793, 6.019067764282227, 6.30196475982666, 6.584861755371094, 6.867758750915527, 7.150655269622803, 7.433552265167236, 7.71644926071167, 7.9993462562561035, 8.282242774963379, 8.565139770507812, 8.848036766052246, 9.13093376159668, 9.413830757141113, 9.696727752685547, 9.97962474822998]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 11.0, 11.0, 17.0, 25.0, 32.0, 61.0, 72.0, 98.0, 174.0, 278.0, 433.0, 628.0, 995.0, 1662.0, 2646.0, 4622.0, 8258.0, 15521.0, 30661.0, 68161.0, 168702.0, 477298.0, 1261938.0, 1326379.0, 509489.0, 177687.0, 70531.0, 31608.0, 15910.0, 8404.0, 4574.0, 2772.0, 1672.0, 970.0, 704.0, 409.0, 293.0, 188.0, 112.0, 72.0, 67.0, 46.0, 27.0, 20.0, 14.0, 11.0, 10.0, 9.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-23.828125, -22.912841796875, -21.99755859375, -21.082275390625, -20.1669921875, -19.251708984375, -18.33642578125, -17.421142578125, -16.505859375, -15.590576171875, -14.67529296875, -13.760009765625, -12.8447265625, -11.929443359375, -11.01416015625, -10.098876953125, -9.18359375, -8.268310546875, -7.35302734375, -6.437744140625, -5.5224609375, -4.607177734375, -3.69189453125, -2.776611328125, -1.861328125, -0.946044921875, -0.03076171875, 0.884521484375, 1.7998046875, 2.715087890625, 3.63037109375, 4.545654296875, 5.4609375, 6.376220703125, 7.29150390625, 8.206787109375, 9.1220703125, 10.037353515625, 10.95263671875, 11.867919921875, 12.783203125, 13.698486328125, 14.61376953125, 15.529052734375, 16.4443359375, 17.359619140625, 18.27490234375, 19.190185546875, 20.10546875, 21.020751953125, 21.93603515625, 22.851318359375, 23.7666015625, 24.681884765625, 25.59716796875, 26.512451171875, 27.427734375, 28.343017578125, 29.25830078125, 30.173583984375, 31.0888671875, 32.004150390625, 32.91943359375, 33.834716796875, 34.75]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 1.0, 7.0, 9.0, 10.0, 12.0, 6.0, 12.0, 21.0, 19.0, 18.0, 23.0, 30.0, 24.0, 30.0, 23.0, 36.0, 47.0, 37.0, 27.0, 41.0, 45.0, 43.0, 41.0, 39.0, 25.0, 33.0, 27.0, 26.0, 43.0, 21.0, 29.0, 41.0, 24.0, 13.0, 13.0, 16.0, 11.0, 10.0, 7.0, 10.0, 7.0, 7.0, 4.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-8.546875, -8.2864990234375, -8.026123046875, -7.7657470703125, -7.50537109375, -7.2449951171875, -6.984619140625, -6.7242431640625, -6.4638671875, -6.2034912109375, -5.943115234375, -5.6827392578125, -5.42236328125, -5.1619873046875, -4.901611328125, -4.6412353515625, -4.380859375, -4.1204833984375, -3.860107421875, -3.5997314453125, -3.33935546875, -3.0789794921875, -2.818603515625, -2.5582275390625, -2.2978515625, -2.0374755859375, -1.777099609375, -1.5167236328125, -1.25634765625, -0.9959716796875, -0.735595703125, -0.4752197265625, -0.21484375, 0.0455322265625, 0.305908203125, 0.5662841796875, 0.82666015625, 1.0870361328125, 1.347412109375, 1.6077880859375, 1.8681640625, 2.1285400390625, 2.388916015625, 2.6492919921875, 2.90966796875, 3.1700439453125, 3.430419921875, 3.6907958984375, 3.951171875, 4.2115478515625, 4.471923828125, 4.7322998046875, 4.99267578125, 5.2530517578125, 5.513427734375, 5.7738037109375, 6.0341796875, 6.2945556640625, 6.554931640625, 6.8153076171875, 7.07568359375, 7.3360595703125, 7.596435546875, 7.8568115234375, 8.1171875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 19.0, 20.0, 41.0, 54.0, 81.0, 120.0, 192.0, 262.0, 415.0, 621.0, 940.0, 1511.0, 2455.0, 3966.0, 6461.0, 11046.0, 19797.0, 37157.0, 76500.0, 172742.0, 427564.0, 1036005.0, 1302501.0, 628555.0, 248436.0, 105454.0, 49958.0, 26005.0, 14232.0, 8156.0, 4864.0, 2877.0, 1896.0, 1160.0, 765.0, 479.0, 317.0, 214.0, 143.0, 96.0, 54.0, 48.0, 34.0, 13.0, 19.0, 8.0, 12.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.140625, -29.1748046875, -28.208984375, -27.2431640625, -26.27734375, -25.3115234375, -24.345703125, -23.3798828125, -22.4140625, -21.4482421875, -20.482421875, -19.5166015625, -18.55078125, -17.5849609375, -16.619140625, -15.6533203125, -14.6875, -13.7216796875, -12.755859375, -11.7900390625, -10.82421875, -9.8583984375, -8.892578125, -7.9267578125, -6.9609375, -5.9951171875, -5.029296875, -4.0634765625, -3.09765625, -2.1318359375, -1.166015625, -0.2001953125, 0.765625, 1.7314453125, 2.697265625, 3.6630859375, 4.62890625, 5.5947265625, 6.560546875, 7.5263671875, 8.4921875, 9.4580078125, 10.423828125, 11.3896484375, 12.35546875, 13.3212890625, 14.287109375, 15.2529296875, 16.21875, 17.1845703125, 18.150390625, 19.1162109375, 20.08203125, 21.0478515625, 22.013671875, 22.9794921875, 23.9453125, 24.9111328125, 25.876953125, 26.8427734375, 27.80859375, 28.7744140625, 29.740234375, 30.7060546875, 31.671875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 12.0, 15.0, 16.0, 34.0, 27.0, 39.0, 45.0, 55.0, 95.0, 109.0, 172.0, 178.0, 230.0, 244.0, 305.0, 340.0, 351.0, 350.0, 293.0, 244.0, 198.0, 136.0, 132.0, 104.0, 71.0, 55.0, 40.0, 40.0, 27.0, 19.0, 18.0, 17.0, 14.0, 10.0, 7.0, 9.0, 4.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.171875, -6.9295654296875, -6.687255859375, -6.4449462890625, -6.20263671875, -5.9603271484375, -5.718017578125, -5.4757080078125, -5.2333984375, -4.9910888671875, -4.748779296875, -4.5064697265625, -4.26416015625, -4.0218505859375, -3.779541015625, -3.5372314453125, -3.294921875, -3.0526123046875, -2.810302734375, -2.5679931640625, -2.32568359375, -2.0833740234375, -1.841064453125, -1.5987548828125, -1.3564453125, -1.1141357421875, -0.871826171875, -0.6295166015625, -0.38720703125, -0.1448974609375, 0.097412109375, 0.3397216796875, 0.58203125, 0.8243408203125, 1.066650390625, 1.3089599609375, 1.55126953125, 1.7935791015625, 2.035888671875, 2.2781982421875, 2.5205078125, 2.7628173828125, 3.005126953125, 3.2474365234375, 3.48974609375, 3.7320556640625, 3.974365234375, 4.2166748046875, 4.458984375, 4.7012939453125, 4.943603515625, 5.1859130859375, 5.42822265625, 5.6705322265625, 5.912841796875, 6.1551513671875, 6.3974609375, 6.6397705078125, 6.882080078125, 7.1243896484375, 7.36669921875, 7.6090087890625, 7.851318359375, 8.0936279296875, 8.3359375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 9.0, 4.0, 7.0, 15.0, 15.0, 21.0, 22.0, 30.0, 34.0, 46.0, 49.0, 64.0, 63.0, 61.0, 70.0, 71.0, 57.0, 56.0, 47.0, 39.0, 39.0, 32.0, 33.0, 19.0, 16.0, 15.0, 14.0, 13.0, 5.0, 3.0, 5.0, 8.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.447826385498047, -24.647003173828125, -23.846179962158203, -23.04535675048828, -22.24453353881836, -21.443710327148438, -20.642887115478516, -19.842063903808594, -19.041240692138672, -18.24041748046875, -17.439594268798828, -16.638771057128906, -15.837947845458984, -15.037124633789062, -14.23630142211914, -13.435478210449219, -12.634654998779297, -11.833831787109375, -11.033008575439453, -10.232185363769531, -9.43136215209961, -8.630538940429688, -7.829715728759766, -7.028892517089844, -6.228069305419922, -5.42724609375, -4.626422882080078, -3.8255996704101562, -3.0247764587402344, -2.2239532470703125, -1.4231300354003906, -0.6223068237304688, 0.17851829528808594, 0.9793415069580078, 1.7801647186279297, 2.5809879302978516, 3.3818111419677734, 4.182634353637695, 4.983457565307617, 5.784280776977539, 6.585103988647461, 7.385927200317383, 8.186750411987305, 8.987573623657227, 9.788396835327148, 10.58922004699707, 11.390043258666992, 12.190866470336914, 12.991689682006836, 13.792512893676758, 14.59333610534668, 15.394159317016602, 16.194982528686523, 16.995805740356445, 17.796628952026367, 18.59745216369629, 19.39827537536621, 20.199098587036133, 20.999921798706055, 21.800745010375977, 22.6015682220459, 23.40239143371582, 24.203214645385742, 25.004037857055664, 25.804861068725586]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 8.0, 12.0, 9.0, 7.0, 10.0, 15.0, 15.0, 13.0, 31.0, 16.0, 25.0, 33.0, 21.0, 22.0, 36.0, 32.0, 36.0, 40.0, 33.0, 36.0, 52.0, 37.0, 38.0, 36.0, 36.0, 34.0, 29.0, 31.0, 32.0, 28.0, 19.0, 15.0, 31.0, 13.0, 24.0, 19.0, 7.0, 7.0, 12.0, 7.0, 7.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.708602905273438, -10.358699798583984, -10.008796691894531, -9.658893585205078, -9.308990478515625, -8.959087371826172, -8.609184265136719, -8.25928020477295, -7.909377098083496, -7.559473991394043, -7.20957088470459, -6.859667778015137, -6.509764194488525, -6.159861087799072, -5.809957981109619, -5.460054397583008, -5.110151767730713, -4.76024866104126, -4.410345554351807, -4.060441970825195, -3.710538864135742, -3.360635757446289, -3.010732650756836, -2.6608293056488037, -2.3109261989593506, -1.961022973060608, -1.6111197471618652, -1.261216640472412, -0.9113134145736694, -0.5614101886749268, -0.21150708198547363, 0.1383962631225586, 0.4882993698120117, 0.8382025957107544, 1.188105821609497, 1.5380089282989502, 1.8879121541976929, 2.2378153800964355, 2.5877184867858887, 2.937621831893921, 3.287524938583374, 3.637428045272827, 3.9873313903808594, 4.3372344970703125, 4.687137603759766, 5.037040710449219, 5.386943817138672, 5.736847400665283, 6.086750507354736, 6.4366536140441895, 6.786556720733643, 7.136460304260254, 7.486363410949707, 7.83626651763916, 8.186169624328613, 8.536072731018066, 8.88597583770752, 9.235878944396973, 9.585782051086426, 9.935685157775879, 10.285588264465332, 10.635492324829102, 10.985395431518555, 11.335298538208008, 11.685201644897461]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 6.0, 11.0, 8.0, 19.0, 28.0, 52.0, 80.0, 104.0, 171.0, 273.0, 390.0, 592.0, 1022.0, 1614.0, 2505.0, 4082.0, 6533.0, 10528.0, 16583.0, 26884.0, 43193.0, 68205.0, 103074.0, 143221.0, 165996.0, 148239.0, 109478.0, 72930.0, 46417.0, 28922.0, 17791.0, 10988.0, 6894.0, 4383.0, 2710.0, 1752.0, 1004.0, 670.0, 416.0, 269.0, 175.0, 127.0, 82.0, 53.0, 25.0, 17.0, 19.0, 7.0, 11.0, 5.0, 1.0, 1.0, 1.0, 3.0], "bins": [-9.265625, -8.99761962890625, -8.7296142578125, -8.46160888671875, -8.193603515625, -7.92559814453125, -7.6575927734375, -7.38958740234375, -7.12158203125, -6.85357666015625, -6.5855712890625, -6.31756591796875, -6.049560546875, -5.78155517578125, -5.5135498046875, -5.24554443359375, -4.9775390625, -4.70953369140625, -4.4415283203125, -4.17352294921875, -3.905517578125, -3.63751220703125, -3.3695068359375, -3.10150146484375, -2.83349609375, -2.56549072265625, -2.2974853515625, -2.02947998046875, -1.761474609375, -1.49346923828125, -1.2254638671875, -0.95745849609375, -0.689453125, -0.42144775390625, -0.1534423828125, 0.11456298828125, 0.382568359375, 0.65057373046875, 0.9185791015625, 1.18658447265625, 1.45458984375, 1.72259521484375, 1.9906005859375, 2.25860595703125, 2.526611328125, 2.79461669921875, 3.0626220703125, 3.33062744140625, 3.5986328125, 3.86663818359375, 4.1346435546875, 4.40264892578125, 4.670654296875, 4.93865966796875, 5.2066650390625, 5.47467041015625, 5.74267578125, 6.01068115234375, 6.2786865234375, 6.54669189453125, 6.814697265625, 7.08270263671875, 7.3507080078125, 7.61871337890625, 7.88671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 1.0, 2.0, 8.0, 11.0, 9.0, 15.0, 16.0, 15.0, 21.0, 19.0, 26.0, 31.0, 15.0, 27.0, 29.0, 34.0, 48.0, 46.0, 45.0, 38.0, 51.0, 32.0, 43.0, 39.0, 42.0, 41.0, 37.0, 37.0, 24.0, 28.0, 32.0, 29.0, 23.0, 10.0, 11.0, 11.0, 11.0, 9.0, 15.0, 7.0, 6.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.0760498046875, -13.620849609375, -13.1656494140625, -12.71044921875, -12.2552490234375, -11.800048828125, -11.3448486328125, -10.8896484375, -10.4344482421875, -9.979248046875, -9.5240478515625, -9.06884765625, -8.6136474609375, -8.158447265625, -7.7032470703125, -7.248046875, -6.7928466796875, -6.337646484375, -5.8824462890625, -5.42724609375, -4.9720458984375, -4.516845703125, -4.0616455078125, -3.6064453125, -3.1512451171875, -2.696044921875, -2.2408447265625, -1.78564453125, -1.3304443359375, -0.875244140625, -0.4200439453125, 0.03515625, 0.4903564453125, 0.945556640625, 1.4007568359375, 1.85595703125, 2.3111572265625, 2.766357421875, 3.2215576171875, 3.6767578125, 4.1319580078125, 4.587158203125, 5.0423583984375, 5.49755859375, 5.9527587890625, 6.407958984375, 6.8631591796875, 7.318359375, 7.7735595703125, 8.228759765625, 8.6839599609375, 9.13916015625, 9.5943603515625, 10.049560546875, 10.5047607421875, 10.9599609375, 11.4151611328125, 11.870361328125, 12.3255615234375, 12.78076171875, 13.2359619140625, 13.691162109375, 14.1463623046875, 14.6015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 8.0, 10.0, 15.0, 13.0, 38.0, 39.0, 78.0, 100.0, 150.0, 176.0, 262.0, 360.0, 493.0, 795.0, 1075.0, 1569.0, 2320.0, 3388.0, 5233.0, 7959.0, 12989.0, 20994.0, 34490.0, 56805.0, 91906.0, 142709.0, 186567.0, 169408.0, 116961.0, 73402.0, 44425.0, 27172.0, 16558.0, 10325.0, 6603.0, 4131.0, 2884.0, 1855.0, 1237.0, 866.0, 641.0, 438.0, 307.0, 227.0, 175.0, 124.0, 94.0, 64.0, 42.0, 25.0, 22.0, 14.0, 7.0, 6.0, 2.0, 4.0, 1.0], "bins": [-10.9453125, -10.62109375, -10.296875, -9.97265625, -9.6484375, -9.32421875, -9.0, -8.67578125, -8.3515625, -8.02734375, -7.703125, -7.37890625, -7.0546875, -6.73046875, -6.40625, -6.08203125, -5.7578125, -5.43359375, -5.109375, -4.78515625, -4.4609375, -4.13671875, -3.8125, -3.48828125, -3.1640625, -2.83984375, -2.515625, -2.19140625, -1.8671875, -1.54296875, -1.21875, -0.89453125, -0.5703125, -0.24609375, 0.078125, 0.40234375, 0.7265625, 1.05078125, 1.375, 1.69921875, 2.0234375, 2.34765625, 2.671875, 2.99609375, 3.3203125, 3.64453125, 3.96875, 4.29296875, 4.6171875, 4.94140625, 5.265625, 5.58984375, 5.9140625, 6.23828125, 6.5625, 6.88671875, 7.2109375, 7.53515625, 7.859375, 8.18359375, 8.5078125, 8.83203125, 9.15625, 9.48046875, 9.8046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 4.0, 9.0, 9.0, 7.0, 14.0, 8.0, 11.0, 24.0, 15.0, 14.0, 25.0, 27.0, 37.0, 31.0, 25.0, 30.0, 41.0, 35.0, 37.0, 30.0, 36.0, 25.0, 31.0, 43.0, 39.0, 31.0, 39.0, 26.0, 22.0, 29.0, 29.0, 35.0, 25.0, 22.0, 15.0, 19.0, 17.0, 15.0, 14.0, 10.0, 3.0, 9.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-8.140625, -7.90020751953125, -7.6597900390625, -7.41937255859375, -7.178955078125, -6.93853759765625, -6.6981201171875, -6.45770263671875, -6.21728515625, -5.97686767578125, -5.7364501953125, -5.49603271484375, -5.255615234375, -5.01519775390625, -4.7747802734375, -4.53436279296875, -4.2939453125, -4.05352783203125, -3.8131103515625, -3.57269287109375, -3.332275390625, -3.09185791015625, -2.8514404296875, -2.61102294921875, -2.37060546875, -2.13018798828125, -1.8897705078125, -1.64935302734375, -1.408935546875, -1.16851806640625, -0.9281005859375, -0.68768310546875, -0.447265625, -0.20684814453125, 0.0335693359375, 0.27398681640625, 0.514404296875, 0.75482177734375, 0.9952392578125, 1.23565673828125, 1.47607421875, 1.71649169921875, 1.9569091796875, 2.19732666015625, 2.437744140625, 2.67816162109375, 2.9185791015625, 3.15899658203125, 3.3994140625, 3.63983154296875, 3.8802490234375, 4.12066650390625, 4.361083984375, 4.60150146484375, 4.8419189453125, 5.08233642578125, 5.32275390625, 5.56317138671875, 5.8035888671875, 6.04400634765625, 6.284423828125, 6.52484130859375, 6.7652587890625, 7.00567626953125, 7.24609375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 6.0, 8.0, 10.0, 12.0, 21.0, 39.0, 39.0, 88.0, 125.0, 246.0, 420.0, 767.0, 1490.0, 2730.0, 5229.0, 10250.0, 21736.0, 48052.0, 110235.0, 240599.0, 307740.0, 164736.0, 72136.0, 31741.0, 14937.0, 7176.0, 3607.0, 1976.0, 1019.0, 611.0, 308.0, 181.0, 115.0, 73.0, 44.0, 25.0, 11.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.049072265625, -4.86376953125, -4.678466796875, -4.4931640625, -4.307861328125, -4.12255859375, -3.937255859375, -3.751953125, -3.566650390625, -3.38134765625, -3.196044921875, -3.0107421875, -2.825439453125, -2.64013671875, -2.454833984375, -2.26953125, -2.084228515625, -1.89892578125, -1.713623046875, -1.5283203125, -1.343017578125, -1.15771484375, -0.972412109375, -0.787109375, -0.601806640625, -0.41650390625, -0.231201171875, -0.0458984375, 0.139404296875, 0.32470703125, 0.510009765625, 0.6953125, 0.880615234375, 1.06591796875, 1.251220703125, 1.4365234375, 1.621826171875, 1.80712890625, 1.992431640625, 2.177734375, 2.363037109375, 2.54833984375, 2.733642578125, 2.9189453125, 3.104248046875, 3.28955078125, 3.474853515625, 3.66015625, 3.845458984375, 4.03076171875, 4.216064453125, 4.4013671875, 4.586669921875, 4.77197265625, 4.957275390625, 5.142578125, 5.327880859375, 5.51318359375, 5.698486328125, 5.8837890625, 6.069091796875, 6.25439453125, 6.439697265625, 6.625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 10.0, 1.0, 7.0, 7.0, 12.0, 17.0, 13.0, 18.0, 16.0, 24.0, 21.0, 31.0, 52.0, 30.0, 46.0, 49.0, 62.0, 43.0, 50.0, 58.0, 47.0, 57.0, 47.0, 40.0, 35.0, 38.0, 28.0, 34.0, 20.0, 16.0, 21.0, 13.0, 4.0, 3.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022029876708984375, -0.00021200254559516907, -0.00020370632410049438, -0.0001954101026058197, -0.00018711388111114502, -0.00017881765961647034, -0.00017052143812179565, -0.00016222521662712097, -0.0001539289951324463, -0.0001456327736377716, -0.00013733655214309692, -0.00012904033064842224, -0.00012074410915374756, -0.00011244788765907288, -0.0001041516661643982, -9.585544466972351e-05, -8.755922317504883e-05, -7.926300168037415e-05, -7.096678018569946e-05, -6.267055869102478e-05, -5.43743371963501e-05, -4.6078115701675415e-05, -3.778189420700073e-05, -2.948567271232605e-05, -2.1189451217651367e-05, -1.2893229722976685e-05, -4.597008228302002e-06, 3.6992132663726807e-06, 1.1995434761047363e-05, 2.0291656255722046e-05, 2.858787775039673e-05, 3.688409924507141e-05, 4.5180320739746094e-05, 5.3476542234420776e-05, 6.177276372909546e-05, 7.006898522377014e-05, 7.836520671844482e-05, 8.666142821311951e-05, 9.495764970779419e-05, 0.00010325387120246887, 0.00011155009269714355, 0.00011984631419181824, 0.00012814253568649292, 0.0001364387571811676, 0.00014473497867584229, 0.00015303120017051697, 0.00016132742166519165, 0.00016962364315986633, 0.00017791986465454102, 0.0001862160861492157, 0.00019451230764389038, 0.00020280852913856506, 0.00021110475063323975, 0.00021940097212791443, 0.0002276971936225891, 0.0002359934151172638, 0.0002442896366119385, 0.00025258585810661316, 0.00026088207960128784, 0.0002691783010959625, 0.0002774745225906372, 0.0002857707440853119, 0.00029406696557998657, 0.00030236318707466125, 0.00031065940856933594]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 11.0, 10.0, 23.0, 48.0, 72.0, 110.0, 135.0, 227.0, 333.0, 472.0, 751.0, 1168.0, 1811.0, 2839.0, 4731.0, 7748.0, 13070.0, 21623.0, 36817.0, 62274.0, 101260.0, 151602.0, 182473.0, 163745.0, 115738.0, 72532.0, 42676.0, 25442.0, 15042.0, 9008.0, 5477.0, 3396.0, 2054.0, 1336.0, 898.0, 544.0, 371.0, 227.0, 132.0, 104.0, 82.0, 49.0, 35.0, 18.0, 16.0, 8.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.02734375, -3.90008544921875, -3.7728271484375, -3.64556884765625, -3.518310546875, -3.39105224609375, -3.2637939453125, -3.13653564453125, -3.00927734375, -2.88201904296875, -2.7547607421875, -2.62750244140625, -2.500244140625, -2.37298583984375, -2.2457275390625, -2.11846923828125, -1.9912109375, -1.86395263671875, -1.7366943359375, -1.60943603515625, -1.482177734375, -1.35491943359375, -1.2276611328125, -1.10040283203125, -0.97314453125, -0.84588623046875, -0.7186279296875, -0.59136962890625, -0.464111328125, -0.33685302734375, -0.2095947265625, -0.08233642578125, 0.044921875, 0.17218017578125, 0.2994384765625, 0.42669677734375, 0.553955078125, 0.68121337890625, 0.8084716796875, 0.93572998046875, 1.06298828125, 1.19024658203125, 1.3175048828125, 1.44476318359375, 1.572021484375, 1.69927978515625, 1.8265380859375, 1.95379638671875, 2.0810546875, 2.20831298828125, 2.3355712890625, 2.46282958984375, 2.590087890625, 2.71734619140625, 2.8446044921875, 2.97186279296875, 3.09912109375, 3.22637939453125, 3.3536376953125, 3.48089599609375, 3.608154296875, 3.73541259765625, 3.8626708984375, 3.98992919921875, 4.1171875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 6.0, 1.0, 7.0, 10.0, 15.0, 25.0, 24.0, 24.0, 31.0, 29.0, 41.0, 47.0, 57.0, 62.0, 65.0, 54.0, 58.0, 56.0, 38.0, 47.0, 57.0, 52.0, 35.0, 24.0, 30.0, 22.0, 25.0, 12.0, 6.0, 9.0, 6.0, 7.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2919921875, -1.2513885498046875, -1.210784912109375, -1.1701812744140625, -1.12957763671875, -1.0889739990234375, -1.048370361328125, -1.0077667236328125, -0.9671630859375, -0.9265594482421875, -0.885955810546875, -0.8453521728515625, -0.80474853515625, -0.7641448974609375, -0.723541259765625, -0.6829376220703125, -0.642333984375, -0.6017303466796875, -0.561126708984375, -0.5205230712890625, -0.47991943359375, -0.4393157958984375, -0.398712158203125, -0.3581085205078125, -0.3175048828125, -0.2769012451171875, -0.236297607421875, -0.1956939697265625, -0.15509033203125, -0.1144866943359375, -0.073883056640625, -0.0332794189453125, 0.00732421875, 0.0479278564453125, 0.088531494140625, 0.1291351318359375, 0.16973876953125, 0.2103424072265625, 0.250946044921875, 0.2915496826171875, 0.3321533203125, 0.3727569580078125, 0.413360595703125, 0.4539642333984375, 0.49456787109375, 0.5351715087890625, 0.575775146484375, 0.6163787841796875, 0.656982421875, 0.6975860595703125, 0.738189697265625, 0.7787933349609375, 0.81939697265625, 0.8600006103515625, 0.900604248046875, 0.9412078857421875, 0.9818115234375, 1.0224151611328125, 1.063018798828125, 1.1036224365234375, 1.14422607421875, 1.1848297119140625, 1.225433349609375, 1.2660369873046875, 1.306640625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 7.0, 7.0, 7.0, 17.0, 18.0, 27.0, 24.0, 37.0, 37.0, 44.0, 64.0, 64.0, 56.0, 75.0, 80.0, 69.0, 51.0, 50.0, 41.0, 40.0, 31.0, 33.0, 24.0, 19.0, 11.0, 13.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.555706024169922, -24.733627319335938, -23.911548614501953, -23.08946990966797, -22.267393112182617, -21.445314407348633, -20.62323570251465, -19.801156997680664, -18.979080200195312, -18.157001495361328, -17.334922790527344, -16.51284408569336, -15.690767288208008, -14.868688583374023, -14.046609878540039, -13.224531173706055, -12.40245246887207, -11.580373764038086, -10.758296012878418, -9.936217308044434, -9.114139556884766, -8.292060852050781, -7.469982147216797, -6.647903919219971, -5.8258256912231445, -5.003747463226318, -4.181669235229492, -3.359590530395508, -2.5375123023986816, -1.7154340744018555, -0.8933553695678711, -0.07127714157104492, 0.7508029937744141, 1.5728813409805298, 2.3949596881866455, 3.217038154602051, 4.039116382598877, 4.861194610595703, 5.6832733154296875, 6.505351543426514, 7.32742977142334, 8.149508476257324, 8.971586227416992, 9.793664932250977, 10.615743637084961, 11.437821388244629, 12.259900093078613, 13.081977844238281, 13.904056549072266, 14.72613525390625, 15.548213005065918, 16.37029266357422, 17.19236946105957, 18.014448165893555, 18.83652687072754, 19.658605575561523, 20.480682373046875, 21.30276107788086, 22.124839782714844, 22.946918487548828, 23.76899528503418, 24.591073989868164, 25.41315269470215, 26.235231399536133, 27.057310104370117]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 6.0, 8.0, 7.0, 6.0, 12.0, 8.0, 5.0, 15.0, 22.0, 11.0, 23.0, 24.0, 22.0, 30.0, 25.0, 25.0, 32.0, 30.0, 36.0, 39.0, 37.0, 42.0, 45.0, 44.0, 38.0, 44.0, 30.0, 33.0, 28.0, 37.0, 29.0, 33.0, 15.0, 22.0, 26.0, 18.0, 20.0, 15.0, 9.0, 11.0, 8.0, 6.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.9366455078125, -10.581901550292969, -10.227157592773438, -9.872413635253906, -9.517669677734375, -9.162925720214844, -8.808181762695312, -8.453437805175781, -8.09869384765625, -7.743949890136719, -7.3892059326171875, -7.034461975097656, -6.679718017578125, -6.324974060058594, -5.9702301025390625, -5.615486145019531, -5.260741710662842, -4.9059977531433105, -4.551253795623779, -4.196509838104248, -3.841765880584717, -3.4870219230651855, -3.132277727127075, -2.777533769607544, -2.4227898120880127, -2.0680458545684814, -1.7133018970489502, -1.3585578203201294, -1.0038138628005981, -0.6490699052810669, -0.2943258285522461, 0.060418128967285156, 0.4151620864868164, 0.7699060440063477, 1.124650001525879, 1.4793940782546997, 1.834138035774231, 2.1888818740844727, 2.543626070022583, 2.8983700275421143, 3.2531139850616455, 3.6078579425811768, 3.962601900100708, 4.317346096038818, 4.67209005355835, 5.026834011077881, 5.381577968597412, 5.736321926116943, 6.091065883636475, 6.445809841156006, 6.800553798675537, 7.155297756195068, 7.5100417137146, 7.864785671234131, 8.21953010559082, 8.574274063110352, 8.929018020629883, 9.283761978149414, 9.638505935668945, 9.993249893188477, 10.347993850708008, 10.702737808227539, 11.05748176574707, 11.412225723266602, 11.766969680786133]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 10.0, 7.0, 20.0, 34.0, 49.0, 84.0, 138.0, 231.0, 449.0, 802.0, 1488.0, 2742.0, 5180.0, 9959.0, 19488.0, 37824.0, 72366.0, 129224.0, 194359.0, 212137.0, 159983.0, 95271.0, 51515.0, 26454.0, 13637.0, 7094.0, 3668.0, 1859.0, 1100.0, 599.0, 328.0, 173.0, 107.0, 76.0, 36.0, 25.0, 10.0, 11.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.3916015625, -16.673828125, -15.9560546875, -15.23828125, -14.5205078125, -13.802734375, -13.0849609375, -12.3671875, -11.6494140625, -10.931640625, -10.2138671875, -9.49609375, -8.7783203125, -8.060546875, -7.3427734375, -6.625, -5.9072265625, -5.189453125, -4.4716796875, -3.75390625, -3.0361328125, -2.318359375, -1.6005859375, -0.8828125, -0.1650390625, 0.552734375, 1.2705078125, 1.98828125, 2.7060546875, 3.423828125, 4.1416015625, 4.859375, 5.5771484375, 6.294921875, 7.0126953125, 7.73046875, 8.4482421875, 9.166015625, 9.8837890625, 10.6015625, 11.3193359375, 12.037109375, 12.7548828125, 13.47265625, 14.1904296875, 14.908203125, 15.6259765625, 16.34375, 17.0615234375, 17.779296875, 18.4970703125, 19.21484375, 19.9326171875, 20.650390625, 21.3681640625, 22.0859375, 22.8037109375, 23.521484375, 24.2392578125, 24.95703125, 25.6748046875, 26.392578125, 27.1103515625, 27.828125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 4.0, 7.0, 14.0, 17.0, 9.0, 17.0, 25.0, 26.0, 32.0, 33.0, 34.0, 35.0, 47.0, 47.0, 55.0, 49.0, 52.0, 64.0, 49.0, 51.0, 41.0, 46.0, 41.0, 40.0, 29.0, 19.0, 24.0, 11.0, 22.0, 11.0, 12.0, 6.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.2271728515625, -12.712158203125, -12.1971435546875, -11.68212890625, -11.1671142578125, -10.652099609375, -10.1370849609375, -9.6220703125, -9.1070556640625, -8.592041015625, -8.0770263671875, -7.56201171875, -7.0469970703125, -6.531982421875, -6.0169677734375, -5.501953125, -4.9869384765625, -4.471923828125, -3.9569091796875, -3.44189453125, -2.9268798828125, -2.411865234375, -1.8968505859375, -1.3818359375, -0.8668212890625, -0.351806640625, 0.1632080078125, 0.67822265625, 1.1932373046875, 1.708251953125, 2.2232666015625, 2.73828125, 3.2532958984375, 3.768310546875, 4.2833251953125, 4.79833984375, 5.3133544921875, 5.828369140625, 6.3433837890625, 6.8583984375, 7.3734130859375, 7.888427734375, 8.4034423828125, 8.91845703125, 9.4334716796875, 9.948486328125, 10.4635009765625, 10.978515625, 11.4935302734375, 12.008544921875, 12.5235595703125, 13.03857421875, 13.5535888671875, 14.068603515625, 14.5836181640625, 15.0986328125, 15.6136474609375, 16.128662109375, 16.6436767578125, 17.15869140625, 17.6737060546875, 18.188720703125, 18.7037353515625, 19.21875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 9.0, 10.0, 10.0, 16.0, 31.0, 43.0, 50.0, 81.0, 137.0, 176.0, 244.0, 431.0, 655.0, 1096.0, 1768.0, 2692.0, 4593.0, 7528.0, 12824.0, 21552.0, 36137.0, 58430.0, 91425.0, 130338.0, 159247.0, 157719.0, 127942.0, 89520.0, 56859.0, 34742.0, 20928.0, 12507.0, 7345.0, 4345.0, 2624.0, 1623.0, 1070.0, 640.0, 401.0, 257.0, 176.0, 95.0, 84.0, 49.0, 34.0, 32.0, 15.0, 12.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.640625, -16.103271484375, -15.56591796875, -15.028564453125, -14.4912109375, -13.953857421875, -13.41650390625, -12.879150390625, -12.341796875, -11.804443359375, -11.26708984375, -10.729736328125, -10.1923828125, -9.655029296875, -9.11767578125, -8.580322265625, -8.04296875, -7.505615234375, -6.96826171875, -6.430908203125, -5.8935546875, -5.356201171875, -4.81884765625, -4.281494140625, -3.744140625, -3.206787109375, -2.66943359375, -2.132080078125, -1.5947265625, -1.057373046875, -0.52001953125, 0.017333984375, 0.5546875, 1.092041015625, 1.62939453125, 2.166748046875, 2.7041015625, 3.241455078125, 3.77880859375, 4.316162109375, 4.853515625, 5.390869140625, 5.92822265625, 6.465576171875, 7.0029296875, 7.540283203125, 8.07763671875, 8.614990234375, 9.15234375, 9.689697265625, 10.22705078125, 10.764404296875, 11.3017578125, 11.839111328125, 12.37646484375, 12.913818359375, 13.451171875, 13.988525390625, 14.52587890625, 15.063232421875, 15.6005859375, 16.137939453125, 16.67529296875, 17.212646484375, 17.75]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 6.0, 2.0, 9.0, 9.0, 14.0, 21.0, 27.0, 18.0, 24.0, 20.0, 32.0, 35.0, 37.0, 38.0, 47.0, 40.0, 38.0, 39.0, 46.0, 50.0, 52.0, 36.0, 37.0, 39.0, 41.0, 31.0, 34.0, 31.0, 20.0, 24.0, 21.0, 19.0, 7.0, 7.0, 10.0, 7.0, 6.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.1484375, -9.869873046875, -9.59130859375, -9.312744140625, -9.0341796875, -8.755615234375, -8.47705078125, -8.198486328125, -7.919921875, -7.641357421875, -7.36279296875, -7.084228515625, -6.8056640625, -6.527099609375, -6.24853515625, -5.969970703125, -5.69140625, -5.412841796875, -5.13427734375, -4.855712890625, -4.5771484375, -4.298583984375, -4.02001953125, -3.741455078125, -3.462890625, -3.184326171875, -2.90576171875, -2.627197265625, -2.3486328125, -2.070068359375, -1.79150390625, -1.512939453125, -1.234375, -0.955810546875, -0.67724609375, -0.398681640625, -0.1201171875, 0.158447265625, 0.43701171875, 0.715576171875, 0.994140625, 1.272705078125, 1.55126953125, 1.829833984375, 2.1083984375, 2.386962890625, 2.66552734375, 2.944091796875, 3.22265625, 3.501220703125, 3.77978515625, 4.058349609375, 4.3369140625, 4.615478515625, 4.89404296875, 5.172607421875, 5.451171875, 5.729736328125, 6.00830078125, 6.286865234375, 6.5654296875, 6.843994140625, 7.12255859375, 7.401123046875, 7.6796875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 2.0, 5.0, 3.0, 6.0, 9.0, 20.0, 11.0, 38.0, 39.0, 53.0, 65.0, 117.0, 171.0, 248.0, 389.0, 566.0, 879.0, 1264.0, 2104.0, 3368.0, 5531.0, 9089.0, 15358.0, 26618.0, 46491.0, 80911.0, 133196.0, 187871.0, 190885.0, 138996.0, 85266.0, 49098.0, 28163.0, 16397.0, 9691.0, 5835.0, 3530.0, 2208.0, 1387.0, 889.0, 598.0, 384.0, 242.0, 168.0, 129.0, 80.0, 59.0, 39.0, 34.0, 17.0, 22.0, 8.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-9.8828125, -9.574462890625, -9.26611328125, -8.957763671875, -8.6494140625, -8.341064453125, -8.03271484375, -7.724365234375, -7.416015625, -7.107666015625, -6.79931640625, -6.490966796875, -6.1826171875, -5.874267578125, -5.56591796875, -5.257568359375, -4.94921875, -4.640869140625, -4.33251953125, -4.024169921875, -3.7158203125, -3.407470703125, -3.09912109375, -2.790771484375, -2.482421875, -2.174072265625, -1.86572265625, -1.557373046875, -1.2490234375, -0.940673828125, -0.63232421875, -0.323974609375, -0.015625, 0.292724609375, 0.60107421875, 0.909423828125, 1.2177734375, 1.526123046875, 1.83447265625, 2.142822265625, 2.451171875, 2.759521484375, 3.06787109375, 3.376220703125, 3.6845703125, 3.992919921875, 4.30126953125, 4.609619140625, 4.91796875, 5.226318359375, 5.53466796875, 5.843017578125, 6.1513671875, 6.459716796875, 6.76806640625, 7.076416015625, 7.384765625, 7.693115234375, 8.00146484375, 8.309814453125, 8.6181640625, 8.926513671875, 9.23486328125, 9.543212890625, 9.8515625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 12.0, 5.0, 7.0, 14.0, 16.0, 24.0, 24.0, 36.0, 39.0, 52.0, 63.0, 66.0, 72.0, 67.0, 78.0, 75.0, 72.0, 51.0, 44.0, 40.0, 24.0, 26.0, 22.0, 14.0, 13.0, 7.0, 7.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010194778442382812, -0.0009839534759521484, -0.0009484291076660156, -0.0009129047393798828, -0.00087738037109375, -0.0008418560028076172, -0.0008063316345214844, -0.0007708072662353516, -0.0007352828979492188, -0.0006997585296630859, -0.0006642341613769531, -0.0006287097930908203, -0.0005931854248046875, -0.0005576610565185547, -0.0005221366882324219, -0.00048661231994628906, -0.00045108795166015625, -0.00041556358337402344, -0.0003800392150878906, -0.0003445148468017578, -0.000308990478515625, -0.0002734661102294922, -0.00023794174194335938, -0.00020241737365722656, -0.00016689300537109375, -0.00013136863708496094, -9.584426879882812e-05, -6.031990051269531e-05, -2.47955322265625e-05, 1.0728836059570312e-05, 4.6253204345703125e-05, 8.177757263183594e-05, 0.00011730194091796875, 0.00015282630920410156, 0.00018835067749023438, 0.0002238750457763672, 0.0002593994140625, 0.0002949237823486328, 0.0003304481506347656, 0.00036597251892089844, 0.00040149688720703125, 0.00043702125549316406, 0.0004725456237792969, 0.0005080699920654297, 0.0005435943603515625, 0.0005791187286376953, 0.0006146430969238281, 0.0006501674652099609, 0.0006856918334960938, 0.0007212162017822266, 0.0007567405700683594, 0.0007922649383544922, 0.000827789306640625, 0.0008633136749267578, 0.0008988380432128906, 0.0009343624114990234, 0.0009698867797851562, 0.001005411148071289, 0.0010409355163574219, 0.0010764598846435547, 0.0011119842529296875, 0.0011475086212158203, 0.0011830329895019531, 0.001218557357788086, 0.0012540817260742188]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 12.0, 10.0, 12.0, 14.0, 21.0, 43.0, 41.0, 86.0, 111.0, 134.0, 188.0, 225.0, 366.0, 493.0, 742.0, 1049.0, 1493.0, 2277.0, 3376.0, 5444.0, 8563.0, 14185.0, 23690.0, 41421.0, 73108.0, 120616.0, 174719.0, 191127.0, 150579.0, 96073.0, 56547.0, 32069.0, 18698.0, 11016.0, 6800.0, 4271.0, 2850.0, 1843.0, 1211.0, 889.0, 637.0, 443.0, 310.0, 204.0, 162.0, 105.0, 67.0, 68.0, 52.0, 29.0, 28.0, 13.0, 8.0, 12.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-9.96875, -9.6597900390625, -9.350830078125, -9.0418701171875, -8.73291015625, -8.4239501953125, -8.114990234375, -7.8060302734375, -7.4970703125, -7.1881103515625, -6.879150390625, -6.5701904296875, -6.26123046875, -5.9522705078125, -5.643310546875, -5.3343505859375, -5.025390625, -4.7164306640625, -4.407470703125, -4.0985107421875, -3.78955078125, -3.4805908203125, -3.171630859375, -2.8626708984375, -2.5537109375, -2.2447509765625, -1.935791015625, -1.6268310546875, -1.31787109375, -1.0089111328125, -0.699951171875, -0.3909912109375, -0.08203125, 0.2269287109375, 0.535888671875, 0.8448486328125, 1.15380859375, 1.4627685546875, 1.771728515625, 2.0806884765625, 2.3896484375, 2.6986083984375, 3.007568359375, 3.3165283203125, 3.62548828125, 3.9344482421875, 4.243408203125, 4.5523681640625, 4.861328125, 5.1702880859375, 5.479248046875, 5.7882080078125, 6.09716796875, 6.4061279296875, 6.715087890625, 7.0240478515625, 7.3330078125, 7.6419677734375, 7.950927734375, 8.2598876953125, 8.56884765625, 8.8778076171875, 9.186767578125, 9.4957275390625, 9.8046875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 11.0, 20.0, 20.0, 18.0, 47.0, 32.0, 40.0, 50.0, 43.0, 58.0, 60.0, 60.0, 65.0, 55.0, 55.0, 54.0, 42.0, 43.0, 38.0, 30.0, 24.0, 19.0, 22.0, 18.0, 9.0, 12.0, 7.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.982421875, -2.89495849609375, -2.8074951171875, -2.72003173828125, -2.632568359375, -2.54510498046875, -2.4576416015625, -2.37017822265625, -2.28271484375, -2.19525146484375, -2.1077880859375, -2.02032470703125, -1.932861328125, -1.84539794921875, -1.7579345703125, -1.67047119140625, -1.5830078125, -1.49554443359375, -1.4080810546875, -1.32061767578125, -1.233154296875, -1.14569091796875, -1.0582275390625, -0.97076416015625, -0.88330078125, -0.79583740234375, -0.7083740234375, -0.62091064453125, -0.533447265625, -0.44598388671875, -0.3585205078125, -0.27105712890625, -0.18359375, -0.09613037109375, -0.0086669921875, 0.07879638671875, 0.166259765625, 0.25372314453125, 0.3411865234375, 0.42864990234375, 0.51611328125, 0.60357666015625, 0.6910400390625, 0.77850341796875, 0.865966796875, 0.95343017578125, 1.0408935546875, 1.12835693359375, 1.2158203125, 1.30328369140625, 1.3907470703125, 1.47821044921875, 1.565673828125, 1.65313720703125, 1.7406005859375, 1.82806396484375, 1.91552734375, 2.00299072265625, 2.0904541015625, 2.17791748046875, 2.265380859375, 2.35284423828125, 2.4403076171875, 2.52777099609375, 2.615234375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 9.0, 14.0, 15.0, 17.0, 29.0, 28.0, 39.0, 46.0, 43.0, 55.0, 69.0, 62.0, 69.0, 61.0, 49.0, 56.0, 63.0, 42.0, 42.0, 36.0, 30.0, 19.0, 14.0, 14.0, 11.0, 7.0, 10.0, 13.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.586084365844727, -25.78007698059082, -24.97406768798828, -24.168060302734375, -23.362051010131836, -22.55604362487793, -21.75003433227539, -20.944026947021484, -20.138019561767578, -19.332012176513672, -18.526002883911133, -17.719995498657227, -16.913986206054688, -16.10797882080078, -15.301970481872559, -14.495962142944336, -13.689952850341797, -12.883944511413574, -12.077936172485352, -11.271928787231445, -10.465919494628906, -9.659912109375, -8.853903770446777, -8.047895431518555, -7.241887092590332, -6.435878753662109, -5.629870414733887, -4.823862552642822, -4.0178542137146, -3.211845874786377, -2.4058380126953125, -1.5998296737670898, -0.7938213348388672, 0.012186884880065918, 0.818195104598999, 1.6242032051086426, 2.4302115440368652, 3.236219882965088, 4.042227745056152, 4.848236083984375, 5.654244422912598, 6.46025276184082, 7.266261100769043, 8.072269439697266, 8.878276824951172, 9.684286117553711, 10.490293502807617, 11.29630184173584, 12.102310180664062, 12.908318519592285, 13.714326858520508, 14.520334243774414, 15.326343536376953, 16.13235092163086, 16.938358306884766, 17.744367599487305, 18.550376892089844, 19.35638427734375, 20.16239356994629, 20.968400955200195, 21.774410247802734, 22.58041763305664, 23.386425018310547, 24.192434310913086, 24.998441696166992]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 8.0, 6.0, 9.0, 4.0, 5.0, 8.0, 10.0, 11.0, 15.0, 20.0, 22.0, 25.0, 14.0, 21.0, 28.0, 27.0, 30.0, 33.0, 46.0, 36.0, 35.0, 35.0, 47.0, 42.0, 44.0, 41.0, 37.0, 22.0, 34.0, 39.0, 31.0, 24.0, 26.0, 20.0, 20.0, 20.0, 19.0, 12.0, 8.0, 18.0, 9.0, 7.0, 8.0, 7.0, 4.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.53162956237793, -11.173201560974121, -10.814773559570312, -10.456345558166504, -10.097917556762695, -9.73948860168457, -9.381060600280762, -9.022632598876953, -8.664204597473145, -8.305776596069336, -7.947348594665527, -7.5889201164245605, -7.230492115020752, -6.872064113616943, -6.513635635375977, -6.155207633972168, -5.796779632568359, -5.438351631164551, -5.079923629760742, -4.721495151519775, -4.363067150115967, -4.004639148712158, -3.6462109088897705, -3.287782669067383, -2.929354667663574, -2.5709266662597656, -2.212498426437378, -1.8540703058242798, -1.4956421852111816, -1.1372140645980835, -0.7787859439849854, -0.42035770416259766, -0.06193065643310547, 0.2964974641799927, 0.6549255847930908, 1.013353705406189, 1.371781826019287, 1.7302099466323853, 2.0886380672454834, 2.447066307067871, 2.8054943084716797, 3.1639223098754883, 3.522350549697876, 3.8807787895202637, 4.239206790924072, 4.597634792327881, 4.956063270568848, 5.314491271972656, 5.672919273376465, 6.031347274780273, 6.389775276184082, 6.748203754425049, 7.106631755828857, 7.465059757232666, 7.823488235473633, 8.181916236877441, 8.54034423828125, 8.898772239685059, 9.257200241088867, 9.615628242492676, 9.974056243896484, 10.33248519897461, 10.690913200378418, 11.049341201782227, 11.407769203186035]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 10.0, 15.0, 16.0, 39.0, 59.0, 63.0, 84.0, 120.0, 200.0, 263.0, 442.0, 657.0, 959.0, 1489.0, 2370.0, 3817.0, 6401.0, 11086.0, 20727.0, 40907.0, 87016.0, 202355.0, 506477.0, 1131189.0, 1206890.0, 562011.0, 220409.0, 93614.0, 43576.0, 21949.0, 11726.0, 6697.0, 3803.0, 2432.0, 1518.0, 976.0, 602.0, 446.0, 288.0, 175.0, 113.0, 93.0, 75.0, 38.0, 25.0, 25.0, 14.0, 9.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-27.03125, -26.06787109375, -25.1044921875, -24.14111328125, -23.177734375, -22.21435546875, -21.2509765625, -20.28759765625, -19.32421875, -18.36083984375, -17.3974609375, -16.43408203125, -15.470703125, -14.50732421875, -13.5439453125, -12.58056640625, -11.6171875, -10.65380859375, -9.6904296875, -8.72705078125, -7.763671875, -6.80029296875, -5.8369140625, -4.87353515625, -3.91015625, -2.94677734375, -1.9833984375, -1.02001953125, -0.056640625, 0.90673828125, 1.8701171875, 2.83349609375, 3.796875, 4.76025390625, 5.7236328125, 6.68701171875, 7.650390625, 8.61376953125, 9.5771484375, 10.54052734375, 11.50390625, 12.46728515625, 13.4306640625, 14.39404296875, 15.357421875, 16.32080078125, 17.2841796875, 18.24755859375, 19.2109375, 20.17431640625, 21.1376953125, 22.10107421875, 23.064453125, 24.02783203125, 24.9912109375, 25.95458984375, 26.91796875, 27.88134765625, 28.8447265625, 29.80810546875, 30.771484375, 31.73486328125, 32.6982421875, 33.66162109375, 34.625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 10.0, 8.0, 10.0, 9.0, 17.0, 5.0, 11.0, 13.0, 17.0, 21.0, 20.0, 15.0, 23.0, 30.0, 19.0, 33.0, 35.0, 39.0, 32.0, 42.0, 46.0, 41.0, 30.0, 34.0, 35.0, 55.0, 33.0, 42.0, 26.0, 29.0, 17.0, 27.0, 16.0, 30.0, 20.0, 16.0, 8.0, 15.0, 12.0, 8.0, 4.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.515625, -9.224365234375, -8.93310546875, -8.641845703125, -8.3505859375, -8.059326171875, -7.76806640625, -7.476806640625, -7.185546875, -6.894287109375, -6.60302734375, -6.311767578125, -6.0205078125, -5.729248046875, -5.43798828125, -5.146728515625, -4.85546875, -4.564208984375, -4.27294921875, -3.981689453125, -3.6904296875, -3.399169921875, -3.10791015625, -2.816650390625, -2.525390625, -2.234130859375, -1.94287109375, -1.651611328125, -1.3603515625, -1.069091796875, -0.77783203125, -0.486572265625, -0.1953125, 0.095947265625, 0.38720703125, 0.678466796875, 0.9697265625, 1.260986328125, 1.55224609375, 1.843505859375, 2.134765625, 2.426025390625, 2.71728515625, 3.008544921875, 3.2998046875, 3.591064453125, 3.88232421875, 4.173583984375, 4.46484375, 4.756103515625, 5.04736328125, 5.338623046875, 5.6298828125, 5.921142578125, 6.21240234375, 6.503662109375, 6.794921875, 7.086181640625, 7.37744140625, 7.668701171875, 7.9599609375, 8.251220703125, 8.54248046875, 8.833740234375, 9.125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 8.0, 6.0, 10.0, 12.0, 16.0, 35.0, 37.0, 54.0, 77.0, 90.0, 179.0, 214.0, 294.0, 416.0, 654.0, 1005.0, 1597.0, 2577.0, 4284.0, 7173.0, 12487.0, 23043.0, 44672.0, 90940.0, 199664.0, 467754.0, 1025652.0, 1194052.0, 617783.0, 261357.0, 116548.0, 55524.0, 28471.0, 15467.0, 8581.0, 5022.0, 3055.0, 1887.0, 1196.0, 766.0, 538.0, 311.0, 252.0, 172.0, 123.0, 78.0, 47.0, 33.0, 29.0, 16.0, 12.0, 9.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-37.90625, -36.76318359375, -35.6201171875, -34.47705078125, -33.333984375, -32.19091796875, -31.0478515625, -29.90478515625, -28.76171875, -27.61865234375, -26.4755859375, -25.33251953125, -24.189453125, -23.04638671875, -21.9033203125, -20.76025390625, -19.6171875, -18.47412109375, -17.3310546875, -16.18798828125, -15.044921875, -13.90185546875, -12.7587890625, -11.61572265625, -10.47265625, -9.32958984375, -8.1865234375, -7.04345703125, -5.900390625, -4.75732421875, -3.6142578125, -2.47119140625, -1.328125, -0.18505859375, 0.9580078125, 2.10107421875, 3.244140625, 4.38720703125, 5.5302734375, 6.67333984375, 7.81640625, 8.95947265625, 10.1025390625, 11.24560546875, 12.388671875, 13.53173828125, 14.6748046875, 15.81787109375, 16.9609375, 18.10400390625, 19.2470703125, 20.39013671875, 21.533203125, 22.67626953125, 23.8193359375, 24.96240234375, 26.10546875, 27.24853515625, 28.3916015625, 29.53466796875, 30.677734375, 31.82080078125, 32.9638671875, 34.10693359375, 35.25]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 13.0, 7.0, 10.0, 10.0, 15.0, 19.0, 22.0, 36.0, 43.0, 56.0, 100.0, 102.0, 113.0, 150.0, 200.0, 243.0, 289.0, 288.0, 294.0, 308.0, 329.0, 268.0, 225.0, 204.0, 144.0, 120.0, 99.0, 88.0, 51.0, 47.0, 40.0, 30.0, 25.0, 15.0, 12.0, 21.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.2950439453125, -8.011962890625, -7.7288818359375, -7.44580078125, -7.1627197265625, -6.879638671875, -6.5965576171875, -6.3134765625, -6.0303955078125, -5.747314453125, -5.4642333984375, -5.18115234375, -4.8980712890625, -4.614990234375, -4.3319091796875, -4.048828125, -3.7657470703125, -3.482666015625, -3.1995849609375, -2.91650390625, -2.6334228515625, -2.350341796875, -2.0672607421875, -1.7841796875, -1.5010986328125, -1.218017578125, -0.9349365234375, -0.65185546875, -0.3687744140625, -0.085693359375, 0.1973876953125, 0.48046875, 0.7635498046875, 1.046630859375, 1.3297119140625, 1.61279296875, 1.8958740234375, 2.178955078125, 2.4620361328125, 2.7451171875, 3.0281982421875, 3.311279296875, 3.5943603515625, 3.87744140625, 4.1605224609375, 4.443603515625, 4.7266845703125, 5.009765625, 5.2928466796875, 5.575927734375, 5.8590087890625, 6.14208984375, 6.4251708984375, 6.708251953125, 6.9913330078125, 7.2744140625, 7.5574951171875, 7.840576171875, 8.1236572265625, 8.40673828125, 8.6898193359375, 8.972900390625, 9.2559814453125, 9.5390625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 6.0, 5.0, 3.0, 11.0, 18.0, 11.0, 15.0, 16.0, 18.0, 24.0, 41.0, 32.0, 35.0, 32.0, 60.0, 73.0, 53.0, 50.0, 63.0, 61.0, 63.0, 39.0, 41.0, 44.0, 20.0, 19.0, 29.0, 27.0, 17.0, 12.0, 9.0, 11.0, 8.0, 4.0, 5.0, 7.0, 2.0, 2.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.729507446289062, -27.8569393157959, -26.984371185302734, -26.11180305480957, -25.239234924316406, -24.36666488647461, -23.494098663330078, -22.62152862548828, -21.748960494995117, -20.876392364501953, -20.00382423400879, -19.131256103515625, -18.25868797302246, -17.386119842529297, -16.5135498046875, -15.640981674194336, -14.768414497375488, -13.895846366882324, -13.02327823638916, -12.15070915222168, -11.278141021728516, -10.405572891235352, -9.533004760742188, -8.660436630249023, -7.787868022918701, -6.915299892425537, -6.042731285095215, -5.170163154602051, -4.297595024108887, -3.4250264167785645, -2.5524582862854004, -1.6798896789550781, -0.8073215484619141, 0.06524676084518433, 0.9378150701522827, 1.8103833198547363, 2.6829516887664795, 3.5555200576782227, 4.428088188171387, 5.300656795501709, 6.173224925994873, 7.045793056488037, 7.918361663818359, 8.790929794311523, 9.663497924804688, 10.536066055297852, 11.408634185791016, 12.281203269958496, 13.15377140045166, 14.026339530944824, 14.898907661437988, 15.771476745605469, 16.644044876098633, 17.516613006591797, 18.38918113708496, 19.261749267578125, 20.13431739807129, 21.006885528564453, 21.879453659057617, 22.75202178955078, 23.624589920043945, 24.49715805053711, 25.369728088378906, 26.24229621887207, 27.114864349365234]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 8.0, 7.0, 10.0, 16.0, 14.0, 10.0, 12.0, 17.0, 14.0, 21.0, 18.0, 27.0, 39.0, 33.0, 35.0, 38.0, 36.0, 41.0, 32.0, 31.0, 38.0, 30.0, 43.0, 37.0, 46.0, 35.0, 31.0, 35.0, 34.0, 35.0, 31.0, 26.0, 19.0, 20.0, 19.0, 11.0, 12.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.919206619262695, -12.46863842010498, -12.01806926727295, -11.567501068115234, -11.116931915283203, -10.666363716125488, -10.215795516967773, -9.765226364135742, -9.314658164978027, -8.864089965820312, -8.413520812988281, -7.962952613830566, -7.512383937835693, -7.06181526184082, -6.6112470626831055, -6.160678386688232, -5.710109710693359, -5.259541034698486, -4.808972358703613, -4.358404159545898, -3.9078354835510254, -3.4572668075561523, -3.0066983699798584, -2.5561299324035645, -2.1055612564086914, -1.654992699623108, -1.2044241428375244, -0.7538555860519409, -0.3032870292663574, 0.14728164672851562, 0.5978500843048096, 1.0484185218811035, 1.4989862442016602, 1.9495548009872437, 2.400123357772827, 2.850691795349121, 3.301260471343994, 3.751829147338867, 4.202397346496582, 4.652966022491455, 5.103534698486328, 5.554103374481201, 6.004672050476074, 6.455240249633789, 6.905808925628662, 7.356377601623535, 7.80694580078125, 8.257514953613281, 8.708083152770996, 9.158651351928711, 9.609220504760742, 10.059788703918457, 10.510356903076172, 10.960926055908203, 11.411494255065918, 11.862062454223633, 12.312631607055664, 12.763199806213379, 13.21376895904541, 13.664337158203125, 14.114906311035156, 14.565474510192871, 15.016042709350586, 15.466611862182617, 15.917180061340332]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 8.0, 10.0, 11.0, 24.0, 30.0, 37.0, 44.0, 75.0, 110.0, 178.0, 241.0, 383.0, 564.0, 894.0, 1429.0, 2271.0, 3848.0, 6357.0, 11174.0, 19267.0, 34310.0, 59987.0, 102008.0, 157984.0, 197521.0, 171634.0, 115424.0, 68894.0, 39555.0, 22758.0, 12829.0, 7445.0, 4261.0, 2563.0, 1517.0, 991.0, 644.0, 450.0, 270.0, 183.0, 112.0, 69.0, 61.0, 35.0, 40.0, 16.0, 12.0, 13.0, 4.0, 6.0, 0.0, 4.0, 2.0, 5.0, 1.0, 2.0], "bins": [-13.46875, -13.055908203125, -12.64306640625, -12.230224609375, -11.8173828125, -11.404541015625, -10.99169921875, -10.578857421875, -10.166015625, -9.753173828125, -9.34033203125, -8.927490234375, -8.5146484375, -8.101806640625, -7.68896484375, -7.276123046875, -6.86328125, -6.450439453125, -6.03759765625, -5.624755859375, -5.2119140625, -4.799072265625, -4.38623046875, -3.973388671875, -3.560546875, -3.147705078125, -2.73486328125, -2.322021484375, -1.9091796875, -1.496337890625, -1.08349609375, -0.670654296875, -0.2578125, 0.155029296875, 0.56787109375, 0.980712890625, 1.3935546875, 1.806396484375, 2.21923828125, 2.632080078125, 3.044921875, 3.457763671875, 3.87060546875, 4.283447265625, 4.6962890625, 5.109130859375, 5.52197265625, 5.934814453125, 6.34765625, 6.760498046875, 7.17333984375, 7.586181640625, 7.9990234375, 8.411865234375, 8.82470703125, 9.237548828125, 9.650390625, 10.063232421875, 10.47607421875, 10.888916015625, 11.3017578125, 11.714599609375, 12.12744140625, 12.540283203125, 12.953125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 4.0, 7.0, 14.0, 13.0, 21.0, 11.0, 14.0, 22.0, 27.0, 36.0, 30.0, 32.0, 41.0, 45.0, 40.0, 47.0, 40.0, 47.0, 52.0, 43.0, 45.0, 48.0, 39.0, 39.0, 44.0, 28.0, 30.0, 28.0, 19.0, 19.0, 9.0, 14.0, 13.0, 5.0, 6.0, 6.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.625, -19.0390625, -18.453125, -17.8671875, -17.28125, -16.6953125, -16.109375, -15.5234375, -14.9375, -14.3515625, -13.765625, -13.1796875, -12.59375, -12.0078125, -11.421875, -10.8359375, -10.25, -9.6640625, -9.078125, -8.4921875, -7.90625, -7.3203125, -6.734375, -6.1484375, -5.5625, -4.9765625, -4.390625, -3.8046875, -3.21875, -2.6328125, -2.046875, -1.4609375, -0.875, -0.2890625, 0.296875, 0.8828125, 1.46875, 2.0546875, 2.640625, 3.2265625, 3.8125, 4.3984375, 4.984375, 5.5703125, 6.15625, 6.7421875, 7.328125, 7.9140625, 8.5, 9.0859375, 9.671875, 10.2578125, 10.84375, 11.4296875, 12.015625, 12.6015625, 13.1875, 13.7734375, 14.359375, 14.9453125, 15.53125, 16.1171875, 16.703125, 17.2890625, 17.875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 7.0, 9.0, 17.0, 21.0, 35.0, 39.0, 76.0, 96.0, 145.0, 192.0, 277.0, 401.0, 543.0, 722.0, 1045.0, 1697.0, 2364.0, 3652.0, 6019.0, 9909.0, 17444.0, 30944.0, 57335.0, 106197.0, 186184.0, 236937.0, 170766.0, 95407.0, 51447.0, 27991.0, 15608.0, 8947.0, 5536.0, 3491.0, 2210.0, 1467.0, 997.0, 720.0, 472.0, 331.0, 236.0, 181.0, 137.0, 85.0, 58.0, 45.0, 27.0, 34.0, 18.0, 12.0, 5.0, 5.0, 6.0, 3.0, 4.0, 0.0, 3.0], "bins": [-16.578125, -16.066650390625, -15.55517578125, -15.043701171875, -14.5322265625, -14.020751953125, -13.50927734375, -12.997802734375, -12.486328125, -11.974853515625, -11.46337890625, -10.951904296875, -10.4404296875, -9.928955078125, -9.41748046875, -8.906005859375, -8.39453125, -7.883056640625, -7.37158203125, -6.860107421875, -6.3486328125, -5.837158203125, -5.32568359375, -4.814208984375, -4.302734375, -3.791259765625, -3.27978515625, -2.768310546875, -2.2568359375, -1.745361328125, -1.23388671875, -0.722412109375, -0.2109375, 0.300537109375, 0.81201171875, 1.323486328125, 1.8349609375, 2.346435546875, 2.85791015625, 3.369384765625, 3.880859375, 4.392333984375, 4.90380859375, 5.415283203125, 5.9267578125, 6.438232421875, 6.94970703125, 7.461181640625, 7.97265625, 8.484130859375, 8.99560546875, 9.507080078125, 10.0185546875, 10.530029296875, 11.04150390625, 11.552978515625, 12.064453125, 12.575927734375, 13.08740234375, 13.598876953125, 14.1103515625, 14.621826171875, 15.13330078125, 15.644775390625, 16.15625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 15.0, 11.0, 12.0, 9.0, 5.0, 22.0, 29.0, 21.0, 34.0, 32.0, 38.0, 40.0, 52.0, 52.0, 40.0, 45.0, 59.0, 46.0, 42.0, 40.0, 45.0, 32.0, 41.0, 32.0, 28.0, 24.0, 18.0, 20.0, 14.0, 18.0, 14.0, 14.0, 11.0, 9.0, 8.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7109375, -9.372314453125, -9.03369140625, -8.695068359375, -8.3564453125, -8.017822265625, -7.67919921875, -7.340576171875, -7.001953125, -6.663330078125, -6.32470703125, -5.986083984375, -5.6474609375, -5.308837890625, -4.97021484375, -4.631591796875, -4.29296875, -3.954345703125, -3.61572265625, -3.277099609375, -2.9384765625, -2.599853515625, -2.26123046875, -1.922607421875, -1.583984375, -1.245361328125, -0.90673828125, -0.568115234375, -0.2294921875, 0.109130859375, 0.44775390625, 0.786376953125, 1.125, 1.463623046875, 1.80224609375, 2.140869140625, 2.4794921875, 2.818115234375, 3.15673828125, 3.495361328125, 3.833984375, 4.172607421875, 4.51123046875, 4.849853515625, 5.1884765625, 5.527099609375, 5.86572265625, 6.204345703125, 6.54296875, 6.881591796875, 7.22021484375, 7.558837890625, 7.8974609375, 8.236083984375, 8.57470703125, 8.913330078125, 9.251953125, 9.590576171875, 9.92919921875, 10.267822265625, 10.6064453125, 10.945068359375, 11.28369140625, 11.622314453125, 11.9609375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 8.0, 8.0, 18.0, 24.0, 33.0, 49.0, 63.0, 110.0, 192.0, 286.0, 457.0, 816.0, 1299.0, 2294.0, 4141.0, 7708.0, 14416.0, 28782.0, 59462.0, 124599.0, 242529.0, 270900.0, 149112.0, 70377.0, 33854.0, 16900.0, 8769.0, 4839.0, 2593.0, 1562.0, 906.0, 560.0, 319.0, 193.0, 120.0, 84.0, 47.0, 43.0, 20.0, 20.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9140625, -6.6766357421875, -6.439208984375, -6.2017822265625, -5.96435546875, -5.7269287109375, -5.489501953125, -5.2520751953125, -5.0146484375, -4.7772216796875, -4.539794921875, -4.3023681640625, -4.06494140625, -3.8275146484375, -3.590087890625, -3.3526611328125, -3.115234375, -2.8778076171875, -2.640380859375, -2.4029541015625, -2.16552734375, -1.9281005859375, -1.690673828125, -1.4532470703125, -1.2158203125, -0.9783935546875, -0.740966796875, -0.5035400390625, -0.26611328125, -0.0286865234375, 0.208740234375, 0.4461669921875, 0.68359375, 0.9210205078125, 1.158447265625, 1.3958740234375, 1.63330078125, 1.8707275390625, 2.108154296875, 2.3455810546875, 2.5830078125, 2.8204345703125, 3.057861328125, 3.2952880859375, 3.53271484375, 3.7701416015625, 4.007568359375, 4.2449951171875, 4.482421875, 4.7198486328125, 4.957275390625, 5.1947021484375, 5.43212890625, 5.6695556640625, 5.906982421875, 6.1444091796875, 6.3818359375, 6.6192626953125, 6.856689453125, 7.0941162109375, 7.33154296875, 7.5689697265625, 7.806396484375, 8.0438232421875, 8.28125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 4.0, 9.0, 13.0, 15.0, 20.0, 26.0, 41.0, 42.0, 56.0, 57.0, 86.0, 98.0, 81.0, 69.0, 85.0, 74.0, 50.0, 43.0, 37.0, 17.0, 23.0, 16.0, 8.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006275177001953125, -0.0006091967225074768, -0.0005908757448196411, -0.0005725547671318054, -0.0005542337894439697, -0.000535912811756134, -0.0005175918340682983, -0.0004992708563804626, -0.00048094987869262695, -0.00046262890100479126, -0.00044430792331695557, -0.0004259869456291199, -0.0004076659679412842, -0.0003893449902534485, -0.0003710240125656128, -0.0003527030348777771, -0.0003343820571899414, -0.0003160610795021057, -0.00029774010181427, -0.0002794191241264343, -0.00026109814643859863, -0.00024277716875076294, -0.00022445619106292725, -0.00020613521337509155, -0.00018781423568725586, -0.00016949325799942017, -0.00015117228031158447, -0.00013285130262374878, -0.00011453032493591309, -9.620934724807739e-05, -7.78883695602417e-05, -5.9567391872406006e-05, -4.124641418457031e-05, -2.292543649673462e-05, -4.604458808898926e-06, 1.3716518878936768e-05, 3.203749656677246e-05, 5.0358474254608154e-05, 6.867945194244385e-05, 8.700042963027954e-05, 0.00010532140731811523, 0.00012364238500595093, 0.00014196336269378662, 0.00016028434038162231, 0.000178605318069458, 0.0001969262957572937, 0.0002152472734451294, 0.0002335682511329651, 0.0002518892288208008, 0.0002702102065086365, 0.00028853118419647217, 0.00030685216188430786, 0.00032517313957214355, 0.00034349411725997925, 0.00036181509494781494, 0.00038013607263565063, 0.00039845705032348633, 0.000416778028011322, 0.0004350990056991577, 0.0004534199833869934, 0.0004717409610748291, 0.0004900619387626648, 0.0005083829164505005, 0.0005267038941383362, 0.0005450248718261719]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 8.0, 16.0, 14.0, 13.0, 25.0, 44.0, 78.0, 116.0, 169.0, 270.0, 368.0, 573.0, 884.0, 1370.0, 2226.0, 3564.0, 5674.0, 9347.0, 14794.0, 25067.0, 40996.0, 66863.0, 106444.0, 151599.0, 174914.0, 154667.0, 110087.0, 69088.0, 42370.0, 25667.0, 15652.0, 9512.0, 5829.0, 3743.0, 2274.0, 1436.0, 975.0, 611.0, 420.0, 263.0, 184.0, 117.0, 83.0, 39.0, 42.0, 24.0, 14.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.17156982421875, -4.9837646484375, -4.79595947265625, -4.608154296875, -4.42034912109375, -4.2325439453125, -4.04473876953125, -3.85693359375, -3.66912841796875, -3.4813232421875, -3.29351806640625, -3.105712890625, -2.91790771484375, -2.7301025390625, -2.54229736328125, -2.3544921875, -2.16668701171875, -1.9788818359375, -1.79107666015625, -1.603271484375, -1.41546630859375, -1.2276611328125, -1.03985595703125, -0.85205078125, -0.66424560546875, -0.4764404296875, -0.28863525390625, -0.100830078125, 0.08697509765625, 0.2747802734375, 0.46258544921875, 0.650390625, 0.83819580078125, 1.0260009765625, 1.21380615234375, 1.401611328125, 1.58941650390625, 1.7772216796875, 1.96502685546875, 2.15283203125, 2.34063720703125, 2.5284423828125, 2.71624755859375, 2.904052734375, 3.09185791015625, 3.2796630859375, 3.46746826171875, 3.6552734375, 3.84307861328125, 4.0308837890625, 4.21868896484375, 4.406494140625, 4.59429931640625, 4.7821044921875, 4.96990966796875, 5.15771484375, 5.34552001953125, 5.5333251953125, 5.72113037109375, 5.908935546875, 6.09674072265625, 6.2845458984375, 6.47235107421875, 6.66015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 10.0, 13.0, 12.0, 19.0, 21.0, 13.0, 19.0, 28.0, 30.0, 45.0, 28.0, 43.0, 45.0, 54.0, 61.0, 60.0, 50.0, 35.0, 40.0, 43.0, 43.0, 46.0, 25.0, 34.0, 36.0, 29.0, 19.0, 13.0, 15.0, 18.0, 9.0, 10.0, 7.0, 8.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.673828125, -1.621368408203125, -1.56890869140625, -1.516448974609375, -1.4639892578125, -1.411529541015625, -1.35906982421875, -1.306610107421875, -1.254150390625, -1.201690673828125, -1.14923095703125, -1.096771240234375, -1.0443115234375, -0.991851806640625, -0.93939208984375, -0.886932373046875, -0.83447265625, -0.782012939453125, -0.72955322265625, -0.677093505859375, -0.6246337890625, -0.572174072265625, -0.51971435546875, -0.467254638671875, -0.414794921875, -0.362335205078125, -0.30987548828125, -0.257415771484375, -0.2049560546875, -0.152496337890625, -0.10003662109375, -0.047576904296875, 0.0048828125, 0.057342529296875, 0.10980224609375, 0.162261962890625, 0.2147216796875, 0.267181396484375, 0.31964111328125, 0.372100830078125, 0.424560546875, 0.477020263671875, 0.52947998046875, 0.581939697265625, 0.6343994140625, 0.686859130859375, 0.73931884765625, 0.791778564453125, 0.84423828125, 0.896697998046875, 0.94915771484375, 1.001617431640625, 1.0540771484375, 1.106536865234375, 1.15899658203125, 1.211456298828125, 1.263916015625, 1.316375732421875, 1.36883544921875, 1.421295166015625, 1.4737548828125, 1.526214599609375, 1.57867431640625, 1.631134033203125, 1.68359375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 10.0, 14.0, 12.0, 14.0, 11.0, 28.0, 23.0, 33.0, 32.0, 39.0, 46.0, 55.0, 49.0, 63.0, 53.0, 67.0, 65.0, 57.0, 49.0, 41.0, 39.0, 23.0, 24.0, 26.0, 23.0, 21.0, 14.0, 11.0, 6.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.114336013793945, -28.23215675354004, -27.3499755859375, -26.467796325683594, -25.585617065429688, -24.70343780517578, -23.821256637573242, -22.939077377319336, -22.05689811706543, -21.174718856811523, -20.292537689208984, -19.410358428955078, -18.528179168701172, -17.645999908447266, -16.763818740844727, -15.88163948059082, -14.999459266662598, -14.117279052734375, -13.235099792480469, -12.352919578552246, -11.47074031829834, -10.588560104370117, -9.706380844116211, -8.824200630187988, -7.942020893096924, -7.059841156005859, -6.177661418914795, -5.2954816818237305, -4.413301467895508, -3.5311217308044434, -2.648941993713379, -1.7667622566223145, -0.88458251953125, -0.0024027228355407715, 0.8797770738601685, 1.7619569301605225, 2.644136667251587, 3.5263166427612305, 4.408496379852295, 5.290676116943359, 6.172855854034424, 7.055035591125488, 7.937215328216553, 8.819395065307617, 9.70157527923584, 10.583755493164062, 11.465934753417969, 12.348114013671875, 13.230294227600098, 14.11247444152832, 14.994653701782227, 15.87683391571045, 16.759014129638672, 17.641193389892578, 18.523372650146484, 19.40555191040039, 20.28773307800293, 21.169912338256836, 22.052093505859375, 22.93427276611328, 23.816452026367188, 24.698631286621094, 25.580812454223633, 26.46299171447754, 27.345170974731445]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 5.0, 8.0, 8.0, 14.0, 14.0, 14.0, 11.0, 11.0, 18.0, 24.0, 17.0, 25.0, 30.0, 34.0, 38.0, 40.0, 37.0, 36.0, 36.0, 35.0, 35.0, 35.0, 37.0, 45.0, 35.0, 43.0, 29.0, 40.0, 34.0, 30.0, 31.0, 29.0, 17.0, 19.0, 15.0, 19.0, 13.0, 11.0, 4.0, 5.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.912052154541016, -12.462684631347656, -12.013318061828613, -11.563950538635254, -11.114583969116211, -10.665216445922852, -10.215848922729492, -9.76648235321045, -9.317115783691406, -8.867748260498047, -8.418381690979004, -7.9690141677856445, -7.519647598266602, -7.070280075073242, -6.620913028717041, -6.17154598236084, -5.7221784591674805, -5.272811412811279, -4.823444366455078, -4.374076843261719, -3.9247100353240967, -3.4753429889678955, -3.0259757041931152, -2.576608657836914, -2.127241611480713, -1.6778745651245117, -1.228507399559021, -0.7791402339935303, -0.3297731876373291, 0.11959385871887207, 0.5689611434936523, 1.0183281898498535, 1.467696189880371, 1.9170632362365723, 2.3664302825927734, 2.8157975673675537, 3.265164613723755, 3.714531660079956, 4.163898944854736, 4.6132659912109375, 5.062633037567139, 5.51200008392334, 5.961367130279541, 6.410734176635742, 6.860101699829102, 7.3094682693481445, 7.758835792541504, 8.208202362060547, 8.657569885253906, 9.106937408447266, 9.556303977966309, 10.005671501159668, 10.455038070678711, 10.90440559387207, 11.35377311706543, 11.803139686584473, 12.252506256103516, 12.701873779296875, 13.151240348815918, 13.600607872009277, 14.04997444152832, 14.49934196472168, 14.948709487915039, 15.398076057434082, 15.847443580627441]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 14.0, 24.0, 27.0, 53.0, 84.0, 113.0, 168.0, 244.0, 401.0, 632.0, 993.0, 1507.0, 2376.0, 3612.0, 5752.0, 8887.0, 13819.0, 21611.0, 33372.0, 51637.0, 76165.0, 105933.0, 133440.0, 143924.0, 130768.0, 102125.0, 72940.0, 48751.0, 31721.0, 20711.0, 13174.0, 8422.0, 5373.0, 3456.0, 2190.0, 1454.0, 919.0, 623.0, 387.0, 262.0, 156.0, 125.0, 71.0, 52.0, 36.0, 18.0, 14.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.890625, -16.31689453125, -15.7431640625, -15.16943359375, -14.595703125, -14.02197265625, -13.4482421875, -12.87451171875, -12.30078125, -11.72705078125, -11.1533203125, -10.57958984375, -10.005859375, -9.43212890625, -8.8583984375, -8.28466796875, -7.7109375, -7.13720703125, -6.5634765625, -5.98974609375, -5.416015625, -4.84228515625, -4.2685546875, -3.69482421875, -3.12109375, -2.54736328125, -1.9736328125, -1.39990234375, -0.826171875, -0.25244140625, 0.3212890625, 0.89501953125, 1.46875, 2.04248046875, 2.6162109375, 3.18994140625, 3.763671875, 4.33740234375, 4.9111328125, 5.48486328125, 6.05859375, 6.63232421875, 7.2060546875, 7.77978515625, 8.353515625, 8.92724609375, 9.5009765625, 10.07470703125, 10.6484375, 11.22216796875, 11.7958984375, 12.36962890625, 12.943359375, 13.51708984375, 14.0908203125, 14.66455078125, 15.23828125, 15.81201171875, 16.3857421875, 16.95947265625, 17.533203125, 18.10693359375, 18.6806640625, 19.25439453125, 19.828125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 9.0, 11.0, 11.0, 11.0, 15.0, 14.0, 19.0, 29.0, 25.0, 30.0, 38.0, 33.0, 42.0, 33.0, 41.0, 45.0, 37.0, 41.0, 39.0, 43.0, 49.0, 45.0, 33.0, 52.0, 36.0, 27.0, 32.0, 23.0, 16.0, 25.0, 17.0, 20.0, 10.0, 9.0, 1.0, 10.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.1875, -16.646240234375, -16.10498046875, -15.563720703125, -15.0224609375, -14.481201171875, -13.93994140625, -13.398681640625, -12.857421875, -12.316162109375, -11.77490234375, -11.233642578125, -10.6923828125, -10.151123046875, -9.60986328125, -9.068603515625, -8.52734375, -7.986083984375, -7.44482421875, -6.903564453125, -6.3623046875, -5.821044921875, -5.27978515625, -4.738525390625, -4.197265625, -3.656005859375, -3.11474609375, -2.573486328125, -2.0322265625, -1.490966796875, -0.94970703125, -0.408447265625, 0.1328125, 0.674072265625, 1.21533203125, 1.756591796875, 2.2978515625, 2.839111328125, 3.38037109375, 3.921630859375, 4.462890625, 5.004150390625, 5.54541015625, 6.086669921875, 6.6279296875, 7.169189453125, 7.71044921875, 8.251708984375, 8.79296875, 9.334228515625, 9.87548828125, 10.416748046875, 10.9580078125, 11.499267578125, 12.04052734375, 12.581787109375, 13.123046875, 13.664306640625, 14.20556640625, 14.746826171875, 15.2880859375, 15.829345703125, 16.37060546875, 16.911865234375, 17.453125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 5.0, 22.0, 23.0, 26.0, 51.0, 68.0, 114.0, 178.0, 259.0, 406.0, 579.0, 926.0, 1500.0, 2307.0, 3770.0, 6196.0, 10354.0, 17192.0, 28598.0, 46367.0, 73544.0, 110327.0, 146516.0, 162154.0, 144047.0, 107484.0, 71367.0, 44570.0, 27120.0, 16809.0, 9820.0, 6014.0, 3631.0, 2265.0, 1361.0, 892.0, 583.0, 404.0, 238.0, 147.0, 104.0, 76.0, 37.0, 38.0, 21.0, 14.0, 10.0, 7.0, 8.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.0625, -21.3828125, -20.703125, -20.0234375, -19.34375, -18.6640625, -17.984375, -17.3046875, -16.625, -15.9453125, -15.265625, -14.5859375, -13.90625, -13.2265625, -12.546875, -11.8671875, -11.1875, -10.5078125, -9.828125, -9.1484375, -8.46875, -7.7890625, -7.109375, -6.4296875, -5.75, -5.0703125, -4.390625, -3.7109375, -3.03125, -2.3515625, -1.671875, -0.9921875, -0.3125, 0.3671875, 1.046875, 1.7265625, 2.40625, 3.0859375, 3.765625, 4.4453125, 5.125, 5.8046875, 6.484375, 7.1640625, 7.84375, 8.5234375, 9.203125, 9.8828125, 10.5625, 11.2421875, 11.921875, 12.6015625, 13.28125, 13.9609375, 14.640625, 15.3203125, 16.0, 16.6796875, 17.359375, 18.0390625, 18.71875, 19.3984375, 20.078125, 20.7578125, 21.4375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 11.0, 6.0, 3.0, 3.0, 13.0, 14.0, 14.0, 19.0, 28.0, 16.0, 26.0, 33.0, 35.0, 42.0, 35.0, 34.0, 48.0, 45.0, 58.0, 59.0, 45.0, 48.0, 49.0, 47.0, 41.0, 34.0, 31.0, 25.0, 22.0, 24.0, 23.0, 21.0, 15.0, 10.0, 8.0, 9.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.953125, -13.56005859375, -13.1669921875, -12.77392578125, -12.380859375, -11.98779296875, -11.5947265625, -11.20166015625, -10.80859375, -10.41552734375, -10.0224609375, -9.62939453125, -9.236328125, -8.84326171875, -8.4501953125, -8.05712890625, -7.6640625, -7.27099609375, -6.8779296875, -6.48486328125, -6.091796875, -5.69873046875, -5.3056640625, -4.91259765625, -4.51953125, -4.12646484375, -3.7333984375, -3.34033203125, -2.947265625, -2.55419921875, -2.1611328125, -1.76806640625, -1.375, -0.98193359375, -0.5888671875, -0.19580078125, 0.197265625, 0.59033203125, 0.9833984375, 1.37646484375, 1.76953125, 2.16259765625, 2.5556640625, 2.94873046875, 3.341796875, 3.73486328125, 4.1279296875, 4.52099609375, 4.9140625, 5.30712890625, 5.7001953125, 6.09326171875, 6.486328125, 6.87939453125, 7.2724609375, 7.66552734375, 8.05859375, 8.45166015625, 8.8447265625, 9.23779296875, 9.630859375, 10.02392578125, 10.4169921875, 10.81005859375, 11.203125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 4.0, 7.0, 9.0, 22.0, 31.0, 32.0, 42.0, 53.0, 89.0, 121.0, 213.0, 303.0, 524.0, 885.0, 1516.0, 2975.0, 6465.0, 14783.0, 38466.0, 115647.0, 342180.0, 341950.0, 115594.0, 38528.0, 14823.0, 6341.0, 3078.0, 1559.0, 872.0, 506.0, 282.0, 207.0, 131.0, 78.0, 58.0, 49.0, 34.0, 25.0, 11.0, 17.0, 13.0, 2.0, 12.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-32.21875, -31.2119140625, -30.205078125, -29.1982421875, -28.19140625, -27.1845703125, -26.177734375, -25.1708984375, -24.1640625, -23.1572265625, -22.150390625, -21.1435546875, -20.13671875, -19.1298828125, -18.123046875, -17.1162109375, -16.109375, -15.1025390625, -14.095703125, -13.0888671875, -12.08203125, -11.0751953125, -10.068359375, -9.0615234375, -8.0546875, -7.0478515625, -6.041015625, -5.0341796875, -4.02734375, -3.0205078125, -2.013671875, -1.0068359375, 0.0, 1.0068359375, 2.013671875, 3.0205078125, 4.02734375, 5.0341796875, 6.041015625, 7.0478515625, 8.0546875, 9.0615234375, 10.068359375, 11.0751953125, 12.08203125, 13.0888671875, 14.095703125, 15.1025390625, 16.109375, 17.1162109375, 18.123046875, 19.1298828125, 20.13671875, 21.1435546875, 22.150390625, 23.1572265625, 24.1640625, 25.1708984375, 26.177734375, 27.1845703125, 28.19140625, 29.1982421875, 30.205078125, 31.2119140625, 32.21875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 12.0, 9.0, 8.0, 12.0, 17.0, 49.0, 63.0, 110.0, 175.0, 183.0, 130.0, 91.0, 50.0, 31.0, 17.0, 8.0, 6.0, 4.0, 7.0, 1.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005340576171875, -0.005217015743255615, -0.0050934553146362305, -0.004969894886016846, -0.004846334457397461, -0.004722774028778076, -0.004599213600158691, -0.004475653171539307, -0.004352092742919922, -0.004228532314300537, -0.004104971885681152, -0.003981411457061768, -0.003857851028442383, -0.003734290599822998, -0.0036107301712036133, -0.0034871697425842285, -0.0033636093139648438, -0.003240048885345459, -0.0031164884567260742, -0.0029929280281066895, -0.0028693675994873047, -0.00274580717086792, -0.002622246742248535, -0.0024986863136291504, -0.0023751258850097656, -0.002251565456390381, -0.002128005027770996, -0.0020044445991516113, -0.0018808841705322266, -0.0017573237419128418, -0.001633763313293457, -0.0015102028846740723, -0.0013866424560546875, -0.0012630820274353027, -0.001139521598815918, -0.0010159611701965332, -0.0008924007415771484, -0.0007688403129577637, -0.0006452798843383789, -0.0005217194557189941, -0.0003981590270996094, -0.0002745985984802246, -0.00015103816986083984, -2.7477741241455078e-05, 9.608268737792969e-05, 0.00021964311599731445, 0.0003432035446166992, 0.000466763973236084, 0.0005903244018554688, 0.0007138848304748535, 0.0008374452590942383, 0.000961005687713623, 0.0010845661163330078, 0.0012081265449523926, 0.0013316869735717773, 0.0014552474021911621, 0.0015788078308105469, 0.0017023682594299316, 0.0018259286880493164, 0.0019494891166687012, 0.002073049545288086, 0.0021966099739074707, 0.0023201704025268555, 0.0024437308311462402, 0.002567291259765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 13.0, 16.0, 22.0, 24.0, 47.0, 70.0, 97.0, 167.0, 219.0, 365.0, 511.0, 854.0, 1310.0, 2161.0, 3502.0, 5789.0, 11030.0, 21588.0, 45769.0, 107532.0, 242739.0, 307724.0, 163404.0, 68109.0, 30809.0, 15001.0, 7904.0, 4423.0, 2701.0, 1738.0, 955.0, 646.0, 421.0, 306.0, 206.0, 116.0, 93.0, 65.0, 31.0, 23.0, 21.0, 11.0, 8.0, 6.0, 5.0, 0.0, 3.0, 2.0, 1.0], "bins": [-27.96875, -27.197021484375, -26.42529296875, -25.653564453125, -24.8818359375, -24.110107421875, -23.33837890625, -22.566650390625, -21.794921875, -21.023193359375, -20.25146484375, -19.479736328125, -18.7080078125, -17.936279296875, -17.16455078125, -16.392822265625, -15.62109375, -14.849365234375, -14.07763671875, -13.305908203125, -12.5341796875, -11.762451171875, -10.99072265625, -10.218994140625, -9.447265625, -8.675537109375, -7.90380859375, -7.132080078125, -6.3603515625, -5.588623046875, -4.81689453125, -4.045166015625, -3.2734375, -2.501708984375, -1.72998046875, -0.958251953125, -0.1865234375, 0.585205078125, 1.35693359375, 2.128662109375, 2.900390625, 3.672119140625, 4.44384765625, 5.215576171875, 5.9873046875, 6.759033203125, 7.53076171875, 8.302490234375, 9.07421875, 9.845947265625, 10.61767578125, 11.389404296875, 12.1611328125, 12.932861328125, 13.70458984375, 14.476318359375, 15.248046875, 16.019775390625, 16.79150390625, 17.563232421875, 18.3349609375, 19.106689453125, 19.87841796875, 20.650146484375, 21.421875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 4.0, 2.0, 9.0, 18.0, 17.0, 30.0, 33.0, 37.0, 50.0, 52.0, 53.0, 77.0, 67.0, 90.0, 73.0, 64.0, 75.0, 56.0, 33.0, 32.0, 25.0, 16.0, 23.0, 14.0, 11.0, 5.0, 10.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -7.0006103515625, -6.790283203125, -6.5799560546875, -6.36962890625, -6.1593017578125, -5.948974609375, -5.7386474609375, -5.5283203125, -5.3179931640625, -5.107666015625, -4.8973388671875, -4.68701171875, -4.4766845703125, -4.266357421875, -4.0560302734375, -3.845703125, -3.6353759765625, -3.425048828125, -3.2147216796875, -3.00439453125, -2.7940673828125, -2.583740234375, -2.3734130859375, -2.1630859375, -1.9527587890625, -1.742431640625, -1.5321044921875, -1.32177734375, -1.1114501953125, -0.901123046875, -0.6907958984375, -0.48046875, -0.2701416015625, -0.059814453125, 0.1505126953125, 0.36083984375, 0.5711669921875, 0.781494140625, 0.9918212890625, 1.2021484375, 1.4124755859375, 1.622802734375, 1.8331298828125, 2.04345703125, 2.2537841796875, 2.464111328125, 2.6744384765625, 2.884765625, 3.0950927734375, 3.305419921875, 3.5157470703125, 3.72607421875, 3.9364013671875, 4.146728515625, 4.3570556640625, 4.5673828125, 4.7777099609375, 4.988037109375, 5.1983642578125, 5.40869140625, 5.6190185546875, 5.829345703125, 6.0396728515625, 6.25]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 16.0, 5.0, 12.0, 16.0, 18.0, 13.0, 23.0, 35.0, 40.0, 39.0, 56.0, 53.0, 54.0, 71.0, 57.0, 69.0, 59.0, 58.0, 59.0, 45.0, 25.0, 38.0, 25.0, 13.0, 17.0, 13.0, 13.0, 6.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.932640075683594, -28.98223876953125, -28.031837463378906, -27.08143424987793, -26.131032943725586, -25.180631637573242, -24.2302303314209, -23.279827117919922, -22.329425811767578, -21.379024505615234, -20.42862319946289, -19.478219985961914, -18.52781867980957, -17.577417373657227, -16.627016067504883, -15.676613807678223, -14.726212501525879, -13.775811195373535, -12.825408935546875, -11.875007629394531, -10.924605369567871, -9.974204063415527, -9.023801803588867, -8.073400497436523, -7.1229987144470215, -6.1725969314575195, -5.222195148468018, -4.271793365478516, -3.3213918209075928, -2.37099027633667, -1.420588493347168, -0.470186710357666, 0.48021507263183594, 1.430616855621338, 2.38101863861084, 3.3314201831817627, 4.281822204589844, 5.2322235107421875, 6.1826252937316895, 7.133027076721191, 8.083429336547852, 9.033830642700195, 9.984232902526855, 10.9346342086792, 11.88503646850586, 12.835437774658203, 13.785839080810547, 14.736241340637207, 15.68664264678955, 16.63704490661621, 17.587446212768555, 18.5378475189209, 19.488248825073242, 20.43865203857422, 21.389053344726562, 22.339454650878906, 23.28985595703125, 24.240257263183594, 25.190658569335938, 26.141061782836914, 27.091463088989258, 28.0418643951416, 28.992265701293945, 29.942668914794922, 30.893070220947266]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 8.0, 6.0, 4.0, 7.0, 7.0, 12.0, 8.0, 12.0, 18.0, 19.0, 25.0, 17.0, 18.0, 25.0, 19.0, 15.0, 27.0, 19.0, 33.0, 36.0, 43.0, 41.0, 28.0, 32.0, 41.0, 41.0, 36.0, 45.0, 31.0, 35.0, 31.0, 26.0, 29.0, 33.0, 27.0, 24.0, 21.0, 23.0, 9.0, 20.0, 6.0, 12.0, 8.0, 8.0, 7.0, 2.0, 0.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-15.10141658782959, -14.670954704284668, -14.240493774414062, -13.81003189086914, -13.379570007324219, -12.949108123779297, -12.518647193908691, -12.08818531036377, -11.657724380493164, -11.227262496948242, -10.796801567077637, -10.366339683532715, -9.935877799987793, -9.505416870117188, -9.074954986572266, -8.644493103027344, -8.214031219482422, -7.783569812774658, -7.353107929229736, -6.922646522521973, -6.492184638977051, -6.061723232269287, -5.631261825561523, -5.200799942016602, -4.770338535308838, -4.339877128601074, -3.9094152450561523, -3.4789538383483887, -3.048492193222046, -2.618030548095703, -2.1875691413879395, -1.7571074962615967, -1.326645851135254, -0.8961842656135559, -0.4657226800918579, -0.03526115417480469, 0.3952004909515381, 0.8256621360778809, 1.2561235427856445, 1.6865851879119873, 2.11704683303833, 2.547508478164673, 2.9779701232910156, 3.4084315299987793, 3.838893175125122, 4.269354820251465, 4.6998162269592285, 5.130277633666992, 5.560739517211914, 5.991200923919678, 6.4216628074646, 6.852124214172363, 7.282586097717285, 7.713047504425049, 8.143508911132812, 8.573970794677734, 9.004432678222656, 9.434894561767578, 9.865355491638184, 10.295817375183105, 10.726279258728027, 11.156740188598633, 11.587202072143555, 12.017663955688477, 12.448124885559082]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [6.0, 10.0, 8.0, 14.0, 22.0, 31.0, 38.0, 67.0, 59.0, 104.0, 146.0, 172.0, 289.0, 425.0, 584.0, 835.0, 1248.0, 1839.0, 2813.0, 4104.0, 6404.0, 10299.0, 17048.0, 28523.0, 50450.0, 93648.0, 183404.0, 374914.0, 724937.0, 1017857.0, 796489.0, 427548.0, 210119.0, 104868.0, 55538.0, 30835.0, 18044.0, 10947.0, 6753.0, 4234.0, 2730.0, 1826.0, 1216.0, 899.0, 582.0, 411.0, 297.0, 167.0, 148.0, 106.0, 74.0, 45.0, 35.0, 29.0, 15.0, 11.0, 11.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0], "bins": [-28.140625, -27.189697265625, -26.23876953125, -25.287841796875, -24.3369140625, -23.385986328125, -22.43505859375, -21.484130859375, -20.533203125, -19.582275390625, -18.63134765625, -17.680419921875, -16.7294921875, -15.778564453125, -14.82763671875, -13.876708984375, -12.92578125, -11.974853515625, -11.02392578125, -10.072998046875, -9.1220703125, -8.171142578125, -7.22021484375, -6.269287109375, -5.318359375, -4.367431640625, -3.41650390625, -2.465576171875, -1.5146484375, -0.563720703125, 0.38720703125, 1.338134765625, 2.2890625, 3.239990234375, 4.19091796875, 5.141845703125, 6.0927734375, 7.043701171875, 7.99462890625, 8.945556640625, 9.896484375, 10.847412109375, 11.79833984375, 12.749267578125, 13.7001953125, 14.651123046875, 15.60205078125, 16.552978515625, 17.50390625, 18.454833984375, 19.40576171875, 20.356689453125, 21.3076171875, 22.258544921875, 23.20947265625, 24.160400390625, 25.111328125, 26.062255859375, 27.01318359375, 27.964111328125, 28.9150390625, 29.865966796875, 30.81689453125, 31.767822265625, 32.71875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 3.0, 4.0, 7.0, 7.0, 5.0, 5.0, 15.0, 17.0, 18.0, 14.0, 12.0, 20.0, 16.0, 23.0, 19.0, 28.0, 21.0, 32.0, 35.0, 28.0, 28.0, 36.0, 40.0, 27.0, 43.0, 40.0, 41.0, 34.0, 43.0, 33.0, 32.0, 32.0, 26.0, 31.0, 28.0, 24.0, 19.0, 16.0, 13.0, 11.0, 17.0, 16.0, 4.0, 8.0, 8.0, 8.0, 7.0, 2.0, 1.0, 2.0, 0.0, 5.0, 0.0, 3.0, 3.0, 1.0], "bins": [-12.375, -11.996826171875, -11.61865234375, -11.240478515625, -10.8623046875, -10.484130859375, -10.10595703125, -9.727783203125, -9.349609375, -8.971435546875, -8.59326171875, -8.215087890625, -7.8369140625, -7.458740234375, -7.08056640625, -6.702392578125, -6.32421875, -5.946044921875, -5.56787109375, -5.189697265625, -4.8115234375, -4.433349609375, -4.05517578125, -3.677001953125, -3.298828125, -2.920654296875, -2.54248046875, -2.164306640625, -1.7861328125, -1.407958984375, -1.02978515625, -0.651611328125, -0.2734375, 0.104736328125, 0.48291015625, 0.861083984375, 1.2392578125, 1.617431640625, 1.99560546875, 2.373779296875, 2.751953125, 3.130126953125, 3.50830078125, 3.886474609375, 4.2646484375, 4.642822265625, 5.02099609375, 5.399169921875, 5.77734375, 6.155517578125, 6.53369140625, 6.911865234375, 7.2900390625, 7.668212890625, 8.04638671875, 8.424560546875, 8.802734375, 9.180908203125, 9.55908203125, 9.937255859375, 10.3154296875, 10.693603515625, 11.07177734375, 11.449951171875, 11.828125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 18.0, 19.0, 30.0, 53.0, 80.0, 112.0, 134.0, 214.0, 263.0, 516.0, 642.0, 1015.0, 1639.0, 2511.0, 4025.0, 6452.0, 10721.0, 18083.0, 31593.0, 56477.0, 104166.0, 201484.0, 399547.0, 756170.0, 1022737.0, 747595.0, 394021.0, 198512.0, 102911.0, 55323.0, 30856.0, 17862.0, 10675.0, 6460.0, 3935.0, 2478.0, 1646.0, 1079.0, 725.0, 472.0, 316.0, 201.0, 159.0, 113.0, 77.0, 53.0, 41.0, 28.0, 17.0, 8.0, 7.0, 5.0, 2.0, 2.0], "bins": [-42.0, -40.7822265625, -39.564453125, -38.3466796875, -37.12890625, -35.9111328125, -34.693359375, -33.4755859375, -32.2578125, -31.0400390625, -29.822265625, -28.6044921875, -27.38671875, -26.1689453125, -24.951171875, -23.7333984375, -22.515625, -21.2978515625, -20.080078125, -18.8623046875, -17.64453125, -16.4267578125, -15.208984375, -13.9912109375, -12.7734375, -11.5556640625, -10.337890625, -9.1201171875, -7.90234375, -6.6845703125, -5.466796875, -4.2490234375, -3.03125, -1.8134765625, -0.595703125, 0.6220703125, 1.83984375, 3.0576171875, 4.275390625, 5.4931640625, 6.7109375, 7.9287109375, 9.146484375, 10.3642578125, 11.58203125, 12.7998046875, 14.017578125, 15.2353515625, 16.453125, 17.6708984375, 18.888671875, 20.1064453125, 21.32421875, 22.5419921875, 23.759765625, 24.9775390625, 26.1953125, 27.4130859375, 28.630859375, 29.8486328125, 31.06640625, 32.2841796875, 33.501953125, 34.7197265625, 35.9375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 10.0, 10.0, 15.0, 22.0, 23.0, 29.0, 54.0, 58.0, 71.0, 104.0, 103.0, 143.0, 163.0, 200.0, 244.0, 254.0, 291.0, 289.0, 295.0, 259.0, 243.0, 216.0, 187.0, 137.0, 117.0, 92.0, 92.0, 66.0, 72.0, 40.0, 48.0, 21.0, 30.0, 11.0, 11.0, 9.0, 12.0, 11.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1533203125, -8.814453125, -8.4755859375, -8.13671875, -7.7978515625, -7.458984375, -7.1201171875, -6.78125, -6.4423828125, -6.103515625, -5.7646484375, -5.42578125, -5.0869140625, -4.748046875, -4.4091796875, -4.0703125, -3.7314453125, -3.392578125, -3.0537109375, -2.71484375, -2.3759765625, -2.037109375, -1.6982421875, -1.359375, -1.0205078125, -0.681640625, -0.3427734375, -0.00390625, 0.3349609375, 0.673828125, 1.0126953125, 1.3515625, 1.6904296875, 2.029296875, 2.3681640625, 2.70703125, 3.0458984375, 3.384765625, 3.7236328125, 4.0625, 4.4013671875, 4.740234375, 5.0791015625, 5.41796875, 5.7568359375, 6.095703125, 6.4345703125, 6.7734375, 7.1123046875, 7.451171875, 7.7900390625, 8.12890625, 8.4677734375, 8.806640625, 9.1455078125, 9.484375, 9.8232421875, 10.162109375, 10.5009765625, 10.83984375, 11.1787109375, 11.517578125, 11.8564453125, 12.1953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 11.0, 14.0, 8.0, 15.0, 15.0, 24.0, 30.0, 44.0, 52.0, 56.0, 55.0, 69.0, 70.0, 86.0, 59.0, 59.0, 71.0, 45.0, 46.0, 34.0, 23.0, 23.0, 17.0, 13.0, 8.0, 8.0, 3.0, 11.0, 6.0, 8.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.60175323486328, -43.22584533691406, -41.84994125366211, -40.47403335571289, -39.09812927246094, -37.72222137451172, -36.3463134765625, -34.97040939331055, -33.594505310058594, -32.218597412109375, -30.842693328857422, -29.466785430908203, -28.09088134765625, -26.71497344970703, -25.339067459106445, -23.96316146850586, -22.58725357055664, -21.211347579956055, -19.83544158935547, -18.45953369140625, -17.083629608154297, -15.707722663879395, -14.331815719604492, -12.955909729003906, -11.58000373840332, -10.204097747802734, -8.828191757202148, -7.452284812927246, -6.07637882232666, -4.700472831726074, -3.324565887451172, -1.948659896850586, -0.5727500915527344, 0.8031561374664307, 2.1790623664855957, 3.55496883392334, 4.930874824523926, 6.306780815124512, 7.682687759399414, 9.05859375, 10.434499740600586, 11.810405731201172, 13.186311721801758, 14.56221866607666, 15.938124656677246, 17.314029693603516, 18.689937591552734, 20.06584358215332, 21.441749572753906, 22.817655563354492, 24.193561553955078, 25.569469451904297, 26.94537353515625, 28.32128143310547, 29.697187423706055, 31.07309341430664, 32.448997497558594, 33.82490539550781, 35.200809478759766, 36.576717376708984, 37.95262145996094, 39.328529357910156, 40.704437255859375, 42.08034133911133, 43.45624923706055]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 7.0, 2.0, 8.0, 11.0, 7.0, 11.0, 8.0, 15.0, 20.0, 22.0, 14.0, 19.0, 21.0, 37.0, 40.0, 38.0, 27.0, 37.0, 43.0, 37.0, 51.0, 45.0, 37.0, 46.0, 36.0, 43.0, 46.0, 31.0, 42.0, 33.0, 22.0, 29.0, 16.0, 19.0, 13.0, 13.0, 14.0, 8.0, 9.0, 7.0, 6.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.908977508544922, -19.299041748046875, -18.68910789489746, -18.079172134399414, -17.46923828125, -16.859302520751953, -16.24936866760254, -15.639432907104492, -15.029498100280762, -14.419563293457031, -13.8096284866333, -13.19969367980957, -12.589757919311523, -11.97982406616211, -11.369888305664062, -10.759953498840332, -10.150018692016602, -9.540083885192871, -8.93014907836914, -8.32021427154541, -7.7102789878845215, -7.100344181060791, -6.490408897399902, -5.880474090576172, -5.270539283752441, -4.660604476928711, -4.0506696701049805, -3.440734386444092, -2.8307995796203613, -2.220864772796631, -1.6109297275543213, -1.0009946823120117, -0.39105796813964844, 0.21887695789337158, 0.8288118839263916, 1.4387468099594116, 2.0486817359924316, 2.658616542816162, 3.2685515880584717, 3.8784866333007812, 4.488421440124512, 5.098356246948242, 5.708291053771973, 6.318226337432861, 6.928161144256592, 7.538095951080322, 8.148031234741211, 8.757966041564941, 9.367900848388672, 9.977835655212402, 10.587770462036133, 11.197705268859863, 11.807640075683594, 12.41757583618164, 13.027510643005371, 13.637445449829102, 14.247380256652832, 14.857315063476562, 15.467249870300293, 16.077184677124023, 16.68712043762207, 17.297054290771484, 17.90699005126953, 18.516925811767578, 19.126859664916992]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 9.0, 11.0, 11.0, 15.0, 23.0, 29.0, 52.0, 67.0, 103.0, 173.0, 263.0, 463.0, 729.0, 1154.0, 2086.0, 3557.0, 6674.0, 12440.0, 23712.0, 46946.0, 90648.0, 165019.0, 234085.0, 204354.0, 121901.0, 64378.0, 32654.0, 17028.0, 8654.0, 4811.0, 2532.0, 1580.0, 826.0, 592.0, 358.0, 226.0, 133.0, 83.0, 59.0, 39.0, 29.0, 16.0, 15.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.53125, -19.88427734375, -19.2373046875, -18.59033203125, -17.943359375, -17.29638671875, -16.6494140625, -16.00244140625, -15.35546875, -14.70849609375, -14.0615234375, -13.41455078125, -12.767578125, -12.12060546875, -11.4736328125, -10.82666015625, -10.1796875, -9.53271484375, -8.8857421875, -8.23876953125, -7.591796875, -6.94482421875, -6.2978515625, -5.65087890625, -5.00390625, -4.35693359375, -3.7099609375, -3.06298828125, -2.416015625, -1.76904296875, -1.1220703125, -0.47509765625, 0.171875, 0.81884765625, 1.4658203125, 2.11279296875, 2.759765625, 3.40673828125, 4.0537109375, 4.70068359375, 5.34765625, 5.99462890625, 6.6416015625, 7.28857421875, 7.935546875, 8.58251953125, 9.2294921875, 9.87646484375, 10.5234375, 11.17041015625, 11.8173828125, 12.46435546875, 13.111328125, 13.75830078125, 14.4052734375, 15.05224609375, 15.69921875, 16.34619140625, 16.9931640625, 17.64013671875, 18.287109375, 18.93408203125, 19.5810546875, 20.22802734375, 20.875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 3.0, 10.0, 6.0, 9.0, 7.0, 14.0, 11.0, 23.0, 15.0, 21.0, 23.0, 24.0, 34.0, 38.0, 27.0, 50.0, 34.0, 46.0, 42.0, 47.0, 42.0, 59.0, 42.0, 28.0, 45.0, 42.0, 40.0, 30.0, 30.0, 18.0, 22.0, 20.0, 21.0, 16.0, 11.0, 6.0, 7.0, 6.0, 9.0, 2.0, 2.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-24.078125, -23.36474609375, -22.6513671875, -21.93798828125, -21.224609375, -20.51123046875, -19.7978515625, -19.08447265625, -18.37109375, -17.65771484375, -16.9443359375, -16.23095703125, -15.517578125, -14.80419921875, -14.0908203125, -13.37744140625, -12.6640625, -11.95068359375, -11.2373046875, -10.52392578125, -9.810546875, -9.09716796875, -8.3837890625, -7.67041015625, -6.95703125, -6.24365234375, -5.5302734375, -4.81689453125, -4.103515625, -3.39013671875, -2.6767578125, -1.96337890625, -1.25, -0.53662109375, 0.1767578125, 0.89013671875, 1.603515625, 2.31689453125, 3.0302734375, 3.74365234375, 4.45703125, 5.17041015625, 5.8837890625, 6.59716796875, 7.310546875, 8.02392578125, 8.7373046875, 9.45068359375, 10.1640625, 10.87744140625, 11.5908203125, 12.30419921875, 13.017578125, 13.73095703125, 14.4443359375, 15.15771484375, 15.87109375, 16.58447265625, 17.2978515625, 18.01123046875, 18.724609375, 19.43798828125, 20.1513671875, 20.86474609375, 21.578125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 8.0, 14.0, 18.0, 26.0, 20.0, 35.0, 58.0, 69.0, 106.0, 150.0, 208.0, 307.0, 461.0, 637.0, 1008.0, 1488.0, 2343.0, 3739.0, 6211.0, 10920.0, 19573.0, 37521.0, 72875.0, 138790.0, 229829.0, 228871.0, 137996.0, 71866.0, 36771.0, 19151.0, 10623.0, 6225.0, 3707.0, 2340.0, 1498.0, 967.0, 626.0, 468.0, 295.0, 225.0, 155.0, 108.0, 76.0, 50.0, 38.0, 23.0, 21.0, 13.0, 8.0, 12.0, 5.0, 3.0, 3.0, 3.0], "bins": [-24.578125, -23.875732421875, -23.17333984375, -22.470947265625, -21.7685546875, -21.066162109375, -20.36376953125, -19.661376953125, -18.958984375, -18.256591796875, -17.55419921875, -16.851806640625, -16.1494140625, -15.447021484375, -14.74462890625, -14.042236328125, -13.33984375, -12.637451171875, -11.93505859375, -11.232666015625, -10.5302734375, -9.827880859375, -9.12548828125, -8.423095703125, -7.720703125, -7.018310546875, -6.31591796875, -5.613525390625, -4.9111328125, -4.208740234375, -3.50634765625, -2.803955078125, -2.1015625, -1.399169921875, -0.69677734375, 0.005615234375, 0.7080078125, 1.410400390625, 2.11279296875, 2.815185546875, 3.517578125, 4.219970703125, 4.92236328125, 5.624755859375, 6.3271484375, 7.029541015625, 7.73193359375, 8.434326171875, 9.13671875, 9.839111328125, 10.54150390625, 11.243896484375, 11.9462890625, 12.648681640625, 13.35107421875, 14.053466796875, 14.755859375, 15.458251953125, 16.16064453125, 16.863037109375, 17.5654296875, 18.267822265625, 18.97021484375, 19.672607421875, 20.375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 6.0, 4.0, 7.0, 6.0, 5.0, 12.0, 12.0, 22.0, 20.0, 21.0, 21.0, 27.0, 21.0, 31.0, 35.0, 38.0, 37.0, 47.0, 46.0, 50.0, 32.0, 45.0, 39.0, 32.0, 47.0, 35.0, 35.0, 34.0, 31.0, 27.0, 35.0, 17.0, 20.0, 19.0, 20.0, 10.0, 17.0, 9.0, 6.0, 7.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.703125, -12.2801513671875, -11.857177734375, -11.4342041015625, -11.01123046875, -10.5882568359375, -10.165283203125, -9.7423095703125, -9.3193359375, -8.8963623046875, -8.473388671875, -8.0504150390625, -7.62744140625, -7.2044677734375, -6.781494140625, -6.3585205078125, -5.935546875, -5.5125732421875, -5.089599609375, -4.6666259765625, -4.24365234375, -3.8206787109375, -3.397705078125, -2.9747314453125, -2.5517578125, -2.1287841796875, -1.705810546875, -1.2828369140625, -0.85986328125, -0.4368896484375, -0.013916015625, 0.4090576171875, 0.83203125, 1.2550048828125, 1.677978515625, 2.1009521484375, 2.52392578125, 2.9468994140625, 3.369873046875, 3.7928466796875, 4.2158203125, 4.6387939453125, 5.061767578125, 5.4847412109375, 5.90771484375, 6.3306884765625, 6.753662109375, 7.1766357421875, 7.599609375, 8.0225830078125, 8.445556640625, 8.8685302734375, 9.29150390625, 9.7144775390625, 10.137451171875, 10.5604248046875, 10.9833984375, 11.4063720703125, 11.829345703125, 12.2523193359375, 12.67529296875, 13.0982666015625, 13.521240234375, 13.9442138671875, 14.3671875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 9.0, 11.0, 16.0, 34.0, 28.0, 72.0, 90.0, 117.0, 211.0, 331.0, 411.0, 646.0, 984.0, 1712.0, 2579.0, 4350.0, 7260.0, 12144.0, 21578.0, 39509.0, 74092.0, 141039.0, 238310.0, 223527.0, 126829.0, 67450.0, 36007.0, 20125.0, 11226.0, 6736.0, 4178.0, 2501.0, 1526.0, 978.0, 654.0, 416.0, 261.0, 209.0, 116.0, 88.0, 57.0, 41.0, 21.0, 19.0, 16.0, 10.0, 7.0, 8.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5, -8.2159423828125, -7.931884765625, -7.6478271484375, -7.36376953125, -7.0797119140625, -6.795654296875, -6.5115966796875, -6.2275390625, -5.9434814453125, -5.659423828125, -5.3753662109375, -5.09130859375, -4.8072509765625, -4.523193359375, -4.2391357421875, -3.955078125, -3.6710205078125, -3.386962890625, -3.1029052734375, -2.81884765625, -2.5347900390625, -2.250732421875, -1.9666748046875, -1.6826171875, -1.3985595703125, -1.114501953125, -0.8304443359375, -0.54638671875, -0.2623291015625, 0.021728515625, 0.3057861328125, 0.58984375, 0.8739013671875, 1.157958984375, 1.4420166015625, 1.72607421875, 2.0101318359375, 2.294189453125, 2.5782470703125, 2.8623046875, 3.1463623046875, 3.430419921875, 3.7144775390625, 3.99853515625, 4.2825927734375, 4.566650390625, 4.8507080078125, 5.134765625, 5.4188232421875, 5.702880859375, 5.9869384765625, 6.27099609375, 6.5550537109375, 6.839111328125, 7.1231689453125, 7.4072265625, 7.6912841796875, 7.975341796875, 8.2593994140625, 8.54345703125, 8.8275146484375, 9.111572265625, 9.3956298828125, 9.6796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 10.0, 8.0, 10.0, 6.0, 18.0, 23.0, 28.0, 23.0, 49.0, 54.0, 49.0, 82.0, 90.0, 81.0, 90.0, 68.0, 85.0, 57.0, 47.0, 31.0, 23.0, 20.0, 8.0, 14.0, 8.0, 4.0, 3.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010890960693359375, -0.001062937080860138, -0.0010367780923843384, -0.0010106191039085388, -0.0009844601154327393, -0.0009583011269569397, -0.0009321421384811401, -0.0009059831500053406, -0.000879824161529541, -0.0008536651730537415, -0.0008275061845779419, -0.0008013471961021423, -0.0007751882076263428, -0.0007490292191505432, -0.0007228702306747437, -0.0006967112421989441, -0.0006705522537231445, -0.000644393265247345, -0.0006182342767715454, -0.0005920752882957458, -0.0005659162998199463, -0.0005397573113441467, -0.0005135983228683472, -0.0004874393343925476, -0.00046128034591674805, -0.0004351213574409485, -0.0004089623689651489, -0.00038280338048934937, -0.0003566443920135498, -0.00033048540353775024, -0.0003043264150619507, -0.0002781674265861511, -0.00025200843811035156, -0.000225849449634552, -0.00019969046115875244, -0.00017353147268295288, -0.00014737248420715332, -0.00012121349573135376, -9.50545072555542e-05, -6.889551877975464e-05, -4.273653030395508e-05, -1.6577541828155518e-05, 9.581446647644043e-06, 3.5740435123443604e-05, 6.189942359924316e-05, 8.805841207504272e-05, 0.00011421740055084229, 0.00014037638902664185, 0.0001665353775024414, 0.00019269436597824097, 0.00021885335445404053, 0.0002450123429298401, 0.00027117133140563965, 0.0002973303198814392, 0.00032348930835723877, 0.00034964829683303833, 0.0003758072853088379, 0.00040196627378463745, 0.000428125262260437, 0.00045428425073623657, 0.00048044323921203613, 0.0005066022276878357, 0.0005327612161636353, 0.0005589202046394348, 0.0005850791931152344]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 14.0, 22.0, 18.0, 41.0, 67.0, 87.0, 116.0, 207.0, 335.0, 536.0, 826.0, 1241.0, 2039.0, 3355.0, 5399.0, 8793.0, 14640.0, 24744.0, 42429.0, 72384.0, 119859.0, 173297.0, 189904.0, 150367.0, 97256.0, 57374.0, 33343.0, 19633.0, 11671.0, 7044.0, 4266.0, 2701.0, 1696.0, 1034.0, 641.0, 415.0, 265.0, 165.0, 122.0, 73.0, 41.0, 28.0, 23.0, 11.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0], "bins": [-9.765625, -9.47216796875, -9.1787109375, -8.88525390625, -8.591796875, -8.29833984375, -8.0048828125, -7.71142578125, -7.41796875, -7.12451171875, -6.8310546875, -6.53759765625, -6.244140625, -5.95068359375, -5.6572265625, -5.36376953125, -5.0703125, -4.77685546875, -4.4833984375, -4.18994140625, -3.896484375, -3.60302734375, -3.3095703125, -3.01611328125, -2.72265625, -2.42919921875, -2.1357421875, -1.84228515625, -1.548828125, -1.25537109375, -0.9619140625, -0.66845703125, -0.375, -0.08154296875, 0.2119140625, 0.50537109375, 0.798828125, 1.09228515625, 1.3857421875, 1.67919921875, 1.97265625, 2.26611328125, 2.5595703125, 2.85302734375, 3.146484375, 3.43994140625, 3.7333984375, 4.02685546875, 4.3203125, 4.61376953125, 4.9072265625, 5.20068359375, 5.494140625, 5.78759765625, 6.0810546875, 6.37451171875, 6.66796875, 6.96142578125, 7.2548828125, 7.54833984375, 7.841796875, 8.13525390625, 8.4287109375, 8.72216796875, 9.015625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 3.0, 7.0, 5.0, 6.0, 14.0, 11.0, 15.0, 10.0, 17.0, 18.0, 24.0, 23.0, 26.0, 24.0, 28.0, 30.0, 47.0, 51.0, 57.0, 42.0, 45.0, 48.0, 42.0, 37.0, 35.0, 44.0, 31.0, 41.0, 31.0, 24.0, 24.0, 20.0, 18.0, 18.0, 11.0, 17.0, 12.0, 9.0, 5.0, 2.0, 8.0, 11.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.29296875, -2.22393798828125, -2.1549072265625, -2.08587646484375, -2.016845703125, -1.94781494140625, -1.8787841796875, -1.80975341796875, -1.74072265625, -1.67169189453125, -1.6026611328125, -1.53363037109375, -1.464599609375, -1.39556884765625, -1.3265380859375, -1.25750732421875, -1.1884765625, -1.11944580078125, -1.0504150390625, -0.98138427734375, -0.912353515625, -0.84332275390625, -0.7742919921875, -0.70526123046875, -0.63623046875, -0.56719970703125, -0.4981689453125, -0.42913818359375, -0.360107421875, -0.29107666015625, -0.2220458984375, -0.15301513671875, -0.083984375, -0.01495361328125, 0.0540771484375, 0.12310791015625, 0.192138671875, 0.26116943359375, 0.3302001953125, 0.39923095703125, 0.46826171875, 0.53729248046875, 0.6063232421875, 0.67535400390625, 0.744384765625, 0.81341552734375, 0.8824462890625, 0.95147705078125, 1.0205078125, 1.08953857421875, 1.1585693359375, 1.22760009765625, 1.296630859375, 1.36566162109375, 1.4346923828125, 1.50372314453125, 1.57275390625, 1.64178466796875, 1.7108154296875, 1.77984619140625, 1.848876953125, 1.91790771484375, 1.9869384765625, 2.05596923828125, 2.125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 8.0, 10.0, 12.0, 11.0, 11.0, 9.0, 19.0, 28.0, 34.0, 48.0, 55.0, 48.0, 64.0, 61.0, 92.0, 75.0, 60.0, 63.0, 62.0, 46.0, 44.0, 28.0, 19.0, 21.0, 13.0, 9.0, 14.0, 4.0, 13.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.70714569091797, -43.313541412353516, -41.91993713378906, -40.526329040527344, -39.13272476196289, -37.73912048339844, -36.345516204833984, -34.95191192626953, -33.55830383300781, -32.16469955444336, -30.771093368530273, -29.37748908996582, -27.983882904052734, -26.59027862548828, -25.196674346923828, -23.803068161010742, -22.40946388244629, -21.015859603881836, -19.62225341796875, -18.228649139404297, -16.83504295349121, -15.441438674926758, -14.047833442687988, -12.654228210449219, -11.26062297821045, -9.86701774597168, -8.47341251373291, -7.079807758331299, -5.686202526092529, -4.29259729385376, -2.8989925384521484, -1.505387306213379, -0.11178207397460938, 1.2818230390548706, 2.6754281520843506, 4.069033145904541, 5.4626383781433105, 6.85624361038208, 8.249848365783691, 9.643453598022461, 11.03705883026123, 12.4306640625, 13.82426929473877, 15.217874526977539, 16.611478805541992, 18.005084991455078, 19.39868927001953, 20.792293548583984, 22.18589973449707, 23.579504013061523, 24.97311019897461, 26.366714477539062, 27.76032066345215, 29.1539249420166, 30.547531127929688, 31.94113540649414, 33.334739685058594, 34.72834396362305, 36.1219482421875, 37.51555633544922, 38.90916061401367, 40.302764892578125, 41.69636917114258, 43.08997344970703, 44.48358154296875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 3.0, 4.0, 5.0, 9.0, 9.0, 6.0, 11.0, 13.0, 11.0, 26.0, 15.0, 16.0, 22.0, 29.0, 39.0, 32.0, 36.0, 31.0, 40.0, 35.0, 46.0, 44.0, 48.0, 42.0, 41.0, 35.0, 48.0, 41.0, 35.0, 35.0, 28.0, 26.0, 28.0, 18.0, 17.0, 15.0, 7.0, 14.0, 11.0, 6.0, 5.0, 6.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.435171127319336, -18.831344604492188, -18.22751808166504, -17.62369155883789, -17.019865036010742, -16.416038513183594, -15.812211990356445, -15.208385467529297, -14.604558944702148, -14.000732421875, -13.396905899047852, -12.793079376220703, -12.189252853393555, -11.585426330566406, -10.981599807739258, -10.37777328491211, -9.773947715759277, -9.170121192932129, -8.56629467010498, -7.962468147277832, -7.358641624450684, -6.754815101623535, -6.150989055633545, -5.5471625328063965, -4.943336009979248, -4.3395094871521, -3.735682964324951, -3.131856679916382, -2.5280301570892334, -1.924203634262085, -1.3203773498535156, -0.7165508270263672, -0.11272430419921875, 0.4911021590232849, 1.0949286222457886, 1.6987550258636475, 2.302581548690796, 2.9064080715179443, 3.5102343559265137, 4.114060878753662, 4.7178874015808105, 5.321713924407959, 5.925540447235107, 6.529366493225098, 7.133193016052246, 7.7370195388793945, 8.340846061706543, 8.944672584533691, 9.54849910736084, 10.152325630187988, 10.756152153015137, 11.359978675842285, 11.963805198669434, 12.567631721496582, 13.171457290649414, 13.775283813476562, 14.379110336303711, 14.98293685913086, 15.586763381958008, 16.190589904785156, 16.794416427612305, 17.398242950439453, 18.0020694732666, 18.60589599609375, 19.2097225189209]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 1.0, 3.0, 8.0, 17.0, 14.0, 27.0, 50.0, 51.0, 90.0, 118.0, 193.0, 280.0, 473.0, 706.0, 1112.0, 1653.0, 2653.0, 4246.0, 6877.0, 11074.0, 17710.0, 28271.0, 43554.0, 66369.0, 95733.0, 124681.0, 143461.0, 139065.0, 115462.0, 84940.0, 57685.0, 37799.0, 23874.0, 15018.0, 9376.0, 5728.0, 3767.0, 2324.0, 1427.0, 941.0, 604.0, 388.0, 246.0, 155.0, 97.0, 92.0, 56.0, 31.0, 23.0, 17.0, 11.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.34375, -20.628173828125, -19.91259765625, -19.197021484375, -18.4814453125, -17.765869140625, -17.05029296875, -16.334716796875, -15.619140625, -14.903564453125, -14.18798828125, -13.472412109375, -12.7568359375, -12.041259765625, -11.32568359375, -10.610107421875, -9.89453125, -9.178955078125, -8.46337890625, -7.747802734375, -7.0322265625, -6.316650390625, -5.60107421875, -4.885498046875, -4.169921875, -3.454345703125, -2.73876953125, -2.023193359375, -1.3076171875, -0.592041015625, 0.12353515625, 0.839111328125, 1.5546875, 2.270263671875, 2.98583984375, 3.701416015625, 4.4169921875, 5.132568359375, 5.84814453125, 6.563720703125, 7.279296875, 7.994873046875, 8.71044921875, 9.426025390625, 10.1416015625, 10.857177734375, 11.57275390625, 12.288330078125, 13.00390625, 13.719482421875, 14.43505859375, 15.150634765625, 15.8662109375, 16.581787109375, 17.29736328125, 18.012939453125, 18.728515625, 19.444091796875, 20.15966796875, 20.875244140625, 21.5908203125, 22.306396484375, 23.02197265625, 23.737548828125, 24.453125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 11.0, 8.0, 10.0, 13.0, 14.0, 11.0, 18.0, 29.0, 23.0, 31.0, 34.0, 25.0, 31.0, 35.0, 42.0, 40.0, 42.0, 65.0, 46.0, 43.0, 37.0, 42.0, 39.0, 48.0, 41.0, 27.0, 25.0, 38.0, 17.0, 17.0, 14.0, 10.0, 18.0, 13.0, 12.0, 12.0, 4.0, 2.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.875, -23.161865234375, -22.44873046875, -21.735595703125, -21.0224609375, -20.309326171875, -19.59619140625, -18.883056640625, -18.169921875, -17.456787109375, -16.74365234375, -16.030517578125, -15.3173828125, -14.604248046875, -13.89111328125, -13.177978515625, -12.46484375, -11.751708984375, -11.03857421875, -10.325439453125, -9.6123046875, -8.899169921875, -8.18603515625, -7.472900390625, -6.759765625, -6.046630859375, -5.33349609375, -4.620361328125, -3.9072265625, -3.194091796875, -2.48095703125, -1.767822265625, -1.0546875, -0.341552734375, 0.37158203125, 1.084716796875, 1.7978515625, 2.510986328125, 3.22412109375, 3.937255859375, 4.650390625, 5.363525390625, 6.07666015625, 6.789794921875, 7.5029296875, 8.216064453125, 8.92919921875, 9.642333984375, 10.35546875, 11.068603515625, 11.78173828125, 12.494873046875, 13.2080078125, 13.921142578125, 14.63427734375, 15.347412109375, 16.060546875, 16.773681640625, 17.48681640625, 18.199951171875, 18.9130859375, 19.626220703125, 20.33935546875, 21.052490234375, 21.765625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 4.0, 14.0, 13.0, 28.0, 33.0, 43.0, 93.0, 115.0, 158.0, 283.0, 392.0, 610.0, 955.0, 1517.0, 2406.0, 3886.0, 6120.0, 9550.0, 14720.0, 22577.0, 34967.0, 51612.0, 74038.0, 100231.0, 124486.0, 135388.0, 125727.0, 103497.0, 77112.0, 54242.0, 36407.0, 24107.0, 15633.0, 10110.0, 6361.0, 4095.0, 2548.0, 1573.0, 1000.0, 665.0, 432.0, 281.0, 176.0, 100.0, 83.0, 51.0, 35.0, 20.0, 16.0, 18.0, 7.0, 2.0, 10.0, 4.0, 1.0, 4.0, 2.0], "bins": [-23.609375, -22.88427734375, -22.1591796875, -21.43408203125, -20.708984375, -19.98388671875, -19.2587890625, -18.53369140625, -17.80859375, -17.08349609375, -16.3583984375, -15.63330078125, -14.908203125, -14.18310546875, -13.4580078125, -12.73291015625, -12.0078125, -11.28271484375, -10.5576171875, -9.83251953125, -9.107421875, -8.38232421875, -7.6572265625, -6.93212890625, -6.20703125, -5.48193359375, -4.7568359375, -4.03173828125, -3.306640625, -2.58154296875, -1.8564453125, -1.13134765625, -0.40625, 0.31884765625, 1.0439453125, 1.76904296875, 2.494140625, 3.21923828125, 3.9443359375, 4.66943359375, 5.39453125, 6.11962890625, 6.8447265625, 7.56982421875, 8.294921875, 9.02001953125, 9.7451171875, 10.47021484375, 11.1953125, 11.92041015625, 12.6455078125, 13.37060546875, 14.095703125, 14.82080078125, 15.5458984375, 16.27099609375, 16.99609375, 17.72119140625, 18.4462890625, 19.17138671875, 19.896484375, 20.62158203125, 21.3466796875, 22.07177734375, 22.796875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 10.0, 11.0, 9.0, 9.0, 12.0, 13.0, 14.0, 19.0, 22.0, 24.0, 21.0, 27.0, 28.0, 30.0, 38.0, 33.0, 36.0, 33.0, 36.0, 42.0, 32.0, 36.0, 31.0, 30.0, 32.0, 43.0, 33.0, 36.0, 27.0, 22.0, 32.0, 18.0, 23.0, 15.0, 19.0, 18.0, 16.0, 15.0, 7.0, 9.0, 5.0, 0.0, 5.0, 7.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0], "bins": [-13.078125, -12.689453125, -12.30078125, -11.912109375, -11.5234375, -11.134765625, -10.74609375, -10.357421875, -9.96875, -9.580078125, -9.19140625, -8.802734375, -8.4140625, -8.025390625, -7.63671875, -7.248046875, -6.859375, -6.470703125, -6.08203125, -5.693359375, -5.3046875, -4.916015625, -4.52734375, -4.138671875, -3.75, -3.361328125, -2.97265625, -2.583984375, -2.1953125, -1.806640625, -1.41796875, -1.029296875, -0.640625, -0.251953125, 0.13671875, 0.525390625, 0.9140625, 1.302734375, 1.69140625, 2.080078125, 2.46875, 2.857421875, 3.24609375, 3.634765625, 4.0234375, 4.412109375, 4.80078125, 5.189453125, 5.578125, 5.966796875, 6.35546875, 6.744140625, 7.1328125, 7.521484375, 7.91015625, 8.298828125, 8.6875, 9.076171875, 9.46484375, 9.853515625, 10.2421875, 10.630859375, 11.01953125, 11.408203125, 11.796875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 9.0, 10.0, 9.0, 14.0, 16.0, 24.0, 43.0, 53.0, 88.0, 125.0, 189.0, 315.0, 417.0, 710.0, 1081.0, 1753.0, 3012.0, 4774.0, 8088.0, 14016.0, 24863.0, 44343.0, 79219.0, 136989.0, 208511.0, 206602.0, 133737.0, 77602.0, 43713.0, 24213.0, 13710.0, 7956.0, 4612.0, 2811.0, 1736.0, 1082.0, 755.0, 467.0, 296.0, 211.0, 140.0, 90.0, 59.0, 49.0, 15.0, 9.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0], "bins": [-22.375, -21.7353515625, -21.095703125, -20.4560546875, -19.81640625, -19.1767578125, -18.537109375, -17.8974609375, -17.2578125, -16.6181640625, -15.978515625, -15.3388671875, -14.69921875, -14.0595703125, -13.419921875, -12.7802734375, -12.140625, -11.5009765625, -10.861328125, -10.2216796875, -9.58203125, -8.9423828125, -8.302734375, -7.6630859375, -7.0234375, -6.3837890625, -5.744140625, -5.1044921875, -4.46484375, -3.8251953125, -3.185546875, -2.5458984375, -1.90625, -1.2666015625, -0.626953125, 0.0126953125, 0.65234375, 1.2919921875, 1.931640625, 2.5712890625, 3.2109375, 3.8505859375, 4.490234375, 5.1298828125, 5.76953125, 6.4091796875, 7.048828125, 7.6884765625, 8.328125, 8.9677734375, 9.607421875, 10.2470703125, 10.88671875, 11.5263671875, 12.166015625, 12.8056640625, 13.4453125, 14.0849609375, 14.724609375, 15.3642578125, 16.00390625, 16.6435546875, 17.283203125, 17.9228515625, 18.5625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 8.0, 9.0, 10.0, 17.0, 12.0, 22.0, 30.0, 37.0, 45.0, 73.0, 78.0, 77.0, 89.0, 79.0, 67.0, 63.0, 58.0, 44.0, 40.0, 38.0, 15.0, 21.0, 13.0, 6.0, 6.0, 12.0, 4.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023136138916015625, -0.0022360682487487793, -0.002158522605895996, -0.002080976963043213, -0.0020034313201904297, -0.0019258856773376465, -0.0018483400344848633, -0.00177079439163208, -0.0016932487487792969, -0.0016157031059265137, -0.0015381574630737305, -0.0014606118202209473, -0.001383066177368164, -0.0013055205345153809, -0.0012279748916625977, -0.0011504292488098145, -0.0010728836059570312, -0.000995337963104248, -0.0009177923202514648, -0.0008402466773986816, -0.0007627010345458984, -0.0006851553916931152, -0.000607609748840332, -0.0005300641059875488, -0.0004525184631347656, -0.0003749728202819824, -0.0002974271774291992, -0.00021988153457641602, -0.0001423358917236328, -6.479024887084961e-05, 1.2755393981933594e-05, 9.03010368347168e-05, 0.0001678466796875, 0.0002453923225402832, 0.0003229379653930664, 0.0004004836082458496, 0.0004780292510986328, 0.000555574893951416, 0.0006331205368041992, 0.0007106661796569824, 0.0007882118225097656, 0.0008657574653625488, 0.000943303108215332, 0.0010208487510681152, 0.0010983943939208984, 0.0011759400367736816, 0.0012534856796264648, 0.001331031322479248, 0.0014085769653320312, 0.0014861226081848145, 0.0015636682510375977, 0.0016412138938903809, 0.001718759536743164, 0.0017963051795959473, 0.0018738508224487305, 0.0019513964653015137, 0.002028942108154297, 0.00210648775100708, 0.0021840333938598633, 0.0022615790367126465, 0.0023391246795654297, 0.002416670322418213, 0.002494215965270996, 0.0025717616081237793, 0.0026493072509765625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 5.0, 11.0, 7.0, 14.0, 11.0, 22.0, 36.0, 47.0, 81.0, 104.0, 150.0, 216.0, 305.0, 491.0, 767.0, 1189.0, 1848.0, 2858.0, 4484.0, 7288.0, 11952.0, 19677.0, 33278.0, 56142.0, 95757.0, 152513.0, 198836.0, 174488.0, 114616.0, 68687.0, 40791.0, 23729.0, 14259.0, 8698.0, 5473.0, 3451.0, 2135.0, 1388.0, 924.0, 591.0, 428.0, 261.0, 189.0, 118.0, 74.0, 54.0, 35.0, 32.0, 19.0, 8.0, 10.0, 2.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.171875, -18.547119140625, -17.92236328125, -17.297607421875, -16.6728515625, -16.048095703125, -15.42333984375, -14.798583984375, -14.173828125, -13.549072265625, -12.92431640625, -12.299560546875, -11.6748046875, -11.050048828125, -10.42529296875, -9.800537109375, -9.17578125, -8.551025390625, -7.92626953125, -7.301513671875, -6.6767578125, -6.052001953125, -5.42724609375, -4.802490234375, -4.177734375, -3.552978515625, -2.92822265625, -2.303466796875, -1.6787109375, -1.053955078125, -0.42919921875, 0.195556640625, 0.8203125, 1.445068359375, 2.06982421875, 2.694580078125, 3.3193359375, 3.944091796875, 4.56884765625, 5.193603515625, 5.818359375, 6.443115234375, 7.06787109375, 7.692626953125, 8.3173828125, 8.942138671875, 9.56689453125, 10.191650390625, 10.81640625, 11.441162109375, 12.06591796875, 12.690673828125, 13.3154296875, 13.940185546875, 14.56494140625, 15.189697265625, 15.814453125, 16.439208984375, 17.06396484375, 17.688720703125, 18.3134765625, 18.938232421875, 19.56298828125, 20.187744140625, 20.8125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 13.0, 8.0, 8.0, 10.0, 17.0, 18.0, 23.0, 28.0, 35.0, 38.0, 41.0, 55.0, 55.0, 55.0, 48.0, 51.0, 56.0, 52.0, 54.0, 52.0, 52.0, 34.0, 35.0, 19.0, 23.0, 27.0, 14.0, 15.0, 12.0, 7.0, 16.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.059326171875, -4.86865234375, -4.677978515625, -4.4873046875, -4.296630859375, -4.10595703125, -3.915283203125, -3.724609375, -3.533935546875, -3.34326171875, -3.152587890625, -2.9619140625, -2.771240234375, -2.58056640625, -2.389892578125, -2.19921875, -2.008544921875, -1.81787109375, -1.627197265625, -1.4365234375, -1.245849609375, -1.05517578125, -0.864501953125, -0.673828125, -0.483154296875, -0.29248046875, -0.101806640625, 0.0888671875, 0.279541015625, 0.47021484375, 0.660888671875, 0.8515625, 1.042236328125, 1.23291015625, 1.423583984375, 1.6142578125, 1.804931640625, 1.99560546875, 2.186279296875, 2.376953125, 2.567626953125, 2.75830078125, 2.948974609375, 3.1396484375, 3.330322265625, 3.52099609375, 3.711669921875, 3.90234375, 4.093017578125, 4.28369140625, 4.474365234375, 4.6650390625, 4.855712890625, 5.04638671875, 5.237060546875, 5.427734375, 5.618408203125, 5.80908203125, 5.999755859375, 6.1904296875, 6.381103515625, 6.57177734375, 6.762451171875, 6.953125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 13.0, 9.0, 22.0, 15.0, 27.0, 32.0, 45.0, 41.0, 39.0, 46.0, 65.0, 66.0, 64.0, 50.0, 68.0, 58.0, 39.0, 49.0, 50.0, 30.0, 22.0, 25.0, 22.0, 19.0, 19.0, 10.0, 7.0, 3.0, 4.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-43.08380126953125, -41.820255279541016, -40.55670928955078, -39.29316329956055, -38.02961730957031, -36.76606750488281, -35.50252151489258, -34.238975524902344, -32.97542953491211, -31.711883544921875, -30.44833755493164, -29.184789657592773, -27.92124366760254, -26.657697677612305, -25.394149780273438, -24.130603790283203, -22.86705780029297, -21.603511810302734, -20.3399658203125, -19.076417922973633, -17.8128719329834, -16.549325942993164, -15.285778999328613, -14.022232055664062, -12.758686065673828, -11.495140075683594, -10.231593132019043, -8.968046188354492, -7.704500198364258, -6.440953731536865, -5.177407264709473, -3.913860321044922, -2.650310516357422, -1.3867640495300293, -0.12321758270263672, 1.1403288841247559, 2.4038753509521484, 3.667421817779541, 4.930968284606934, 6.194515228271484, 7.458061218261719, 8.721607208251953, 9.985154151916504, 11.248701095581055, 12.512247085571289, 13.775793075561523, 15.039340019226074, 16.302886962890625, 17.56643295288086, 18.829978942871094, 20.093524932861328, 21.357072830200195, 22.62061882019043, 23.884164810180664, 25.14771270751953, 26.411258697509766, 27.6748046875, 28.938350677490234, 30.20189666748047, 31.465444564819336, 32.72898864746094, 33.99253845214844, 35.25608444213867, 36.519630432128906, 37.78317642211914]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 3.0, 5.0, 10.0, 9.0, 17.0, 9.0, 12.0, 23.0, 21.0, 20.0, 22.0, 31.0, 26.0, 28.0, 30.0, 28.0, 35.0, 31.0, 42.0, 30.0, 38.0, 48.0, 42.0, 34.0, 43.0, 40.0, 28.0, 36.0, 28.0, 29.0, 27.0, 23.0, 23.0, 17.0, 12.0, 20.0, 11.0, 15.0, 11.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.468355178833008, -17.85744285583496, -17.246530532836914, -16.635618209838867, -16.02470588684082, -15.413792610168457, -14.80288028717041, -14.191967010498047, -13.5810546875, -12.970142364501953, -12.359230041503906, -11.74831771850586, -11.137404441833496, -10.52649211883545, -9.915579795837402, -9.304666519165039, -8.693755149841309, -8.082842826843262, -7.471930027008057, -6.86101770401001, -6.250104904174805, -5.639192581176758, -5.028280258178711, -4.417367458343506, -3.806455135345459, -3.195542573928833, -2.584630012512207, -1.9737176895141602, -1.3628051280975342, -0.7518925666809082, -0.14098024368286133, 0.46993255615234375, 1.0808448791503906, 1.6917574405670166, 2.3026700019836426, 2.9135823249816895, 3.5244948863983154, 4.135407447814941, 4.746319770812988, 5.357232570648193, 5.96814489364624, 6.579057216644287, 7.189970016479492, 7.800882339477539, 8.411794662475586, 9.022706985473633, 9.63361930847168, 10.244532585144043, 10.85544490814209, 11.466357231140137, 12.077269554138184, 12.688182830810547, 13.299095153808594, 13.91000747680664, 14.520919799804688, 15.131832122802734, 15.742744445800781, 16.353656768798828, 16.964569091796875, 17.575481414794922, 18.18639373779297, 18.797306060791016, 19.408218383789062, 20.019132614135742, 20.63004493713379]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 6.0, 8.0, 12.0, 21.0, 32.0, 54.0, 75.0, 93.0, 172.0, 235.0, 333.0, 488.0, 763.0, 1169.0, 1918.0, 2862.0, 4614.0, 7404.0, 12280.0, 21128.0, 37721.0, 69967.0, 136537.0, 282396.0, 590653.0, 1001840.0, 950315.0, 532218.0, 256779.0, 127270.0, 66374.0, 35957.0, 20584.0, 11912.0, 7260.0, 4539.0, 2979.0, 1829.0, 1184.0, 760.0, 518.0, 354.0, 236.0, 155.0, 98.0, 55.0, 39.0, 34.0, 13.0, 19.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.90625, -40.59375, -39.28125, -37.96875, -36.65625, -35.34375, -34.03125, -32.71875, -31.40625, -30.09375, -28.78125, -27.46875, -26.15625, -24.84375, -23.53125, -22.21875, -20.90625, -19.59375, -18.28125, -16.96875, -15.65625, -14.34375, -13.03125, -11.71875, -10.40625, -9.09375, -7.78125, -6.46875, -5.15625, -3.84375, -2.53125, -1.21875, 0.09375, 1.40625, 2.71875, 4.03125, 5.34375, 6.65625, 7.96875, 9.28125, 10.59375, 11.90625, 13.21875, 14.53125, 15.84375, 17.15625, 18.46875, 19.78125, 21.09375, 22.40625, 23.71875, 25.03125, 26.34375, 27.65625, 28.96875, 30.28125, 31.59375, 32.90625, 34.21875, 35.53125, 36.84375, 38.15625, 39.46875, 40.78125, 42.09375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 8.0, 7.0, 8.0, 14.0, 8.0, 15.0, 23.0, 16.0, 14.0, 34.0, 31.0, 19.0, 37.0, 26.0, 40.0, 36.0, 24.0, 26.0, 45.0, 35.0, 41.0, 36.0, 31.0, 52.0, 47.0, 31.0, 33.0, 38.0, 26.0, 26.0, 20.0, 20.0, 21.0, 12.0, 12.0, 14.0, 17.0, 14.0, 5.0, 7.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.28125, -17.7041015625, -17.126953125, -16.5498046875, -15.97265625, -15.3955078125, -14.818359375, -14.2412109375, -13.6640625, -13.0869140625, -12.509765625, -11.9326171875, -11.35546875, -10.7783203125, -10.201171875, -9.6240234375, -9.046875, -8.4697265625, -7.892578125, -7.3154296875, -6.73828125, -6.1611328125, -5.583984375, -5.0068359375, -4.4296875, -3.8525390625, -3.275390625, -2.6982421875, -2.12109375, -1.5439453125, -0.966796875, -0.3896484375, 0.1875, 0.7646484375, 1.341796875, 1.9189453125, 2.49609375, 3.0732421875, 3.650390625, 4.2275390625, 4.8046875, 5.3818359375, 5.958984375, 6.5361328125, 7.11328125, 7.6904296875, 8.267578125, 8.8447265625, 9.421875, 9.9990234375, 10.576171875, 11.1533203125, 11.73046875, 12.3076171875, 12.884765625, 13.4619140625, 14.0390625, 14.6162109375, 15.193359375, 15.7705078125, 16.34765625, 16.9248046875, 17.501953125, 18.0791015625, 18.65625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 10.0, 11.0, 9.0, 25.0, 26.0, 35.0, 59.0, 77.0, 102.0, 163.0, 242.0, 302.0, 520.0, 673.0, 995.0, 1495.0, 2145.0, 3416.0, 5336.0, 8252.0, 13418.0, 22692.0, 38614.0, 68958.0, 127282.0, 244231.0, 480860.0, 853872.0, 982046.0, 631984.0, 326818.0, 166949.0, 89392.0, 49252.0, 28424.0, 16527.0, 10248.0, 6538.0, 4090.0, 2737.0, 1771.0, 1147.0, 744.0, 565.0, 374.0, 244.0, 193.0, 128.0, 80.0, 71.0, 52.0, 29.0, 17.0, 18.0, 15.0, 8.0, 6.0, 3.0, 3.0, 1.0], "bins": [-53.96875, -52.29345703125, -50.6181640625, -48.94287109375, -47.267578125, -45.59228515625, -43.9169921875, -42.24169921875, -40.56640625, -38.89111328125, -37.2158203125, -35.54052734375, -33.865234375, -32.18994140625, -30.5146484375, -28.83935546875, -27.1640625, -25.48876953125, -23.8134765625, -22.13818359375, -20.462890625, -18.78759765625, -17.1123046875, -15.43701171875, -13.76171875, -12.08642578125, -10.4111328125, -8.73583984375, -7.060546875, -5.38525390625, -3.7099609375, -2.03466796875, -0.359375, 1.31591796875, 2.9912109375, 4.66650390625, 6.341796875, 8.01708984375, 9.6923828125, 11.36767578125, 13.04296875, 14.71826171875, 16.3935546875, 18.06884765625, 19.744140625, 21.41943359375, 23.0947265625, 24.77001953125, 26.4453125, 28.12060546875, 29.7958984375, 31.47119140625, 33.146484375, 34.82177734375, 36.4970703125, 38.17236328125, 39.84765625, 41.52294921875, 43.1982421875, 44.87353515625, 46.548828125, 48.22412109375, 49.8994140625, 51.57470703125, 53.25]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 9.0, 12.0, 18.0, 20.0, 25.0, 59.0, 51.0, 91.0, 102.0, 132.0, 146.0, 192.0, 286.0, 311.0, 309.0, 321.0, 328.0, 288.0, 233.0, 250.0, 182.0, 149.0, 124.0, 98.0, 78.0, 55.0, 45.0, 37.0, 21.0, 17.0, 15.0, 14.0, 12.0, 13.0, 3.0, 6.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.625, -17.07275390625, -16.5205078125, -15.96826171875, -15.416015625, -14.86376953125, -14.3115234375, -13.75927734375, -13.20703125, -12.65478515625, -12.1025390625, -11.55029296875, -10.998046875, -10.44580078125, -9.8935546875, -9.34130859375, -8.7890625, -8.23681640625, -7.6845703125, -7.13232421875, -6.580078125, -6.02783203125, -5.4755859375, -4.92333984375, -4.37109375, -3.81884765625, -3.2666015625, -2.71435546875, -2.162109375, -1.60986328125, -1.0576171875, -0.50537109375, 0.046875, 0.59912109375, 1.1513671875, 1.70361328125, 2.255859375, 2.80810546875, 3.3603515625, 3.91259765625, 4.46484375, 5.01708984375, 5.5693359375, 6.12158203125, 6.673828125, 7.22607421875, 7.7783203125, 8.33056640625, 8.8828125, 9.43505859375, 9.9873046875, 10.53955078125, 11.091796875, 11.64404296875, 12.1962890625, 12.74853515625, 13.30078125, 13.85302734375, 14.4052734375, 14.95751953125, 15.509765625, 16.06201171875, 16.6142578125, 17.16650390625, 17.71875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 6.0, 5.0, 11.0, 15.0, 9.0, 17.0, 18.0, 29.0, 25.0, 41.0, 61.0, 50.0, 47.0, 64.0, 69.0, 77.0, 58.0, 78.0, 55.0, 54.0, 35.0, 33.0, 27.0, 21.0, 20.0, 18.0, 14.0, 9.0, 5.0, 7.0, 2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.71512985229492, -55.800018310546875, -53.88490676879883, -51.96979522705078, -50.0546875, -48.13957214355469, -46.224464416503906, -44.30935287475586, -42.39424133300781, -40.479129791259766, -38.56401824951172, -36.64890670776367, -34.733795166015625, -32.818687438964844, -30.903575897216797, -28.98846435546875, -27.073352813720703, -25.158241271972656, -23.24312973022461, -21.328020095825195, -19.41290855407715, -17.4977970123291, -15.582686424255371, -13.66757583618164, -11.752464294433594, -9.837352752685547, -7.922242164611816, -6.007131099700928, -4.092020034790039, -2.176908493041992, -0.2617979049682617, 1.6533126831054688, 3.5684280395507812, 5.48353910446167, 7.398650169372559, 9.313760757446289, 11.228872299194336, 13.143983840942383, 15.059094429016113, 16.974205017089844, 18.88931655883789, 20.804428100585938, 22.719539642333984, 24.6346492767334, 26.549760818481445, 28.464872360229492, 30.379981994628906, 32.29509353637695, 34.210205078125, 36.12531661987305, 38.040428161621094, 39.95553970336914, 41.87065124511719, 43.78575897216797, 45.700870513916016, 47.61598205566406, 49.53109359741211, 51.446205139160156, 53.3613166809082, 55.27642822265625, 57.19153594970703, 59.106651306152344, 61.021759033203125, 62.93687057495117, 64.85198211669922]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 5.0, 5.0, 15.0, 10.0, 19.0, 22.0, 26.0, 14.0, 22.0, 33.0, 41.0, 26.0, 41.0, 41.0, 48.0, 45.0, 47.0, 39.0, 46.0, 53.0, 27.0, 39.0, 43.0, 35.0, 38.0, 33.0, 22.0, 26.0, 25.0, 25.0, 15.0, 8.0, 9.0, 11.0, 8.0, 10.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.67736053466797, -28.741315841674805, -27.80527114868164, -26.869226455688477, -25.933181762695312, -24.997135162353516, -24.06109046936035, -23.125045776367188, -22.189001083374023, -21.25295639038086, -20.316911697387695, -19.38086700439453, -18.444820404052734, -17.508777618408203, -16.572731018066406, -15.636686325073242, -14.700641632080078, -13.764596939086914, -12.82855224609375, -11.89250659942627, -10.956461906433105, -10.020417213439941, -9.084371566772461, -8.148326873779297, -7.212282180786133, -6.276237487792969, -5.3401923179626465, -4.404147148132324, -3.46810245513916, -2.532057762145996, -1.5960125923156738, -0.6599674224853516, 0.2760772705078125, 1.2121222019195557, 2.148167133331299, 3.084212064743042, 4.020256996154785, 4.956301689147949, 5.8923468589782715, 6.828392028808594, 7.764436721801758, 8.700481414794922, 9.636526107788086, 10.572571754455566, 11.50861644744873, 12.444661140441895, 13.380706787109375, 14.316751480102539, 15.252796173095703, 16.188840866088867, 17.12488555908203, 18.060930252075195, 18.99697494506836, 19.933021545410156, 20.86906623840332, 21.805110931396484, 22.74115562438965, 23.677200317382812, 24.613245010375977, 25.54928970336914, 26.485336303710938, 27.42137908935547, 28.357425689697266, 29.29347038269043, 30.229515075683594]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 9.0, 10.0, 10.0, 23.0, 46.0, 37.0, 60.0, 79.0, 115.0, 200.0, 317.0, 462.0, 747.0, 1275.0, 2083.0, 3596.0, 6684.0, 12752.0, 24701.0, 51566.0, 107161.0, 201498.0, 259158.0, 185653.0, 96170.0, 46027.0, 22412.0, 11288.0, 6020.0, 3291.0, 1992.0, 1114.0, 682.0, 410.0, 283.0, 162.0, 139.0, 90.0, 52.0, 45.0, 26.0, 34.0, 18.0, 19.0, 4.0, 11.0, 6.0, 2.0, 2.0, 3.0, 4.0], "bins": [-38.5625, -37.473876953125, -36.38525390625, -35.296630859375, -34.2080078125, -33.119384765625, -32.03076171875, -30.942138671875, -29.853515625, -28.764892578125, -27.67626953125, -26.587646484375, -25.4990234375, -24.410400390625, -23.32177734375, -22.233154296875, -21.14453125, -20.055908203125, -18.96728515625, -17.878662109375, -16.7900390625, -15.701416015625, -14.61279296875, -13.524169921875, -12.435546875, -11.346923828125, -10.25830078125, -9.169677734375, -8.0810546875, -6.992431640625, -5.90380859375, -4.815185546875, -3.7265625, -2.637939453125, -1.54931640625, -0.460693359375, 0.6279296875, 1.716552734375, 2.80517578125, 3.893798828125, 4.982421875, 6.071044921875, 7.15966796875, 8.248291015625, 9.3369140625, 10.425537109375, 11.51416015625, 12.602783203125, 13.69140625, 14.780029296875, 15.86865234375, 16.957275390625, 18.0458984375, 19.134521484375, 20.22314453125, 21.311767578125, 22.400390625, 23.489013671875, 24.57763671875, 25.666259765625, 26.7548828125, 27.843505859375, 28.93212890625, 30.020751953125, 31.109375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 6.0, 9.0, 15.0, 15.0, 13.0, 26.0, 32.0, 28.0, 35.0, 26.0, 40.0, 53.0, 63.0, 51.0, 64.0, 56.0, 49.0, 48.0, 56.0, 52.0, 36.0, 33.0, 44.0, 25.0, 18.0, 18.0, 20.0, 13.0, 13.0, 9.0, 7.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.46875, -39.20703125, -37.9453125, -36.68359375, -35.421875, -34.16015625, -32.8984375, -31.63671875, -30.375, -29.11328125, -27.8515625, -26.58984375, -25.328125, -24.06640625, -22.8046875, -21.54296875, -20.28125, -19.01953125, -17.7578125, -16.49609375, -15.234375, -13.97265625, -12.7109375, -11.44921875, -10.1875, -8.92578125, -7.6640625, -6.40234375, -5.140625, -3.87890625, -2.6171875, -1.35546875, -0.09375, 1.16796875, 2.4296875, 3.69140625, 4.953125, 6.21484375, 7.4765625, 8.73828125, 10.0, 11.26171875, 12.5234375, 13.78515625, 15.046875, 16.30859375, 17.5703125, 18.83203125, 20.09375, 21.35546875, 22.6171875, 23.87890625, 25.140625, 26.40234375, 27.6640625, 28.92578125, 30.1875, 31.44921875, 32.7109375, 33.97265625, 35.234375, 36.49609375, 37.7578125, 39.01953125, 40.28125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 6.0, 5.0, 8.0, 9.0, 23.0, 39.0, 39.0, 71.0, 80.0, 112.0, 186.0, 258.0, 378.0, 536.0, 827.0, 1233.0, 1871.0, 3018.0, 5083.0, 9185.0, 17091.0, 35353.0, 76162.0, 166436.0, 284794.0, 228921.0, 111931.0, 50897.0, 24129.0, 12272.0, 6581.0, 3947.0, 2362.0, 1541.0, 999.0, 680.0, 475.0, 307.0, 203.0, 174.0, 107.0, 82.0, 39.0, 39.0, 30.0, 14.0, 13.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.0791015625, -33.814453125, -32.5498046875, -31.28515625, -30.0205078125, -28.755859375, -27.4912109375, -26.2265625, -24.9619140625, -23.697265625, -22.4326171875, -21.16796875, -19.9033203125, -18.638671875, -17.3740234375, -16.109375, -14.8447265625, -13.580078125, -12.3154296875, -11.05078125, -9.7861328125, -8.521484375, -7.2568359375, -5.9921875, -4.7275390625, -3.462890625, -2.1982421875, -0.93359375, 0.3310546875, 1.595703125, 2.8603515625, 4.125, 5.3896484375, 6.654296875, 7.9189453125, 9.18359375, 10.4482421875, 11.712890625, 12.9775390625, 14.2421875, 15.5068359375, 16.771484375, 18.0361328125, 19.30078125, 20.5654296875, 21.830078125, 23.0947265625, 24.359375, 25.6240234375, 26.888671875, 28.1533203125, 29.41796875, 30.6826171875, 31.947265625, 33.2119140625, 34.4765625, 35.7412109375, 37.005859375, 38.2705078125, 39.53515625, 40.7998046875, 42.064453125, 43.3291015625, 44.59375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 4.0, 10.0, 10.0, 11.0, 9.0, 19.0, 12.0, 18.0, 23.0, 25.0, 29.0, 28.0, 35.0, 32.0, 53.0, 44.0, 37.0, 42.0, 31.0, 39.0, 43.0, 49.0, 39.0, 43.0, 49.0, 39.0, 31.0, 26.0, 32.0, 28.0, 24.0, 16.0, 6.0, 11.0, 11.0, 12.0, 7.0, 7.0, 4.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.328125, -16.72265625, -16.1171875, -15.51171875, -14.90625, -14.30078125, -13.6953125, -13.08984375, -12.484375, -11.87890625, -11.2734375, -10.66796875, -10.0625, -9.45703125, -8.8515625, -8.24609375, -7.640625, -7.03515625, -6.4296875, -5.82421875, -5.21875, -4.61328125, -4.0078125, -3.40234375, -2.796875, -2.19140625, -1.5859375, -0.98046875, -0.375, 0.23046875, 0.8359375, 1.44140625, 2.046875, 2.65234375, 3.2578125, 3.86328125, 4.46875, 5.07421875, 5.6796875, 6.28515625, 6.890625, 7.49609375, 8.1015625, 8.70703125, 9.3125, 9.91796875, 10.5234375, 11.12890625, 11.734375, 12.33984375, 12.9453125, 13.55078125, 14.15625, 14.76171875, 15.3671875, 15.97265625, 16.578125, 17.18359375, 17.7890625, 18.39453125, 19.0, 19.60546875, 20.2109375, 20.81640625, 21.421875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 2.0, 10.0, 11.0, 15.0, 29.0, 42.0, 56.0, 85.0, 135.0, 242.0, 356.0, 546.0, 902.0, 1585.0, 2711.0, 4909.0, 8827.0, 16014.0, 30717.0, 59821.0, 120098.0, 233612.0, 266382.0, 148419.0, 73170.0, 36775.0, 19175.0, 10417.0, 5702.0, 3086.0, 1821.0, 1102.0, 694.0, 349.0, 257.0, 166.0, 123.0, 53.0, 46.0, 36.0, 22.0, 13.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.4609375, -14.0111083984375, -13.561279296875, -13.1114501953125, -12.66162109375, -12.2117919921875, -11.761962890625, -11.3121337890625, -10.8623046875, -10.4124755859375, -9.962646484375, -9.5128173828125, -9.06298828125, -8.6131591796875, -8.163330078125, -7.7135009765625, -7.263671875, -6.8138427734375, -6.364013671875, -5.9141845703125, -5.46435546875, -5.0145263671875, -4.564697265625, -4.1148681640625, -3.6650390625, -3.2152099609375, -2.765380859375, -2.3155517578125, -1.86572265625, -1.4158935546875, -0.966064453125, -0.5162353515625, -0.06640625, 0.3834228515625, 0.833251953125, 1.2830810546875, 1.73291015625, 2.1827392578125, 2.632568359375, 3.0823974609375, 3.5322265625, 3.9820556640625, 4.431884765625, 4.8817138671875, 5.33154296875, 5.7813720703125, 6.231201171875, 6.6810302734375, 7.130859375, 7.5806884765625, 8.030517578125, 8.4803466796875, 8.93017578125, 9.3800048828125, 9.829833984375, 10.2796630859375, 10.7294921875, 11.1793212890625, 11.629150390625, 12.0789794921875, 12.52880859375, 12.9786376953125, 13.428466796875, 13.8782958984375, 14.328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 11.0, 17.0, 25.0, 33.0, 31.0, 43.0, 53.0, 63.0, 60.0, 68.0, 84.0, 74.0, 57.0, 81.0, 54.0, 37.0, 32.0, 30.0, 25.0, 17.0, 15.0, 15.0, 9.0, 3.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010166168212890625, -0.0009861737489700317, -0.000955730676651001, -0.0009252876043319702, -0.0008948445320129395, -0.0008644014596939087, -0.0008339583873748779, -0.0008035153150558472, -0.0007730722427368164, -0.0007426291704177856, -0.0007121860980987549, -0.0006817430257797241, -0.0006512999534606934, -0.0006208568811416626, -0.0005904138088226318, -0.0005599707365036011, -0.0005295276641845703, -0.0004990845918655396, -0.0004686415195465088, -0.00043819844722747803, -0.00040775537490844727, -0.0003773123025894165, -0.00034686923027038574, -0.000316426157951355, -0.0002859830856323242, -0.00025554001331329346, -0.0002250969409942627, -0.00019465386867523193, -0.00016421079635620117, -0.0001337677240371704, -0.00010332465171813965, -7.288157939910889e-05, -4.2438507080078125e-05, -1.1995434761047363e-05, 1.84476375579834e-05, 4.889070987701416e-05, 7.933378219604492e-05, 0.00010977685451507568, 0.00014021992683410645, 0.0001706629991531372, 0.00020110607147216797, 0.00023154914379119873, 0.0002619922161102295, 0.00029243528842926025, 0.000322878360748291, 0.0003533214330673218, 0.00038376450538635254, 0.0004142075777053833, 0.00044465065002441406, 0.0004750937223434448, 0.0005055367946624756, 0.0005359798669815063, 0.0005664229393005371, 0.0005968660116195679, 0.0006273090839385986, 0.0006577521562576294, 0.0006881952285766602, 0.0007186383008956909, 0.0007490813732147217, 0.0007795244455337524, 0.0008099675178527832, 0.000840410590171814, 0.0008708536624908447, 0.0009012967348098755, 0.0009317398071289062]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 11.0, 12.0, 25.0, 20.0, 41.0, 51.0, 84.0, 112.0, 146.0, 232.0, 316.0, 447.0, 664.0, 1024.0, 1530.0, 2390.0, 3697.0, 6113.0, 10086.0, 16336.0, 28105.0, 48284.0, 81123.0, 129324.0, 177759.0, 182732.0, 138100.0, 88541.0, 53574.0, 30779.0, 17887.0, 10627.0, 6548.0, 4098.0, 2626.0, 1751.0, 1055.0, 745.0, 479.0, 328.0, 237.0, 151.0, 115.0, 80.0, 57.0, 43.0, 26.0, 16.0, 10.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0], "bins": [-13.0546875, -12.6478271484375, -12.240966796875, -11.8341064453125, -11.42724609375, -11.0203857421875, -10.613525390625, -10.2066650390625, -9.7998046875, -9.3929443359375, -8.986083984375, -8.5792236328125, -8.17236328125, -7.7655029296875, -7.358642578125, -6.9517822265625, -6.544921875, -6.1380615234375, -5.731201171875, -5.3243408203125, -4.91748046875, -4.5106201171875, -4.103759765625, -3.6968994140625, -3.2900390625, -2.8831787109375, -2.476318359375, -2.0694580078125, -1.66259765625, -1.2557373046875, -0.848876953125, -0.4420166015625, -0.03515625, 0.3717041015625, 0.778564453125, 1.1854248046875, 1.59228515625, 1.9991455078125, 2.406005859375, 2.8128662109375, 3.2197265625, 3.6265869140625, 4.033447265625, 4.4403076171875, 4.84716796875, 5.2540283203125, 5.660888671875, 6.0677490234375, 6.474609375, 6.8814697265625, 7.288330078125, 7.6951904296875, 8.10205078125, 8.5089111328125, 8.915771484375, 9.3226318359375, 9.7294921875, 10.1363525390625, 10.543212890625, 10.9500732421875, 11.35693359375, 11.7637939453125, 12.170654296875, 12.5775146484375, 12.984375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 5.0, 12.0, 17.0, 20.0, 23.0, 23.0, 32.0, 46.0, 52.0, 56.0, 50.0, 58.0, 63.0, 77.0, 73.0, 74.0, 55.0, 58.0, 32.0, 42.0, 20.0, 25.0, 20.0, 12.0, 9.0, 11.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.03692626953125, -3.8980712890625, -3.75921630859375, -3.620361328125, -3.48150634765625, -3.3426513671875, -3.20379638671875, -3.06494140625, -2.92608642578125, -2.7872314453125, -2.64837646484375, -2.509521484375, -2.37066650390625, -2.2318115234375, -2.09295654296875, -1.9541015625, -1.81524658203125, -1.6763916015625, -1.53753662109375, -1.398681640625, -1.25982666015625, -1.1209716796875, -0.98211669921875, -0.84326171875, -0.70440673828125, -0.5655517578125, -0.42669677734375, -0.287841796875, -0.14898681640625, -0.0101318359375, 0.12872314453125, 0.267578125, 0.40643310546875, 0.5452880859375, 0.68414306640625, 0.822998046875, 0.96185302734375, 1.1007080078125, 1.23956298828125, 1.37841796875, 1.51727294921875, 1.6561279296875, 1.79498291015625, 1.933837890625, 2.07269287109375, 2.2115478515625, 2.35040283203125, 2.4892578125, 2.62811279296875, 2.7669677734375, 2.90582275390625, 3.044677734375, 3.18353271484375, 3.3223876953125, 3.46124267578125, 3.60009765625, 3.73895263671875, 3.8778076171875, 4.01666259765625, 4.155517578125, 4.29437255859375, 4.4332275390625, 4.57208251953125, 4.7109375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 4.0, 5.0, 9.0, 9.0, 12.0, 11.0, 18.0, 18.0, 27.0, 27.0, 47.0, 50.0, 53.0, 56.0, 72.0, 62.0, 72.0, 71.0, 63.0, 62.0, 38.0, 46.0, 31.0, 31.0, 19.0, 21.0, 12.0, 13.0, 13.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.996620178222656, -56.07065963745117, -54.14469909667969, -52.21874237060547, -50.292781829833984, -48.3668212890625, -46.440860748291016, -44.51490020751953, -42.58894348144531, -40.66298294067383, -38.737022399902344, -36.811065673828125, -34.88510513305664, -32.959144592285156, -31.033184051513672, -29.10722541809082, -27.181264877319336, -25.25530433654785, -23.329345703125, -21.403385162353516, -19.477426528930664, -17.55146598815918, -15.625506401062012, -13.699546813964844, -11.773587226867676, -9.847627639770508, -7.92166805267334, -5.995707988739014, -4.069748401641846, -2.1437883377075195, -0.21782875061035156, 1.7081308364868164, 3.6340904235839844, 5.560050010681152, 7.48600959777832, 9.411970138549805, 11.337928771972656, 13.26388931274414, 15.189848899841309, 17.115808486938477, 19.041767120361328, 20.967727661132812, 22.893686294555664, 24.81964683532715, 26.74560546875, 28.671566009521484, 30.59752655029297, 32.52348327636719, 34.44944763183594, 36.37540817260742, 38.301368713378906, 40.227325439453125, 42.15328598022461, 44.079246520996094, 46.00520706176758, 47.93116760253906, 49.85712432861328, 51.783084869384766, 53.70904541015625, 55.63500213623047, 57.56096267700195, 59.48692321777344, 61.41288375854492, 63.338844299316406, 65.26480102539062]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 2.0, 13.0, 8.0, 22.0, 17.0, 20.0, 26.0, 24.0, 29.0, 33.0, 31.0, 35.0, 41.0, 57.0, 43.0, 48.0, 43.0, 44.0, 48.0, 40.0, 40.0, 36.0, 40.0, 40.0, 22.0, 33.0, 21.0, 27.0, 26.0, 15.0, 8.0, 11.0, 9.0, 7.0, 8.0, 8.0, 1.0, 1.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.31357765197754, -29.365747451782227, -28.41791534423828, -27.47008514404297, -26.522254943847656, -25.574424743652344, -24.6265926361084, -23.678762435913086, -22.73093032836914, -21.783100128173828, -20.835268020629883, -19.88743782043457, -18.939607620239258, -17.991775512695312, -17.0439453125, -16.096115112304688, -15.148284912109375, -14.200453758239746, -13.252623558044434, -12.304792404174805, -11.356962203979492, -10.409131050109863, -9.461299896240234, -8.513469696044922, -7.565638542175293, -6.617807865142822, -5.669977188110352, -4.722146034240723, -3.774315357208252, -2.8264846801757812, -1.8786535263061523, -0.9308228492736816, 0.017009735107421875, 0.9648405313491821, 1.9126713275909424, 2.860502243041992, 3.808332920074463, 4.756163597106934, 5.7039947509765625, 6.651825428009033, 7.599656105041504, 8.547487258911133, 9.495317459106445, 10.443148612976074, 11.390979766845703, 12.338809967041016, 13.286641120910645, 14.234472274780273, 15.182302474975586, 16.1301326751709, 17.077964782714844, 18.025794982910156, 18.97362518310547, 19.92145538330078, 20.869287490844727, 21.81711769104004, 22.764949798583984, 23.712779998779297, 24.660612106323242, 25.608442306518555, 26.556272506713867, 27.504104614257812, 28.451934814453125, 29.399765014648438, 30.34759521484375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 10.0, 17.0, 27.0, 35.0, 55.0, 85.0, 105.0, 193.0, 241.0, 338.0, 556.0, 852.0, 1323.0, 2004.0, 3397.0, 5505.0, 9227.0, 15639.0, 26672.0, 45988.0, 77027.0, 118631.0, 159962.0, 173651.0, 147509.0, 103010.0, 63736.0, 37880.0, 21802.0, 12720.0, 7514.0, 4577.0, 2934.0, 1847.0, 1163.0, 779.0, 479.0, 344.0, 220.0, 157.0, 104.0, 75.0, 52.0, 37.0, 23.0, 22.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-40.375, -39.1259765625, -37.876953125, -36.6279296875, -35.37890625, -34.1298828125, -32.880859375, -31.6318359375, -30.3828125, -29.1337890625, -27.884765625, -26.6357421875, -25.38671875, -24.1376953125, -22.888671875, -21.6396484375, -20.390625, -19.1416015625, -17.892578125, -16.6435546875, -15.39453125, -14.1455078125, -12.896484375, -11.6474609375, -10.3984375, -9.1494140625, -7.900390625, -6.6513671875, -5.40234375, -4.1533203125, -2.904296875, -1.6552734375, -0.40625, 0.8427734375, 2.091796875, 3.3408203125, 4.58984375, 5.8388671875, 7.087890625, 8.3369140625, 9.5859375, 10.8349609375, 12.083984375, 13.3330078125, 14.58203125, 15.8310546875, 17.080078125, 18.3291015625, 19.578125, 20.8271484375, 22.076171875, 23.3251953125, 24.57421875, 25.8232421875, 27.072265625, 28.3212890625, 29.5703125, 30.8193359375, 32.068359375, 33.3173828125, 34.56640625, 35.8154296875, 37.064453125, 38.3134765625, 39.5625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 5.0, 14.0, 7.0, 8.0, 12.0, 18.0, 16.0, 21.0, 22.0, 26.0, 40.0, 39.0, 44.0, 35.0, 33.0, 43.0, 44.0, 49.0, 44.0, 42.0, 48.0, 39.0, 38.0, 29.0, 47.0, 33.0, 21.0, 33.0, 20.0, 19.0, 19.0, 15.0, 10.0, 9.0, 8.0, 8.0, 4.0, 6.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.34375, -27.32470703125, -26.3056640625, -25.28662109375, -24.267578125, -23.24853515625, -22.2294921875, -21.21044921875, -20.19140625, -19.17236328125, -18.1533203125, -17.13427734375, -16.115234375, -15.09619140625, -14.0771484375, -13.05810546875, -12.0390625, -11.02001953125, -10.0009765625, -8.98193359375, -7.962890625, -6.94384765625, -5.9248046875, -4.90576171875, -3.88671875, -2.86767578125, -1.8486328125, -0.82958984375, 0.189453125, 1.20849609375, 2.2275390625, 3.24658203125, 4.265625, 5.28466796875, 6.3037109375, 7.32275390625, 8.341796875, 9.36083984375, 10.3798828125, 11.39892578125, 12.41796875, 13.43701171875, 14.4560546875, 15.47509765625, 16.494140625, 17.51318359375, 18.5322265625, 19.55126953125, 20.5703125, 21.58935546875, 22.6083984375, 23.62744140625, 24.646484375, 25.66552734375, 26.6845703125, 27.70361328125, 28.72265625, 29.74169921875, 30.7607421875, 31.77978515625, 32.798828125, 33.81787109375, 34.8369140625, 35.85595703125, 36.875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 8.0, 4.0, 6.0, 13.0, 16.0, 26.0, 32.0, 67.0, 100.0, 135.0, 181.0, 317.0, 493.0, 743.0, 1230.0, 2017.0, 3449.0, 6011.0, 11253.0, 21073.0, 39988.0, 73380.0, 124816.0, 181345.0, 199355.0, 158602.0, 100442.0, 56771.0, 30289.0, 15979.0, 8510.0, 4797.0, 2714.0, 1624.0, 989.0, 633.0, 414.0, 264.0, 153.0, 122.0, 65.0, 55.0, 31.0, 22.0, 12.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.15625, -45.5458984375, -43.935546875, -42.3251953125, -40.71484375, -39.1044921875, -37.494140625, -35.8837890625, -34.2734375, -32.6630859375, -31.052734375, -29.4423828125, -27.83203125, -26.2216796875, -24.611328125, -23.0009765625, -21.390625, -19.7802734375, -18.169921875, -16.5595703125, -14.94921875, -13.3388671875, -11.728515625, -10.1181640625, -8.5078125, -6.8974609375, -5.287109375, -3.6767578125, -2.06640625, -0.4560546875, 1.154296875, 2.7646484375, 4.375, 5.9853515625, 7.595703125, 9.2060546875, 10.81640625, 12.4267578125, 14.037109375, 15.6474609375, 17.2578125, 18.8681640625, 20.478515625, 22.0888671875, 23.69921875, 25.3095703125, 26.919921875, 28.5302734375, 30.140625, 31.7509765625, 33.361328125, 34.9716796875, 36.58203125, 38.1923828125, 39.802734375, 41.4130859375, 43.0234375, 44.6337890625, 46.244140625, 47.8544921875, 49.46484375, 51.0751953125, 52.685546875, 54.2958984375, 55.90625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 15.0, 14.0, 13.0, 22.0, 18.0, 20.0, 20.0, 22.0, 35.0, 28.0, 27.0, 23.0, 44.0, 28.0, 53.0, 43.0, 50.0, 56.0, 41.0, 27.0, 32.0, 34.0, 30.0, 30.0, 30.0, 24.0, 21.0, 27.0, 21.0, 29.0, 24.0, 10.0, 20.0, 11.0, 6.0, 8.0, 9.0, 1.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0], "bins": [-21.09375, -20.48193359375, -19.8701171875, -19.25830078125, -18.646484375, -18.03466796875, -17.4228515625, -16.81103515625, -16.19921875, -15.58740234375, -14.9755859375, -14.36376953125, -13.751953125, -13.14013671875, -12.5283203125, -11.91650390625, -11.3046875, -10.69287109375, -10.0810546875, -9.46923828125, -8.857421875, -8.24560546875, -7.6337890625, -7.02197265625, -6.41015625, -5.79833984375, -5.1865234375, -4.57470703125, -3.962890625, -3.35107421875, -2.7392578125, -2.12744140625, -1.515625, -0.90380859375, -0.2919921875, 0.31982421875, 0.931640625, 1.54345703125, 2.1552734375, 2.76708984375, 3.37890625, 3.99072265625, 4.6025390625, 5.21435546875, 5.826171875, 6.43798828125, 7.0498046875, 7.66162109375, 8.2734375, 8.88525390625, 9.4970703125, 10.10888671875, 10.720703125, 11.33251953125, 11.9443359375, 12.55615234375, 13.16796875, 13.77978515625, 14.3916015625, 15.00341796875, 15.615234375, 16.22705078125, 16.8388671875, 17.45068359375, 18.0625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 3.0, 11.0, 14.0, 28.0, 34.0, 46.0, 60.0, 97.0, 143.0, 196.0, 276.0, 348.0, 539.0, 820.0, 1205.0, 1825.0, 2801.0, 4175.0, 6763.0, 10610.0, 17537.0, 29451.0, 50977.0, 90048.0, 153786.0, 207712.0, 185050.0, 118512.0, 67086.0, 38318.0, 22421.0, 13555.0, 8440.0, 5261.0, 3488.0, 2214.0, 1483.0, 1051.0, 680.0, 464.0, 288.0, 216.0, 163.0, 104.0, 77.0, 51.0, 47.0, 23.0, 17.0, 13.0, 3.0, 9.0, 5.0, 3.0, 4.0, 4.0], "bins": [-31.90625, -30.960693359375, -30.01513671875, -29.069580078125, -28.1240234375, -27.178466796875, -26.23291015625, -25.287353515625, -24.341796875, -23.396240234375, -22.45068359375, -21.505126953125, -20.5595703125, -19.614013671875, -18.66845703125, -17.722900390625, -16.77734375, -15.831787109375, -14.88623046875, -13.940673828125, -12.9951171875, -12.049560546875, -11.10400390625, -10.158447265625, -9.212890625, -8.267333984375, -7.32177734375, -6.376220703125, -5.4306640625, -4.485107421875, -3.53955078125, -2.593994140625, -1.6484375, -0.702880859375, 0.24267578125, 1.188232421875, 2.1337890625, 3.079345703125, 4.02490234375, 4.970458984375, 5.916015625, 6.861572265625, 7.80712890625, 8.752685546875, 9.6982421875, 10.643798828125, 11.58935546875, 12.534912109375, 13.48046875, 14.426025390625, 15.37158203125, 16.317138671875, 17.2626953125, 18.208251953125, 19.15380859375, 20.099365234375, 21.044921875, 21.990478515625, 22.93603515625, 23.881591796875, 24.8271484375, 25.772705078125, 26.71826171875, 27.663818359375, 28.609375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 8.0, 10.0, 11.0, 5.0, 14.0, 15.0, 23.0, 18.0, 28.0, 27.0, 34.0, 46.0, 68.0, 75.0, 67.0, 65.0, 79.0, 70.0, 58.0, 54.0, 42.0, 40.0, 28.0, 22.0, 11.0, 20.0, 15.0, 7.0, 9.0, 5.0, 3.0, 7.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00377655029296875, -0.003665328025817871, -0.003554105758666992, -0.0034428834915161133, -0.0033316612243652344, -0.0032204389572143555, -0.0031092166900634766, -0.0029979944229125977, -0.0028867721557617188, -0.00277554988861084, -0.002664327621459961, -0.002553105354309082, -0.002441883087158203, -0.0023306608200073242, -0.0022194385528564453, -0.0021082162857055664, -0.0019969940185546875, -0.0018857717514038086, -0.0017745494842529297, -0.0016633272171020508, -0.0015521049499511719, -0.001440882682800293, -0.001329660415649414, -0.0012184381484985352, -0.0011072158813476562, -0.0009959936141967773, -0.0008847713470458984, -0.0007735490798950195, -0.0006623268127441406, -0.0005511045455932617, -0.0004398822784423828, -0.0003286600112915039, -0.000217437744140625, -0.0001062154769897461, 5.0067901611328125e-06, 0.00011622905731201172, 0.00022745132446289062, 0.00033867359161376953, 0.00044989585876464844, 0.0005611181259155273, 0.0006723403930664062, 0.0007835626602172852, 0.0008947849273681641, 0.001006007194519043, 0.0011172294616699219, 0.0012284517288208008, 0.0013396739959716797, 0.0014508962631225586, 0.0015621185302734375, 0.0016733407974243164, 0.0017845630645751953, 0.0018957853317260742, 0.002007007598876953, 0.002118229866027832, 0.002229452133178711, 0.00234067440032959, 0.0024518966674804688, 0.0025631189346313477, 0.0026743412017822266, 0.0027855634689331055, 0.0028967857360839844, 0.0030080080032348633, 0.003119230270385742, 0.003230452537536621, 0.0033416748046875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 9.0, 10.0, 10.0, 16.0, 17.0, 34.0, 46.0, 82.0, 139.0, 190.0, 244.0, 392.0, 676.0, 1056.0, 1613.0, 2706.0, 4370.0, 7440.0, 13185.0, 23801.0, 44707.0, 88091.0, 167820.0, 248088.0, 203895.0, 112920.0, 57675.0, 30009.0, 16175.0, 9166.0, 5186.0, 3324.0, 2029.0, 1224.0, 746.0, 537.0, 306.0, 220.0, 147.0, 89.0, 56.0, 38.0, 29.0, 14.0, 9.0, 7.0, 9.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-37.21875, -36.080078125, -34.94140625, -33.802734375, -32.6640625, -31.525390625, -30.38671875, -29.248046875, -28.109375, -26.970703125, -25.83203125, -24.693359375, -23.5546875, -22.416015625, -21.27734375, -20.138671875, -19.0, -17.861328125, -16.72265625, -15.583984375, -14.4453125, -13.306640625, -12.16796875, -11.029296875, -9.890625, -8.751953125, -7.61328125, -6.474609375, -5.3359375, -4.197265625, -3.05859375, -1.919921875, -0.78125, 0.357421875, 1.49609375, 2.634765625, 3.7734375, 4.912109375, 6.05078125, 7.189453125, 8.328125, 9.466796875, 10.60546875, 11.744140625, 12.8828125, 14.021484375, 15.16015625, 16.298828125, 17.4375, 18.576171875, 19.71484375, 20.853515625, 21.9921875, 23.130859375, 24.26953125, 25.408203125, 26.546875, 27.685546875, 28.82421875, 29.962890625, 31.1015625, 32.240234375, 33.37890625, 34.517578125, 35.65625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 15.0, 8.0, 3.0, 20.0, 17.0, 22.0, 26.0, 34.0, 45.0, 61.0, 62.0, 56.0, 71.0, 67.0, 82.0, 70.0, 58.0, 58.0, 47.0, 42.0, 26.0, 28.0, 19.0, 15.0, 9.0, 6.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.7578125, -11.4296875, -11.1015625, -10.7734375, -10.4453125, -10.1171875, -9.7890625, -9.4609375, -9.1328125, -8.8046875, -8.4765625, -8.1484375, -7.8203125, -7.4921875, -7.1640625, -6.8359375, -6.5078125, -6.1796875, -5.8515625, -5.5234375, -5.1953125, -4.8671875, -4.5390625, -4.2109375, -3.8828125, -3.5546875, -3.2265625, -2.8984375, -2.5703125, -2.2421875, -1.9140625, -1.5859375, -1.2578125, -0.9296875, -0.6015625, -0.2734375, 0.0546875, 0.3828125, 0.7109375, 1.0390625, 1.3671875, 1.6953125, 2.0234375, 2.3515625, 2.6796875, 3.0078125, 3.3359375, 3.6640625, 3.9921875, 4.3203125, 4.6484375, 4.9765625, 5.3046875, 5.6328125, 5.9609375, 6.2890625, 6.6171875, 6.9453125, 7.2734375, 7.6015625, 7.9296875, 8.2578125, 8.5859375, 8.9140625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 6.0, 6.0, 13.0, 7.0, 13.0, 11.0, 22.0, 17.0, 24.0, 41.0, 39.0, 35.0, 62.0, 52.0, 73.0, 63.0, 58.0, 64.0, 67.0, 63.0, 41.0, 36.0, 30.0, 29.0, 27.0, 16.0, 12.0, 16.0, 10.0, 11.0, 7.0, 5.0, 3.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.947601318359375, -56.02047348022461, -54.09334945678711, -52.166221618652344, -50.239097595214844, -48.31196975708008, -46.38484191894531, -44.45771789550781, -42.53059005737305, -40.60346221923828, -38.67633819580078, -36.749210357666016, -34.82208251953125, -32.89495849609375, -30.967830657958984, -29.04070472717285, -27.11357879638672, -25.186452865600586, -23.259326934814453, -21.332199096679688, -19.405073165893555, -17.477947235107422, -15.550820350646973, -13.623693466186523, -11.69656753540039, -9.769441604614258, -7.842314720153809, -5.915188312530518, -3.9880619049072266, -2.0609359741210938, -0.13380908966064453, 1.7933177947998047, 3.7204437255859375, 5.6475701332092285, 7.5746965408325195, 9.501823425292969, 11.428949356079102, 13.356075286865234, 15.283202171325684, 17.210329055786133, 19.137454986572266, 21.0645809173584, 22.99170684814453, 24.918834686279297, 26.84596061706543, 28.773086547851562, 30.700214385986328, 32.627342224121094, 34.554466247558594, 36.48159408569336, 38.40871810913086, 40.335845947265625, 42.262969970703125, 44.19009780883789, 46.117225646972656, 48.044349670410156, 49.97147750854492, 51.89860534667969, 53.82572937011719, 55.75285720825195, 57.67998504638672, 59.60710906982422, 61.534236907958984, 63.46136474609375, 65.38848876953125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 13.0, 2.0, 13.0, 17.0, 19.0, 19.0, 18.0, 22.0, 23.0, 33.0, 25.0, 24.0, 33.0, 43.0, 38.0, 40.0, 45.0, 40.0, 46.0, 47.0, 28.0, 43.0, 33.0, 34.0, 32.0, 23.0, 41.0, 23.0, 14.0, 24.0, 21.0, 15.0, 22.0, 9.0, 6.0, 12.0, 14.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.10472297668457, -29.111766815185547, -28.118812561035156, -27.125856399536133, -26.13290023803711, -25.13994598388672, -24.146989822387695, -23.154033660888672, -22.16107940673828, -21.168123245239258, -20.175168991088867, -19.182212829589844, -18.18925666809082, -17.196300506591797, -16.203346252441406, -15.210390090942383, -14.21743392944336, -13.224478721618652, -12.231522560119629, -11.238567352294922, -10.245611190795898, -9.252655982971191, -8.259700775146484, -7.266745090484619, -6.273789405822754, -5.280833721160889, -4.287878036499023, -3.2949228286743164, -2.301967144012451, -1.309011459350586, -0.3160562515258789, 0.6768994331359863, 1.6698532104492188, 2.662808895111084, 3.65576434135437, 4.648719787597656, 5.6416754722595215, 6.634631156921387, 7.627586364746094, 8.620542526245117, 9.613497734069824, 10.606452941894531, 11.599409103393555, 12.592364311218262, 13.585319519042969, 14.578275680541992, 15.5712308883667, 16.564186096191406, 17.55714225769043, 18.550098419189453, 19.543052673339844, 20.536008834838867, 21.52896499633789, 22.52191925048828, 23.514875411987305, 24.507831573486328, 25.50078582763672, 26.493741989135742, 27.486696243286133, 28.479652404785156, 29.47260856628418, 30.465564727783203, 31.458518981933594, 32.451473236083984, 33.44443130493164]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 3.0, 20.0, 23.0, 27.0, 58.0, 85.0, 129.0, 191.0, 329.0, 503.0, 869.0, 1321.0, 2151.0, 3515.0, 5962.0, 10276.0, 18720.0, 36664.0, 77148.0, 180342.0, 468196.0, 1141569.0, 1271929.0, 580505.0, 218598.0, 89358.0, 40266.0, 19853.0, 10785.0, 5999.0, 3454.0, 2050.0, 1242.0, 803.0, 510.0, 302.0, 189.0, 123.0, 69.0, 56.0, 25.0, 20.0, 19.0, 12.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.1337890625, -73.517578125, -70.9013671875, -68.28515625, -65.6689453125, -63.052734375, -60.4365234375, -57.8203125, -55.2041015625, -52.587890625, -49.9716796875, -47.35546875, -44.7392578125, -42.123046875, -39.5068359375, -36.890625, -34.2744140625, -31.658203125, -29.0419921875, -26.42578125, -23.8095703125, -21.193359375, -18.5771484375, -15.9609375, -13.3447265625, -10.728515625, -8.1123046875, -5.49609375, -2.8798828125, -0.263671875, 2.3525390625, 4.96875, 7.5849609375, 10.201171875, 12.8173828125, 15.43359375, 18.0498046875, 20.666015625, 23.2822265625, 25.8984375, 28.5146484375, 31.130859375, 33.7470703125, 36.36328125, 38.9794921875, 41.595703125, 44.2119140625, 46.828125, 49.4443359375, 52.060546875, 54.6767578125, 57.29296875, 59.9091796875, 62.525390625, 65.1416015625, 67.7578125, 70.3740234375, 72.990234375, 75.6064453125, 78.22265625, 80.8388671875, 83.455078125, 86.0712890625, 88.6875]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 3.0, 13.0, 8.0, 10.0, 20.0, 26.0, 17.0, 17.0, 12.0, 25.0, 18.0, 24.0, 26.0, 40.0, 48.0, 30.0, 47.0, 53.0, 39.0, 53.0, 38.0, 42.0, 36.0, 42.0, 33.0, 31.0, 24.0, 30.0, 25.0, 27.0, 22.0, 26.0, 14.0, 13.0, 20.0, 8.0, 4.0, 10.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.0625, -30.9677734375, -29.873046875, -28.7783203125, -27.68359375, -26.5888671875, -25.494140625, -24.3994140625, -23.3046875, -22.2099609375, -21.115234375, -20.0205078125, -18.92578125, -17.8310546875, -16.736328125, -15.6416015625, -14.546875, -13.4521484375, -12.357421875, -11.2626953125, -10.16796875, -9.0732421875, -7.978515625, -6.8837890625, -5.7890625, -4.6943359375, -3.599609375, -2.5048828125, -1.41015625, -0.3154296875, 0.779296875, 1.8740234375, 2.96875, 4.0634765625, 5.158203125, 6.2529296875, 7.34765625, 8.4423828125, 9.537109375, 10.6318359375, 11.7265625, 12.8212890625, 13.916015625, 15.0107421875, 16.10546875, 17.2001953125, 18.294921875, 19.3896484375, 20.484375, 21.5791015625, 22.673828125, 23.7685546875, 24.86328125, 25.9580078125, 27.052734375, 28.1474609375, 29.2421875, 30.3369140625, 31.431640625, 32.5263671875, 33.62109375, 34.7158203125, 35.810546875, 36.9052734375, 38.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 13.0, 10.0, 17.0, 38.0, 46.0, 69.0, 101.0, 171.0, 237.0, 393.0, 510.0, 798.0, 1245.0, 1994.0, 3066.0, 5001.0, 8009.0, 13565.0, 22844.0, 40154.0, 73579.0, 142946.0, 295891.0, 642609.0, 1159845.0, 914642.0, 432861.0, 203383.0, 101333.0, 54046.0, 29846.0, 17434.0, 10139.0, 6481.0, 3918.0, 2494.0, 1590.0, 964.0, 647.0, 454.0, 306.0, 190.0, 117.0, 86.0, 73.0, 42.0, 32.0, 18.0, 15.0, 11.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-101.8125, -98.60546875, -95.3984375, -92.19140625, -88.984375, -85.77734375, -82.5703125, -79.36328125, -76.15625, -72.94921875, -69.7421875, -66.53515625, -63.328125, -60.12109375, -56.9140625, -53.70703125, -50.5, -47.29296875, -44.0859375, -40.87890625, -37.671875, -34.46484375, -31.2578125, -28.05078125, -24.84375, -21.63671875, -18.4296875, -15.22265625, -12.015625, -8.80859375, -5.6015625, -2.39453125, 0.8125, 4.01953125, 7.2265625, 10.43359375, 13.640625, 16.84765625, 20.0546875, 23.26171875, 26.46875, 29.67578125, 32.8828125, 36.08984375, 39.296875, 42.50390625, 45.7109375, 48.91796875, 52.125, 55.33203125, 58.5390625, 61.74609375, 64.953125, 68.16015625, 71.3671875, 74.57421875, 77.78125, 80.98828125, 84.1953125, 87.40234375, 90.609375, 93.81640625, 97.0234375, 100.23046875, 103.4375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 10.0, 16.0, 16.0, 13.0, 18.0, 32.0, 34.0, 36.0, 60.0, 66.0, 86.0, 105.0, 115.0, 164.0, 164.0, 205.0, 240.0, 284.0, 261.0, 286.0, 292.0, 246.0, 211.0, 192.0, 165.0, 138.0, 111.0, 98.0, 87.0, 59.0, 46.0, 47.0, 35.0, 23.0, 21.0, 19.0, 14.0, 4.0, 9.0, 4.0, 8.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-25.84375, -25.043701171875, -24.24365234375, -23.443603515625, -22.6435546875, -21.843505859375, -21.04345703125, -20.243408203125, -19.443359375, -18.643310546875, -17.84326171875, -17.043212890625, -16.2431640625, -15.443115234375, -14.64306640625, -13.843017578125, -13.04296875, -12.242919921875, -11.44287109375, -10.642822265625, -9.8427734375, -9.042724609375, -8.24267578125, -7.442626953125, -6.642578125, -5.842529296875, -5.04248046875, -4.242431640625, -3.4423828125, -2.642333984375, -1.84228515625, -1.042236328125, -0.2421875, 0.557861328125, 1.35791015625, 2.157958984375, 2.9580078125, 3.758056640625, 4.55810546875, 5.358154296875, 6.158203125, 6.958251953125, 7.75830078125, 8.558349609375, 9.3583984375, 10.158447265625, 10.95849609375, 11.758544921875, 12.55859375, 13.358642578125, 14.15869140625, 14.958740234375, 15.7587890625, 16.558837890625, 17.35888671875, 18.158935546875, 18.958984375, 19.759033203125, 20.55908203125, 21.359130859375, 22.1591796875, 22.959228515625, 23.75927734375, 24.559326171875, 25.359375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 11.0, 13.0, 9.0, 14.0, 15.0, 24.0, 32.0, 39.0, 36.0, 50.0, 69.0, 72.0, 90.0, 69.0, 75.0, 64.0, 50.0, 61.0, 42.0, 38.0, 21.0, 24.0, 15.0, 8.0, 12.0, 7.0, 6.0, 3.0, 8.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-124.36991882324219, -120.25525665283203, -116.14058685302734, -112.02592468261719, -107.91126251220703, -103.79660034179688, -99.68193054199219, -95.56726837158203, -91.45260620117188, -87.33794403076172, -83.22327423095703, -79.10861206054688, -74.99394989013672, -70.87928771972656, -66.76461791992188, -62.64995574951172, -58.53528594970703, -54.42061996459961, -50.30595779418945, -46.19129180908203, -42.076629638671875, -37.96196365356445, -33.84729766845703, -29.732633590698242, -25.617969512939453, -21.503305435180664, -17.388641357421875, -13.273975372314453, -9.159311294555664, -5.044647216796875, -0.9299812316894531, 3.184682846069336, 7.299346923828125, 11.414011001586914, 15.52867603302002, 19.643341064453125, 23.758005142211914, 27.872669219970703, 31.987335205078125, 36.10199737548828, 40.2166633605957, 44.331329345703125, 48.44599151611328, 52.5606575012207, 56.675323486328125, 60.78998565673828, 64.90464782714844, 69.01931762695312, 73.13397979736328, 77.24864196777344, 81.36331176757812, 85.47797393798828, 89.59263610839844, 93.70730590820312, 97.82196807861328, 101.93663024902344, 106.05130004882812, 110.16596221923828, 114.28063201904297, 118.39529418945312, 122.50995635986328, 126.62461853027344, 130.73928833007812, 134.8539581298828, 138.96861267089844]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 4.0, 6.0, 4.0, 9.0, 10.0, 10.0, 19.0, 18.0, 9.0, 17.0, 22.0, 26.0, 26.0, 23.0, 26.0, 32.0, 46.0, 28.0, 41.0, 56.0, 37.0, 46.0, 40.0, 37.0, 57.0, 41.0, 49.0, 41.0, 28.0, 22.0, 32.0, 22.0, 18.0, 19.0, 11.0, 12.0, 10.0, 7.0, 7.0, 4.0, 1.0, 11.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-58.71641540527344, -56.88956069946289, -55.06270980834961, -53.23585510253906, -51.409000396728516, -49.582149505615234, -47.75529479980469, -45.928443908691406, -44.10158920288086, -42.27473449707031, -40.44788360595703, -38.621028900146484, -36.79417419433594, -34.967323303222656, -33.14046859741211, -31.313615798950195, -29.48676109313965, -27.659908294677734, -25.833053588867188, -24.006200790405273, -22.17934799194336, -20.352493286132812, -18.5256404876709, -16.698787689208984, -14.871933937072754, -13.045080184936523, -11.21822738647461, -9.391373634338379, -7.564520359039307, -5.737667083740234, -3.910813331604004, -2.08396053314209, -0.2571067810058594, 1.5697466135025024, 3.3966000080108643, 5.223453521728516, 7.050306797027588, 8.87716007232666, 10.70401382446289, 12.530866622924805, 14.357720375061035, 16.184574127197266, 18.01142692565918, 19.838279724121094, 21.66513442993164, 23.491987228393555, 25.31884002685547, 27.145694732666016, 28.97254753112793, 30.799400329589844, 32.62625503540039, 34.45310974121094, 36.27996063232422, 38.106815338134766, 39.93367004394531, 41.760520935058594, 43.58737564086914, 45.41423034667969, 47.24108123779297, 49.067935943603516, 50.89479064941406, 52.721641540527344, 54.54849624633789, 56.37535095214844, 58.20220184326172]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 7.0, 5.0, 6.0, 14.0, 19.0, 25.0, 50.0, 58.0, 80.0, 109.0, 178.0, 296.0, 432.0, 691.0, 1128.0, 1809.0, 3131.0, 5604.0, 10275.0, 20127.0, 41831.0, 90331.0, 186709.0, 282818.0, 205411.0, 101782.0, 47041.0, 22471.0, 11306.0, 6078.0, 3434.0, 1991.0, 1214.0, 736.0, 436.0, 304.0, 189.0, 134.0, 103.0, 58.0, 38.0, 35.0, 21.0, 11.0, 12.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.125, -62.9951171875, -60.865234375, -58.7353515625, -56.60546875, -54.4755859375, -52.345703125, -50.2158203125, -48.0859375, -45.9560546875, -43.826171875, -41.6962890625, -39.56640625, -37.4365234375, -35.306640625, -33.1767578125, -31.046875, -28.9169921875, -26.787109375, -24.6572265625, -22.52734375, -20.3974609375, -18.267578125, -16.1376953125, -14.0078125, -11.8779296875, -9.748046875, -7.6181640625, -5.48828125, -3.3583984375, -1.228515625, 0.9013671875, 3.03125, 5.1611328125, 7.291015625, 9.4208984375, 11.55078125, 13.6806640625, 15.810546875, 17.9404296875, 20.0703125, 22.2001953125, 24.330078125, 26.4599609375, 28.58984375, 30.7197265625, 32.849609375, 34.9794921875, 37.109375, 39.2392578125, 41.369140625, 43.4990234375, 45.62890625, 47.7587890625, 49.888671875, 52.0185546875, 54.1484375, 56.2783203125, 58.408203125, 60.5380859375, 62.66796875, 64.7978515625, 66.927734375, 69.0576171875, 71.1875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 9.0, 7.0, 10.0, 8.0, 17.0, 28.0, 24.0, 26.0, 30.0, 38.0, 34.0, 45.0, 51.0, 47.0, 66.0, 57.0, 63.0, 68.0, 59.0, 48.0, 45.0, 45.0, 26.0, 33.0, 24.0, 20.0, 14.0, 8.0, 10.0, 9.0, 10.0, 1.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.5, -95.8134765625, -93.126953125, -90.4404296875, -87.75390625, -85.0673828125, -82.380859375, -79.6943359375, -77.0078125, -74.3212890625, -71.634765625, -68.9482421875, -66.26171875, -63.5751953125, -60.888671875, -58.2021484375, -55.515625, -52.8291015625, -50.142578125, -47.4560546875, -44.76953125, -42.0830078125, -39.396484375, -36.7099609375, -34.0234375, -31.3369140625, -28.650390625, -25.9638671875, -23.27734375, -20.5908203125, -17.904296875, -15.2177734375, -12.53125, -9.8447265625, -7.158203125, -4.4716796875, -1.78515625, 0.9013671875, 3.587890625, 6.2744140625, 8.9609375, 11.6474609375, 14.333984375, 17.0205078125, 19.70703125, 22.3935546875, 25.080078125, 27.7666015625, 30.453125, 33.1396484375, 35.826171875, 38.5126953125, 41.19921875, 43.8857421875, 46.572265625, 49.2587890625, 51.9453125, 54.6318359375, 57.318359375, 60.0048828125, 62.69140625, 65.3779296875, 68.064453125, 70.7509765625, 73.4375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 12.0, 15.0, 24.0, 31.0, 39.0, 52.0, 77.0, 107.0, 138.0, 233.0, 312.0, 454.0, 770.0, 1180.0, 1971.0, 3343.0, 6218.0, 12603.0, 26088.0, 58466.0, 138174.0, 281084.0, 275252.0, 133256.0, 56860.0, 25154.0, 11828.0, 6141.0, 3378.0, 1924.0, 1179.0, 698.0, 473.0, 318.0, 208.0, 135.0, 98.0, 79.0, 44.0, 26.0, 31.0, 17.0, 16.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.75, -73.3046875, -70.859375, -68.4140625, -65.96875, -63.5234375, -61.078125, -58.6328125, -56.1875, -53.7421875, -51.296875, -48.8515625, -46.40625, -43.9609375, -41.515625, -39.0703125, -36.625, -34.1796875, -31.734375, -29.2890625, -26.84375, -24.3984375, -21.953125, -19.5078125, -17.0625, -14.6171875, -12.171875, -9.7265625, -7.28125, -4.8359375, -2.390625, 0.0546875, 2.5, 4.9453125, 7.390625, 9.8359375, 12.28125, 14.7265625, 17.171875, 19.6171875, 22.0625, 24.5078125, 26.953125, 29.3984375, 31.84375, 34.2890625, 36.734375, 39.1796875, 41.625, 44.0703125, 46.515625, 48.9609375, 51.40625, 53.8515625, 56.296875, 58.7421875, 61.1875, 63.6328125, 66.078125, 68.5234375, 70.96875, 73.4140625, 75.859375, 78.3046875, 80.75]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 5.0, 10.0, 6.0, 4.0, 11.0, 14.0, 9.0, 14.0, 16.0, 22.0, 15.0, 23.0, 36.0, 25.0, 52.0, 38.0, 24.0, 33.0, 51.0, 34.0, 40.0, 32.0, 45.0, 33.0, 41.0, 54.0, 29.0, 33.0, 31.0, 31.0, 31.0, 23.0, 24.0, 17.0, 15.0, 8.0, 17.0, 9.0, 10.0, 12.0, 9.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.4375, -33.30029296875, -32.1630859375, -31.02587890625, -29.888671875, -28.75146484375, -27.6142578125, -26.47705078125, -25.33984375, -24.20263671875, -23.0654296875, -21.92822265625, -20.791015625, -19.65380859375, -18.5166015625, -17.37939453125, -16.2421875, -15.10498046875, -13.9677734375, -12.83056640625, -11.693359375, -10.55615234375, -9.4189453125, -8.28173828125, -7.14453125, -6.00732421875, -4.8701171875, -3.73291015625, -2.595703125, -1.45849609375, -0.3212890625, 0.81591796875, 1.953125, 3.09033203125, 4.2275390625, 5.36474609375, 6.501953125, 7.63916015625, 8.7763671875, 9.91357421875, 11.05078125, 12.18798828125, 13.3251953125, 14.46240234375, 15.599609375, 16.73681640625, 17.8740234375, 19.01123046875, 20.1484375, 21.28564453125, 22.4228515625, 23.56005859375, 24.697265625, 25.83447265625, 26.9716796875, 28.10888671875, 29.24609375, 30.38330078125, 31.5205078125, 32.65771484375, 33.794921875, 34.93212890625, 36.0693359375, 37.20654296875, 38.34375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 12.0, 12.0, 20.0, 25.0, 32.0, 43.0, 77.0, 101.0, 149.0, 211.0, 323.0, 452.0, 656.0, 1016.0, 1620.0, 2651.0, 4230.0, 7071.0, 12397.0, 21790.0, 40528.0, 76765.0, 148799.0, 252792.0, 220259.0, 118589.0, 61340.0, 32617.0, 17874.0, 10146.0, 5919.0, 3599.0, 2246.0, 1446.0, 848.0, 601.0, 401.0, 294.0, 196.0, 125.0, 84.0, 63.0, 50.0, 29.0, 25.0, 10.0, 8.0, 11.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-23.15625, -22.4287109375, -21.701171875, -20.9736328125, -20.24609375, -19.5185546875, -18.791015625, -18.0634765625, -17.3359375, -16.6083984375, -15.880859375, -15.1533203125, -14.42578125, -13.6982421875, -12.970703125, -12.2431640625, -11.515625, -10.7880859375, -10.060546875, -9.3330078125, -8.60546875, -7.8779296875, -7.150390625, -6.4228515625, -5.6953125, -4.9677734375, -4.240234375, -3.5126953125, -2.78515625, -2.0576171875, -1.330078125, -0.6025390625, 0.125, 0.8525390625, 1.580078125, 2.3076171875, 3.03515625, 3.7626953125, 4.490234375, 5.2177734375, 5.9453125, 6.6728515625, 7.400390625, 8.1279296875, 8.85546875, 9.5830078125, 10.310546875, 11.0380859375, 11.765625, 12.4931640625, 13.220703125, 13.9482421875, 14.67578125, 15.4033203125, 16.130859375, 16.8583984375, 17.5859375, 18.3134765625, 19.041015625, 19.7685546875, 20.49609375, 21.2236328125, 21.951171875, 22.6787109375, 23.40625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 1.0, 4.0, 3.0, 3.0, 8.0, 4.0, 13.0, 16.0, 21.0, 24.0, 25.0, 27.0, 46.0, 65.0, 68.0, 86.0, 92.0, 69.0, 74.0, 67.0, 46.0, 53.0, 30.0, 30.0, 25.0, 17.0, 18.0, 15.0, 10.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0020923614501953125, -0.002036452293395996, -0.0019805431365966797, -0.0019246339797973633, -0.0018687248229980469, -0.0018128156661987305, -0.001756906509399414, -0.0017009973526000977, -0.0016450881958007812, -0.0015891790390014648, -0.0015332698822021484, -0.001477360725402832, -0.0014214515686035156, -0.0013655424118041992, -0.0013096332550048828, -0.0012537240982055664, -0.00119781494140625, -0.0011419057846069336, -0.0010859966278076172, -0.0010300874710083008, -0.0009741783142089844, -0.000918269157409668, -0.0008623600006103516, -0.0008064508438110352, -0.0007505416870117188, -0.0006946325302124023, -0.0006387233734130859, -0.0005828142166137695, -0.0005269050598144531, -0.0004709959030151367, -0.0004150867462158203, -0.0003591775894165039, -0.0003032684326171875, -0.0002473592758178711, -0.0001914501190185547, -0.00013554096221923828, -7.963180541992188e-05, -2.372264862060547e-05, 3.218650817871094e-05, 8.809566497802734e-05, 0.00014400482177734375, 0.00019991397857666016, 0.00025582313537597656, 0.00031173229217529297, 0.0003676414489746094, 0.0004235506057739258, 0.0004794597625732422, 0.0005353689193725586, 0.000591278076171875, 0.0006471872329711914, 0.0007030963897705078, 0.0007590055465698242, 0.0008149147033691406, 0.000870823860168457, 0.0009267330169677734, 0.0009826421737670898, 0.0010385513305664062, 0.0010944604873657227, 0.001150369644165039, 0.0012062788009643555, 0.0012621879577636719, 0.0013180971145629883, 0.0013740062713623047, 0.001429915428161621, 0.0014858245849609375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 11.0, 12.0, 13.0, 34.0, 30.0, 36.0, 58.0, 106.0, 112.0, 175.0, 252.0, 353.0, 488.0, 773.0, 1274.0, 2077.0, 3975.0, 7958.0, 18097.0, 44108.0, 108161.0, 244979.0, 316514.0, 172923.0, 71125.0, 29065.0, 12563.0, 5604.0, 2888.0, 1686.0, 981.0, 647.0, 430.0, 320.0, 194.0, 151.0, 105.0, 79.0, 55.0, 38.0, 29.0, 17.0, 20.0, 6.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.46875, -36.2705078125, -35.072265625, -33.8740234375, -32.67578125, -31.4775390625, -30.279296875, -29.0810546875, -27.8828125, -26.6845703125, -25.486328125, -24.2880859375, -23.08984375, -21.8916015625, -20.693359375, -19.4951171875, -18.296875, -17.0986328125, -15.900390625, -14.7021484375, -13.50390625, -12.3056640625, -11.107421875, -9.9091796875, -8.7109375, -7.5126953125, -6.314453125, -5.1162109375, -3.91796875, -2.7197265625, -1.521484375, -0.3232421875, 0.875, 2.0732421875, 3.271484375, 4.4697265625, 5.66796875, 6.8662109375, 8.064453125, 9.2626953125, 10.4609375, 11.6591796875, 12.857421875, 14.0556640625, 15.25390625, 16.4521484375, 17.650390625, 18.8486328125, 20.046875, 21.2451171875, 22.443359375, 23.6416015625, 24.83984375, 26.0380859375, 27.236328125, 28.4345703125, 29.6328125, 30.8310546875, 32.029296875, 33.2275390625, 34.42578125, 35.6240234375, 36.822265625, 38.0205078125, 39.21875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 12.0, 18.0, 18.0, 22.0, 15.0, 48.0, 36.0, 39.0, 51.0, 52.0, 53.0, 55.0, 59.0, 76.0, 56.0, 52.0, 56.0, 45.0, 37.0, 36.0, 26.0, 20.0, 8.0, 14.0, 12.0, 8.0, 6.0, 9.0, 9.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.12109375, -6.9097900390625, -6.698486328125, -6.4871826171875, -6.27587890625, -6.0645751953125, -5.853271484375, -5.6419677734375, -5.4306640625, -5.2193603515625, -5.008056640625, -4.7967529296875, -4.58544921875, -4.3741455078125, -4.162841796875, -3.9515380859375, -3.740234375, -3.5289306640625, -3.317626953125, -3.1063232421875, -2.89501953125, -2.6837158203125, -2.472412109375, -2.2611083984375, -2.0498046875, -1.8385009765625, -1.627197265625, -1.4158935546875, -1.20458984375, -0.9932861328125, -0.781982421875, -0.5706787109375, -0.359375, -0.1480712890625, 0.063232421875, 0.2745361328125, 0.48583984375, 0.6971435546875, 0.908447265625, 1.1197509765625, 1.3310546875, 1.5423583984375, 1.753662109375, 1.9649658203125, 2.17626953125, 2.3875732421875, 2.598876953125, 2.8101806640625, 3.021484375, 3.2327880859375, 3.444091796875, 3.6553955078125, 3.86669921875, 4.0780029296875, 4.289306640625, 4.5006103515625, 4.7119140625, 4.9232177734375, 5.134521484375, 5.3458251953125, 5.55712890625, 5.7684326171875, 5.979736328125, 6.1910400390625, 6.40234375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 12.0, 8.0, 10.0, 12.0, 20.0, 18.0, 34.0, 34.0, 46.0, 51.0, 53.0, 83.0, 82.0, 73.0, 78.0, 66.0, 59.0, 51.0, 40.0, 38.0, 21.0, 26.0, 15.0, 10.0, 9.0, 9.0, 6.0, 7.0, 4.0, 2.0, 6.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-134.5395050048828, -130.36776733398438, -126.1960220336914, -122.02428436279297, -117.85254669189453, -113.68080139160156, -109.50906372070312, -105.33732604980469, -101.16558837890625, -96.99385070800781, -92.82210540771484, -88.6503677368164, -84.47863006591797, -80.306884765625, -76.13514709472656, -71.96340942382812, -67.79166412353516, -63.61992263793945, -59.448184967041016, -55.27644348144531, -51.104705810546875, -46.93296432495117, -42.76122283935547, -38.58948516845703, -34.41774368286133, -30.246004104614258, -26.074264526367188, -21.902523040771484, -17.730783462524414, -13.559043884277344, -9.38730239868164, -5.21556282043457, -1.0438232421875, 3.1279168128967285, 7.299656867980957, 11.471397399902344, 15.643136978149414, 19.814876556396484, 23.986618041992188, 28.158357620239258, 32.33009719848633, 36.50183868408203, 40.67357635498047, 44.84531784057617, 49.017059326171875, 53.18879699707031, 57.360538482666016, 61.53227996826172, 65.70401763916016, 69.8757553100586, 74.04750061035156, 78.21923828125, 82.39097595214844, 86.56271362304688, 90.73445892333984, 94.90619659423828, 99.07794189453125, 103.24967956542969, 107.42142486572266, 111.5931625366211, 115.76490020751953, 119.9366455078125, 124.10838317871094, 128.28012084960938, 132.4518585205078]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 7.0, 4.0, 6.0, 8.0, 8.0, 8.0, 9.0, 23.0, 15.0, 13.0, 16.0, 21.0, 28.0, 23.0, 22.0, 31.0, 35.0, 41.0, 37.0, 48.0, 41.0, 43.0, 41.0, 44.0, 48.0, 48.0, 45.0, 39.0, 41.0, 24.0, 33.0, 29.0, 14.0, 20.0, 19.0, 10.0, 10.0, 10.0, 7.0, 5.0, 4.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-59.4119987487793, -57.544837951660156, -55.677677154541016, -53.810516357421875, -51.943355560302734, -50.076194763183594, -48.20903396606445, -46.34187316894531, -44.47471237182617, -42.60755157470703, -40.74039077758789, -38.87322998046875, -37.00606918334961, -35.13890838623047, -33.27174758911133, -31.404586791992188, -29.537424087524414, -27.670263290405273, -25.803102493286133, -23.935941696166992, -22.06878089904785, -20.201618194580078, -18.334457397460938, -16.467296600341797, -14.600136756896973, -12.732975959777832, -10.865815162658691, -8.998653411865234, -7.131493091583252, -5.264331817626953, -3.3971710205078125, -1.5300102233886719, 0.33715057373046875, 2.2043113708496094, 4.07147216796875, 5.938633441925049, 7.8057942390441895, 9.672955513000488, 11.540116310119629, 13.40727710723877, 15.27443790435791, 17.141599655151367, 19.008760452270508, 20.87592124938965, 22.74308204650879, 24.61024284362793, 26.47740364074707, 28.34456443786621, 30.21172523498535, 32.078887939453125, 33.946048736572266, 35.813209533691406, 37.68037033081055, 39.54753112792969, 41.41469192504883, 43.28185272216797, 45.14901351928711, 47.01617431640625, 48.88333511352539, 50.75049591064453, 52.61765670776367, 54.48481750488281, 56.35197830200195, 58.219139099121094, 60.086299896240234]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 18.0, 38.0, 51.0, 64.0, 90.0, 129.0, 191.0, 254.0, 381.0, 548.0, 873.0, 1263.0, 1878.0, 2792.0, 4518.0, 7025.0, 11092.0, 18232.0, 30394.0, 50629.0, 84402.0, 133408.0, 178032.0, 177311.0, 132835.0, 83947.0, 49866.0, 29517.0, 17854.0, 11105.0, 6736.0, 4478.0, 2852.0, 1885.0, 1231.0, 811.0, 580.0, 354.0, 277.0, 185.0, 119.0, 87.0, 67.0, 46.0, 25.0, 26.0, 15.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-81.4375, -78.96875, -76.5, -74.03125, -71.5625, -69.09375, -66.625, -64.15625, -61.6875, -59.21875, -56.75, -54.28125, -51.8125, -49.34375, -46.875, -44.40625, -41.9375, -39.46875, -37.0, -34.53125, -32.0625, -29.59375, -27.125, -24.65625, -22.1875, -19.71875, -17.25, -14.78125, -12.3125, -9.84375, -7.375, -4.90625, -2.4375, 0.03125, 2.5, 4.96875, 7.4375, 9.90625, 12.375, 14.84375, 17.3125, 19.78125, 22.25, 24.71875, 27.1875, 29.65625, 32.125, 34.59375, 37.0625, 39.53125, 42.0, 44.46875, 46.9375, 49.40625, 51.875, 54.34375, 56.8125, 59.28125, 61.75, 64.21875, 66.6875, 69.15625, 71.625, 74.09375, 76.5625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 4.0, 11.0, 9.0, 11.0, 12.0, 16.0, 23.0, 26.0, 27.0, 31.0, 38.0, 44.0, 45.0, 63.0, 54.0, 60.0, 49.0, 53.0, 55.0, 62.0, 45.0, 47.0, 35.0, 32.0, 29.0, 29.0, 20.0, 12.0, 8.0, 11.0, 7.0, 5.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.1875, -69.5283203125, -66.869140625, -64.2099609375, -61.55078125, -58.8916015625, -56.232421875, -53.5732421875, -50.9140625, -48.2548828125, -45.595703125, -42.9365234375, -40.27734375, -37.6181640625, -34.958984375, -32.2998046875, -29.640625, -26.9814453125, -24.322265625, -21.6630859375, -19.00390625, -16.3447265625, -13.685546875, -11.0263671875, -8.3671875, -5.7080078125, -3.048828125, -0.3896484375, 2.26953125, 4.9287109375, 7.587890625, 10.2470703125, 12.90625, 15.5654296875, 18.224609375, 20.8837890625, 23.54296875, 26.2021484375, 28.861328125, 31.5205078125, 34.1796875, 36.8388671875, 39.498046875, 42.1572265625, 44.81640625, 47.4755859375, 50.134765625, 52.7939453125, 55.453125, 58.1123046875, 60.771484375, 63.4306640625, 66.08984375, 68.7490234375, 71.408203125, 74.0673828125, 76.7265625, 79.3857421875, 82.044921875, 84.7041015625, 87.36328125, 90.0224609375, 92.681640625, 95.3408203125, 98.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 8.0, 10.0, 15.0, 17.0, 22.0, 38.0, 50.0, 64.0, 112.0, 136.0, 204.0, 325.0, 420.0, 667.0, 921.0, 1453.0, 2214.0, 3249.0, 5256.0, 8604.0, 14059.0, 24345.0, 43534.0, 77663.0, 137055.0, 204478.0, 204183.0, 136396.0, 77702.0, 43464.0, 24044.0, 14167.0, 8399.0, 5175.0, 3401.0, 2143.0, 1449.0, 1013.0, 669.0, 451.0, 282.0, 207.0, 149.0, 102.0, 89.0, 48.0, 25.0, 28.0, 17.0, 8.0, 9.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0], "bins": [-138.5, -134.302734375, -130.10546875, -125.908203125, -121.7109375, -117.513671875, -113.31640625, -109.119140625, -104.921875, -100.724609375, -96.52734375, -92.330078125, -88.1328125, -83.935546875, -79.73828125, -75.541015625, -71.34375, -67.146484375, -62.94921875, -58.751953125, -54.5546875, -50.357421875, -46.16015625, -41.962890625, -37.765625, -33.568359375, -29.37109375, -25.173828125, -20.9765625, -16.779296875, -12.58203125, -8.384765625, -4.1875, 0.009765625, 4.20703125, 8.404296875, 12.6015625, 16.798828125, 20.99609375, 25.193359375, 29.390625, 33.587890625, 37.78515625, 41.982421875, 46.1796875, 50.376953125, 54.57421875, 58.771484375, 62.96875, 67.166015625, 71.36328125, 75.560546875, 79.7578125, 83.955078125, 88.15234375, 92.349609375, 96.546875, 100.744140625, 104.94140625, 109.138671875, 113.3359375, 117.533203125, 121.73046875, 125.927734375, 130.125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 5.0, 7.0, 7.0, 15.0, 6.0, 13.0, 12.0, 25.0, 27.0, 32.0, 29.0, 40.0, 30.0, 36.0, 49.0, 43.0, 43.0, 43.0, 53.0, 60.0, 46.0, 53.0, 39.0, 36.0, 39.0, 26.0, 35.0, 32.0, 20.0, 16.0, 18.0, 7.0, 11.0, 17.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0], "bins": [-65.4375, -63.68408203125, -61.9306640625, -60.17724609375, -58.423828125, -56.67041015625, -54.9169921875, -53.16357421875, -51.41015625, -49.65673828125, -47.9033203125, -46.14990234375, -44.396484375, -42.64306640625, -40.8896484375, -39.13623046875, -37.3828125, -35.62939453125, -33.8759765625, -32.12255859375, -30.369140625, -28.61572265625, -26.8623046875, -25.10888671875, -23.35546875, -21.60205078125, -19.8486328125, -18.09521484375, -16.341796875, -14.58837890625, -12.8349609375, -11.08154296875, -9.328125, -7.57470703125, -5.8212890625, -4.06787109375, -2.314453125, -0.56103515625, 1.1923828125, 2.94580078125, 4.69921875, 6.45263671875, 8.2060546875, 9.95947265625, 11.712890625, 13.46630859375, 15.2197265625, 16.97314453125, 18.7265625, 20.47998046875, 22.2333984375, 23.98681640625, 25.740234375, 27.49365234375, 29.2470703125, 31.00048828125, 32.75390625, 34.50732421875, 36.2607421875, 38.01416015625, 39.767578125, 41.52099609375, 43.2744140625, 45.02783203125, 46.78125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 12.0, 13.0, 9.0, 21.0, 51.0, 69.0, 87.0, 114.0, 182.0, 305.0, 488.0, 805.0, 1312.0, 2319.0, 3946.0, 7525.0, 14907.0, 30823.0, 65650.0, 141645.0, 260504.0, 255841.0, 137073.0, 63956.0, 29603.0, 14488.0, 7399.0, 3898.0, 2165.0, 1227.0, 755.0, 497.0, 269.0, 199.0, 117.0, 87.0, 68.0, 39.0, 23.0, 18.0, 14.0, 13.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-102.0, -98.998046875, -95.99609375, -92.994140625, -89.9921875, -86.990234375, -83.98828125, -80.986328125, -77.984375, -74.982421875, -71.98046875, -68.978515625, -65.9765625, -62.974609375, -59.97265625, -56.970703125, -53.96875, -50.966796875, -47.96484375, -44.962890625, -41.9609375, -38.958984375, -35.95703125, -32.955078125, -29.953125, -26.951171875, -23.94921875, -20.947265625, -17.9453125, -14.943359375, -11.94140625, -8.939453125, -5.9375, -2.935546875, 0.06640625, 3.068359375, 6.0703125, 9.072265625, 12.07421875, 15.076171875, 18.078125, 21.080078125, 24.08203125, 27.083984375, 30.0859375, 33.087890625, 36.08984375, 39.091796875, 42.09375, 45.095703125, 48.09765625, 51.099609375, 54.1015625, 57.103515625, 60.10546875, 63.107421875, 66.109375, 69.111328125, 72.11328125, 75.115234375, 78.1171875, 81.119140625, 84.12109375, 87.123046875, 90.125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 11.0, 8.0, 8.0, 15.0, 17.0, 22.0, 30.0, 42.0, 61.0, 102.0, 113.0, 123.0, 104.0, 97.0, 67.0, 64.0, 36.0, 24.0, 17.0, 13.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01335906982421875, -0.01296079158782959, -0.01256251335144043, -0.01216423511505127, -0.01176595687866211, -0.01136767864227295, -0.010969400405883789, -0.010571122169494629, -0.010172843933105469, -0.009774565696716309, -0.009376287460327148, -0.008978009223937988, -0.008579730987548828, -0.008181452751159668, -0.007783174514770508, -0.007384896278381348, -0.0069866180419921875, -0.006588339805603027, -0.006190061569213867, -0.005791783332824707, -0.005393505096435547, -0.004995226860046387, -0.0045969486236572266, -0.004198670387268066, -0.0038003921508789062, -0.003402113914489746, -0.003003835678100586, -0.0026055574417114258, -0.0022072792053222656, -0.0018090009689331055, -0.0014107227325439453, -0.0010124444961547852, -0.000614166259765625, -0.00021588802337646484, 0.0001823902130126953, 0.0005806684494018555, 0.0009789466857910156, 0.0013772249221801758, 0.001775503158569336, 0.002173781394958496, 0.0025720596313476562, 0.0029703378677368164, 0.0033686161041259766, 0.0037668943405151367, 0.004165172576904297, 0.004563450813293457, 0.004961729049682617, 0.005360007286071777, 0.0057582855224609375, 0.006156563758850098, 0.006554841995239258, 0.006953120231628418, 0.007351398468017578, 0.007749676704406738, 0.008147954940795898, 0.008546233177185059, 0.008944511413574219, 0.009342789649963379, 0.009741067886352539, 0.0101393461227417, 0.01053762435913086, 0.01093590259552002, 0.01133418083190918, 0.01173245906829834, 0.0121307373046875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 14.0, 18.0, 38.0, 50.0, 82.0, 106.0, 165.0, 236.0, 330.0, 525.0, 757.0, 1108.0, 1655.0, 2384.0, 3560.0, 5314.0, 8347.0, 12739.0, 20757.0, 33003.0, 54842.0, 91852.0, 147850.0, 196867.0, 173021.0, 112977.0, 68700.0, 41366.0, 25094.0, 15666.0, 9798.0, 6403.0, 4247.0, 2723.0, 1866.0, 1294.0, 867.0, 603.0, 409.0, 284.0, 193.0, 143.0, 95.0, 66.0, 56.0, 30.0, 28.0, 9.0, 5.0, 6.0, 4.0, 1.0, 3.0], "bins": [-64.1875, -62.33837890625, -60.4892578125, -58.64013671875, -56.791015625, -54.94189453125, -53.0927734375, -51.24365234375, -49.39453125, -47.54541015625, -45.6962890625, -43.84716796875, -41.998046875, -40.14892578125, -38.2998046875, -36.45068359375, -34.6015625, -32.75244140625, -30.9033203125, -29.05419921875, -27.205078125, -25.35595703125, -23.5068359375, -21.65771484375, -19.80859375, -17.95947265625, -16.1103515625, -14.26123046875, -12.412109375, -10.56298828125, -8.7138671875, -6.86474609375, -5.015625, -3.16650390625, -1.3173828125, 0.53173828125, 2.380859375, 4.22998046875, 6.0791015625, 7.92822265625, 9.77734375, 11.62646484375, 13.4755859375, 15.32470703125, 17.173828125, 19.02294921875, 20.8720703125, 22.72119140625, 24.5703125, 26.41943359375, 28.2685546875, 30.11767578125, 31.966796875, 33.81591796875, 35.6650390625, 37.51416015625, 39.36328125, 41.21240234375, 43.0615234375, 44.91064453125, 46.759765625, 48.60888671875, 50.4580078125, 52.30712890625, 54.15625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 8.0, 11.0, 9.0, 20.0, 22.0, 22.0, 18.0, 22.0, 29.0, 30.0, 29.0, 38.0, 45.0, 35.0, 52.0, 49.0, 38.0, 47.0, 49.0, 42.0, 31.0, 38.0, 29.0, 42.0, 33.0, 29.0, 21.0, 20.0, 21.0, 16.0, 13.0, 8.0, 10.0, 8.0, 6.0, 8.0, 6.0, 6.0, 7.0, 3.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.875, -13.407470703125, -12.93994140625, -12.472412109375, -12.0048828125, -11.537353515625, -11.06982421875, -10.602294921875, -10.134765625, -9.667236328125, -9.19970703125, -8.732177734375, -8.2646484375, -7.797119140625, -7.32958984375, -6.862060546875, -6.39453125, -5.927001953125, -5.45947265625, -4.991943359375, -4.5244140625, -4.056884765625, -3.58935546875, -3.121826171875, -2.654296875, -2.186767578125, -1.71923828125, -1.251708984375, -0.7841796875, -0.316650390625, 0.15087890625, 0.618408203125, 1.0859375, 1.553466796875, 2.02099609375, 2.488525390625, 2.9560546875, 3.423583984375, 3.89111328125, 4.358642578125, 4.826171875, 5.293701171875, 5.76123046875, 6.228759765625, 6.6962890625, 7.163818359375, 7.63134765625, 8.098876953125, 8.56640625, 9.033935546875, 9.50146484375, 9.968994140625, 10.4365234375, 10.904052734375, 11.37158203125, 11.839111328125, 12.306640625, 12.774169921875, 13.24169921875, 13.709228515625, 14.1767578125, 14.644287109375, 15.11181640625, 15.579345703125, 16.046875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 8.0, 7.0, 7.0, 20.0, 14.0, 24.0, 19.0, 32.0, 31.0, 48.0, 59.0, 59.0, 67.0, 69.0, 79.0, 75.0, 63.0, 58.0, 54.0, 35.0, 44.0, 24.0, 25.0, 11.0, 16.0, 7.0, 9.0, 10.0, 5.0, 3.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-179.46360778808594, -174.63201904296875, -169.8004150390625, -164.96881103515625, -160.13722229003906, -155.30563354492188, -150.47402954101562, -145.64242553710938, -140.8108367919922, -135.979248046875, -131.14764404296875, -126.31604766845703, -121.48445129394531, -116.6528549194336, -111.82125854492188, -106.98966217041016, -102.15806579589844, -97.32646942138672, -92.494873046875, -87.66327667236328, -82.83168029785156, -78.00008392333984, -73.16848754882812, -68.3368911743164, -63.50529479980469, -58.67369842529297, -53.84210205078125, -49.01050567626953, -44.17890930175781, -39.347312927246094, -34.515716552734375, -29.684120178222656, -24.8525390625, -20.02094268798828, -15.189346313476562, -10.357749938964844, -5.526153564453125, -0.6945571899414062, 4.1370391845703125, 8.968635559082031, 13.80023193359375, 18.63182830810547, 23.463424682617188, 28.295021057128906, 33.126617431640625, 37.958213806152344, 42.78981018066406, 47.62140655517578, 52.4530029296875, 57.28459930419922, 62.11619567871094, 66.94779205322266, 71.77938842773438, 76.6109848022461, 81.44258117675781, 86.27417755126953, 91.10577392578125, 95.93737030029297, 100.76896667480469, 105.6005630493164, 110.43215942382812, 115.26375579833984, 120.09535217285156, 124.92694854736328, 129.758544921875]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 4.0, 7.0, 9.0, 8.0, 10.0, 6.0, 16.0, 22.0, 24.0, 30.0, 22.0, 33.0, 46.0, 56.0, 46.0, 45.0, 59.0, 52.0, 62.0, 63.0, 56.0, 49.0, 44.0, 33.0, 37.0, 38.0, 18.0, 13.0, 22.0, 15.0, 13.0, 11.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-125.78013610839844, -121.90802001953125, -118.0359115600586, -114.16380310058594, -110.29168701171875, -106.41957092285156, -102.5474624633789, -98.67535400390625, -94.80323791503906, -90.93112182617188, -87.05901336669922, -83.18690490722656, -79.31478881835938, -75.44267272949219, -71.57056427001953, -67.69845581054688, -63.82633972167969, -59.954227447509766, -56.082115173339844, -52.21000289916992, -48.337890625, -44.46577835083008, -40.593666076660156, -36.721553802490234, -32.84944152832031, -28.97732925415039, -25.10521697998047, -21.233104705810547, -17.360992431640625, -13.488880157470703, -9.616767883300781, -5.744655609130859, -1.8725433349609375, 1.9995689392089844, 5.871681213378906, 9.743793487548828, 13.61590576171875, 17.488018035888672, 21.360130310058594, 25.232242584228516, 29.104354858398438, 32.97646713256836, 36.84857940673828, 40.7206916809082, 44.592803955078125, 48.46491622924805, 52.33702850341797, 56.20914077758789, 60.08125305175781, 63.953365325927734, 67.82547760009766, 71.69758605957031, 75.5697021484375, 79.44181823730469, 83.31392669677734, 87.18603515625, 91.05815124511719, 94.93026733398438, 98.80237579345703, 102.67448425292969, 106.54660034179688, 110.41871643066406, 114.29082489013672, 118.16293334960938, 122.03504943847656]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 2.0, 11.0, 8.0, 11.0, 13.0, 18.0, 27.0, 23.0, 39.0, 30.0, 46.0, 62.0, 94.0, 146.0, 198.0, 294.0, 456.0, 806.0, 1468.0, 4237.0, 512340.0, 1600.0, 797.0, 460.0, 304.0, 191.0, 148.0, 96.0, 70.0, 59.0, 40.0, 24.0, 33.0, 14.0, 14.0, 13.0, 11.0, 10.0, 9.0, 8.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-2329.248291015625, -2258.72705078125, -2188.2060546875, -2117.684814453125, -2047.163818359375, -1976.642578125, -1906.1214599609375, -1835.600341796875, -1765.0792236328125, -1694.55810546875, -1624.0369873046875, -1553.515869140625, -1482.99462890625, -1412.4736328125, -1341.952392578125, -1271.4312744140625, -1200.91015625, -1130.3890380859375, -1059.867919921875, -989.3467407226562, -918.8256225585938, -848.3045043945312, -777.7833251953125, -707.26220703125, -636.7410888671875, -566.219970703125, -495.6988220214844, -425.17767333984375, -354.65655517578125, -284.13543701171875, -213.61428833007812, -143.0931396484375, -72.572265625, -2.0511322021484375, 68.47000122070312, 138.9911346435547, 209.51226806640625, 280.03338623046875, 350.5545349121094, 421.07568359375, 491.5968017578125, 562.117919921875, 632.6390380859375, 703.1602172851562, 773.6813354492188, 844.2024536132812, 914.7236328125, 985.2447509765625, 1055.765869140625, 1126.2869873046875, 1196.80810546875, 1267.3292236328125, 1337.850341796875, 1408.37158203125, 1478.8927001953125, 1549.413818359375, 1619.9349365234375, 1690.4560546875, 1760.9771728515625, 1831.498291015625, 1902.01953125, 1972.54052734375, 2043.061767578125, 2113.5830078125, 2184.10400390625]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 7.0, 2.0, 8.0, 9.0, 11.0, 7.0, 8.0, 25.0, 17.0, 34.0, 25.0, 26.0, 36.0, 62.0, 42.0, 41.0, 60.0, 1075.0, 68.0, 56.0, 64.0, 46.0, 51.0, 34.0, 37.0, 32.0, 31.0, 14.0, 20.0, 16.0, 12.0, 15.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4107.04736328125, -3982.537353515625, -3858.02734375, -3733.517333984375, -3609.00732421875, -3484.497314453125, -3359.9873046875, -3235.477294921875, -3110.96728515625, -2986.457275390625, -2861.947265625, -2737.437255859375, -2612.92724609375, -2488.417236328125, -2363.9072265625, -2239.397216796875, -2114.88720703125, -1990.377197265625, -1865.8671875, -1741.357177734375, -1616.84716796875, -1492.337158203125, -1367.8271484375, -1243.317138671875, -1118.80712890625, -994.297119140625, -869.787109375, -745.277099609375, -620.76708984375, -496.257080078125, -371.7470703125, -247.237060546875, -122.727294921875, 1.78271484375, 126.292724609375, 250.802734375, 375.312744140625, 499.82275390625, 624.332763671875, 748.8427734375, 873.352783203125, 997.86279296875, 1122.372802734375, 1246.8828125, 1371.392822265625, 1495.90283203125, 1620.412841796875, 1744.9228515625, 1869.432861328125, 1993.94287109375, 2118.452880859375, 2242.962890625, 2367.472900390625, 2491.98291015625, 2616.492919921875, 2741.0029296875, 2865.512939453125, 2990.02294921875, 3114.532958984375, 3239.04296875, 3363.552978515625, 3488.06298828125, 3612.572998046875, 3737.0830078125, 3861.593017578125]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 11.0, 15.0, 15.0, 21.0, 23.0, 39.0, 36.0, 46.0, 58.0, 84.0, 97.0, 120.0, 209.0, 383.0, 690.0, 1377.0, 2404.0, 4011.0, 8809.0, 31203860.0, 18826.0, 9726.0, 1608.0, 739.0, 379.0, 227.0, 140.0, 106.0, 81.0, 63.0, 49.0, 45.0, 40.0, 32.0, 23.0, 25.0, 14.0, 11.0, 14.0, 14.0, 7.0, 5.0, 4.0, 2.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2727.01513671875, -2643.531982421875, -2560.048828125, -2476.5654296875, -2393.082275390625, -2309.59912109375, -2226.115966796875, -2142.6328125, -2059.1494140625, -1975.666259765625, -1892.1829833984375, -1808.6998291015625, -1725.216552734375, -1641.7333984375, -1558.250244140625, -1474.76708984375, -1391.283935546875, -1307.80078125, -1224.3175048828125, -1140.8343505859375, -1057.35107421875, -973.867919921875, -890.384765625, -806.9015502929688, -723.4183349609375, -639.9351196289062, -556.451904296875, -472.96875, -389.48553466796875, -306.0023193359375, -222.51913452148438, -139.03594970703125, -55.552490234375, 27.930709838867188, 111.41390991210938, 194.89710998535156, 278.38031005859375, 361.863525390625, 445.3467102050781, 528.8298950195312, 612.3131103515625, 695.7963256835938, 779.279541015625, 862.7626953125, 946.2459106445312, 1029.7291259765625, 1113.2122802734375, 1196.695556640625, 1280.1787109375, 1363.661865234375, 1447.1451416015625, 1530.6282958984375, 1614.111572265625, 1697.5947265625, 1781.077880859375, 1864.56103515625, 1948.0443115234375, 2031.5274658203125, 2115.0107421875, 2198.493896484375, 2281.97705078125, 2365.46044921875, 2448.943603515625, 2532.4267578125, 2615.909912109375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 13.0, 22.0, 32.0, 52.0, 54.0, 93.0, 134.0, 206.0, 299.0, 396.0, 602.0, 839.0, 1394.0, 2276.0, 3450.0, 5744.0, 9429.0, 16818.0, 30531.0, 57884.0, 117381.0, 258450.0, 656203.0, 2029128.0, 1967592.0, 640271.0, 251579.0, 114232.0, 56230.0, 29890.0, 16332.0, 9135.0, 5499.0, 3307.0, 2048.0, 1279.0, 887.0, 533.0, 400.0, 259.0, 147.0, 110.0, 88.0, 52.0, 41.0, 34.0, 14.0, 11.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-141.0, -136.44921875, -131.8984375, -127.34765625, -122.796875, -118.24609375, -113.6953125, -109.14453125, -104.59375, -100.04296875, -95.4921875, -90.94140625, -86.390625, -81.83984375, -77.2890625, -72.73828125, -68.1875, -63.63671875, -59.0859375, -54.53515625, -49.984375, -45.43359375, -40.8828125, -36.33203125, -31.78125, -27.23046875, -22.6796875, -18.12890625, -13.578125, -9.02734375, -4.4765625, 0.07421875, 4.625, 9.17578125, 13.7265625, 18.27734375, 22.828125, 27.37890625, 31.9296875, 36.48046875, 41.03125, 45.58203125, 50.1328125, 54.68359375, 59.234375, 63.78515625, 68.3359375, 72.88671875, 77.4375, 81.98828125, 86.5390625, 91.08984375, 95.640625, 100.19140625, 104.7421875, 109.29296875, 113.84375, 118.39453125, 122.9453125, 127.49609375, 132.046875, 136.59765625, 141.1484375, 145.69921875, 150.25]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 7.0, 3.0, 13.0, 4.0, 7.0, 11.0, 9.0, 19.0, 17.0, 17.0, 16.0, 25.0, 39.0, 45.0, 39.0, 46.0, 67.0, 112.0, 83.0, 128.0, 131.0, 158.0, 132.0, 157.0, 105.0, 106.0, 98.0, 84.0, 57.0, 44.0, 39.0, 34.0, 31.0, 32.0, 21.0, 17.0, 6.0, 13.0, 17.0, 10.0, 3.0, 3.0, 3.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-41.625, -40.3349609375, -39.044921875, -37.7548828125, -36.46484375, -35.1748046875, -33.884765625, -32.5947265625, -31.3046875, -30.0146484375, -28.724609375, -27.4345703125, -26.14453125, -24.8544921875, -23.564453125, -22.2744140625, -20.984375, -19.6943359375, -18.404296875, -17.1142578125, -15.82421875, -14.5341796875, -13.244140625, -11.9541015625, -10.6640625, -9.3740234375, -8.083984375, -6.7939453125, -5.50390625, -4.2138671875, -2.923828125, -1.6337890625, -0.34375, 0.9462890625, 2.236328125, 3.5263671875, 4.81640625, 6.1064453125, 7.396484375, 8.6865234375, 9.9765625, 11.2666015625, 12.556640625, 13.8466796875, 15.13671875, 16.4267578125, 17.716796875, 19.0068359375, 20.296875, 21.5869140625, 22.876953125, 24.1669921875, 25.45703125, 26.7470703125, 28.037109375, 29.3271484375, 30.6171875, 31.9072265625, 33.197265625, 34.4873046875, 35.77734375, 37.0673828125, 38.357421875, 39.6474609375, 40.9375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 12.0, 17.0, 23.0, 36.0, 54.0, 97.0, 143.0, 215.0, 364.0, 524.0, 850.0, 1390.0, 2248.0, 3790.0, 6477.0, 11841.0, 21297.0, 39941.0, 76933.0, 147869.0, 287164.0, 583111.0, 1411813.0, 2042298.0, 844703.0, 391660.0, 197579.0, 102019.0, 52883.0, 28191.0, 15332.0, 8290.0, 4897.0, 2804.0, 1685.0, 1056.0, 623.0, 397.0, 274.0, 180.0, 112.0, 75.0, 55.0, 41.0, 19.0, 14.0, 7.0, 14.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-78.8125, -76.205078125, -73.59765625, -70.990234375, -68.3828125, -65.775390625, -63.16796875, -60.560546875, -57.953125, -55.345703125, -52.73828125, -50.130859375, -47.5234375, -44.916015625, -42.30859375, -39.701171875, -37.09375, -34.486328125, -31.87890625, -29.271484375, -26.6640625, -24.056640625, -21.44921875, -18.841796875, -16.234375, -13.626953125, -11.01953125, -8.412109375, -5.8046875, -3.197265625, -0.58984375, 2.017578125, 4.625, 7.232421875, 9.83984375, 12.447265625, 15.0546875, 17.662109375, 20.26953125, 22.876953125, 25.484375, 28.091796875, 30.69921875, 33.306640625, 35.9140625, 38.521484375, 41.12890625, 43.736328125, 46.34375, 48.951171875, 51.55859375, 54.166015625, 56.7734375, 59.380859375, 61.98828125, 64.595703125, 67.203125, 69.810546875, 72.41796875, 75.025390625, 77.6328125, 80.240234375, 82.84765625, 85.455078125, 88.0625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 5.0, 12.0, 15.0, 27.0, 29.0, 26.0, 48.0, 43.0, 61.0, 59.0, 76.0, 89.0, 81.0, 143.0, 142.0, 169.0, 163.0, 125.0, 127.0, 103.0, 102.0, 74.0, 38.0, 44.0, 44.0, 38.0, 25.0, 17.0, 19.0, 17.0, 14.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-64.1875, -62.294921875, -60.40234375, -58.509765625, -56.6171875, -54.724609375, -52.83203125, -50.939453125, -49.046875, -47.154296875, -45.26171875, -43.369140625, -41.4765625, -39.583984375, -37.69140625, -35.798828125, -33.90625, -32.013671875, -30.12109375, -28.228515625, -26.3359375, -24.443359375, -22.55078125, -20.658203125, -18.765625, -16.873046875, -14.98046875, -13.087890625, -11.1953125, -9.302734375, -7.41015625, -5.517578125, -3.625, -1.732421875, 0.16015625, 2.052734375, 3.9453125, 5.837890625, 7.73046875, 9.623046875, 11.515625, 13.408203125, 15.30078125, 17.193359375, 19.0859375, 20.978515625, 22.87109375, 24.763671875, 26.65625, 28.548828125, 30.44140625, 32.333984375, 34.2265625, 36.119140625, 38.01171875, 39.904296875, 41.796875, 43.689453125, 45.58203125, 47.474609375, 49.3671875, 51.259765625, 53.15234375, 55.044921875, 56.9375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 13.0, 8.0, 9.0, 11.0, 39.0, 52.0, 63.0, 75.0, 107.0, 166.0, 232.0, 422.0, 547.0, 874.0, 1307.0, 2269.0, 3511.0, 5424.0, 9240.0, 16062.0, 28370.0, 56795.0, 137509.0, 5461163.0, 374627.0, 94201.0, 42528.0, 22589.0, 12572.0, 7576.0, 4708.0, 2774.0, 1822.0, 1209.0, 838.0, 512.0, 359.0, 250.0, 172.0, 119.0, 80.0, 68.0, 49.0, 29.0, 22.0, 17.0, 14.0, 12.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-249.875, -241.767578125, -233.66015625, -225.552734375, -217.4453125, -209.337890625, -201.23046875, -193.123046875, -185.015625, -176.908203125, -168.80078125, -160.693359375, -152.5859375, -144.478515625, -136.37109375, -128.263671875, -120.15625, -112.048828125, -103.94140625, -95.833984375, -87.7265625, -79.619140625, -71.51171875, -63.404296875, -55.296875, -47.189453125, -39.08203125, -30.974609375, -22.8671875, -14.759765625, -6.65234375, 1.455078125, 9.5625, 17.669921875, 25.77734375, 33.884765625, 41.9921875, 50.099609375, 58.20703125, 66.314453125, 74.421875, 82.529296875, 90.63671875, 98.744140625, 106.8515625, 114.958984375, 123.06640625, 131.173828125, 139.28125, 147.388671875, 155.49609375, 163.603515625, 171.7109375, 179.818359375, 187.92578125, 196.033203125, 204.140625, 212.248046875, 220.35546875, 228.462890625, 236.5703125, 244.677734375, 252.78515625, 260.892578125, 269.0]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 7.0, 14.0, 11.0, 16.0, 17.0, 17.0, 24.0, 28.0, 24.0, 38.0, 48.0, 55.0, 46.0, 74.0, 106.0, 139.0, 186.0, 212.0, 228.0, 154.0, 132.0, 84.0, 72.0, 60.0, 43.0, 34.0, 25.0, 24.0, 23.0, 12.0, 16.0, 9.0, 9.0, 9.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-115.125, -112.06640625, -109.0078125, -105.94921875, -102.890625, -99.83203125, -96.7734375, -93.71484375, -90.65625, -87.59765625, -84.5390625, -81.48046875, -78.421875, -75.36328125, -72.3046875, -69.24609375, -66.1875, -63.12890625, -60.0703125, -57.01171875, -53.953125, -50.89453125, -47.8359375, -44.77734375, -41.71875, -38.66015625, -35.6015625, -32.54296875, -29.484375, -26.42578125, -23.3671875, -20.30859375, -17.25, -14.19140625, -11.1328125, -8.07421875, -5.015625, -1.95703125, 1.1015625, 4.16015625, 7.21875, 10.27734375, 13.3359375, 16.39453125, 19.453125, 22.51171875, 25.5703125, 28.62890625, 31.6875, 34.74609375, 37.8046875, 40.86328125, 43.921875, 46.98046875, 50.0390625, 53.09765625, 56.15625, 59.21484375, 62.2734375, 65.33203125, 68.390625, 71.44921875, 74.5078125, 77.56640625, 80.625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 6.0, 10.0, 19.0, 41.0, 65.0, 118.0, 481.0, 146.0, 48.0, 30.0, 11.0, 12.0, 5.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-29289.205078125, -28697.8671875, -28106.53125, -27515.193359375, -26923.85546875, -26332.517578125, -25741.1796875, -25149.84375, -24558.505859375, -23967.16796875, -23375.83203125, -22784.494140625, -22193.15625, -21601.818359375, -21010.48046875, -20419.14453125, -19827.806640625, -19236.46875, -18645.1328125, -18053.794921875, -17462.45703125, -16871.119140625, -16279.7822265625, -15688.4453125, -15097.107421875, -14505.76953125, -13914.4326171875, -13323.095703125, -12731.7578125, -12140.419921875, -11549.0830078125, -10957.74609375, -10366.40625, -9775.068359375, -9183.7314453125, -8592.39453125, -8001.056640625, -7409.71923828125, -6818.3818359375, -6227.04443359375, -5635.70703125, -5044.36962890625, -4453.0322265625, -3861.69482421875, -3270.357421875, -2679.02001953125, -2087.6826171875, -1496.34521484375, -905.0078125, -313.67041015625, 277.6669921875, 869.00439453125, 1460.341796875, 2051.67919921875, 2643.0166015625, 3234.35400390625, 3825.69140625, 4417.02880859375, 5008.3662109375, 5599.70361328125, 6191.041015625, 6782.37841796875, 7373.7158203125, 7965.05322265625, 8556.390625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 7.0, 2.0, 7.0, 1.0, 10.0, 1.0, 8.0, 7.0, 8.0, 10.0, 18.0, 10.0, 17.0, 21.0, 18.0, 19.0, 17.0, 22.0, 46.0, 76.0, 126.0, 165.0, 92.0, 54.0, 41.0, 23.0, 29.0, 24.0, 19.0, 10.0, 7.0, 12.0, 10.0, 12.0, 13.0, 10.0, 5.0, 4.0, 1.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2373.5947265625, -2302.244873046875, -2230.895263671875, -2159.54541015625, -2088.195556640625, -2016.845947265625, -1945.49609375, -1874.1463623046875, -1802.796630859375, -1731.4468994140625, -1660.0970458984375, -1588.747314453125, -1517.3975830078125, -1446.0478515625, -1374.697998046875, -1303.3482666015625, -1231.9984130859375, -1160.648681640625, -1089.298828125, -1017.9490966796875, -946.599365234375, -875.2495727539062, -803.8997802734375, -732.550048828125, -661.2002563476562, -589.8504638671875, -518.500732421875, -447.15093994140625, -375.8011779785156, -304.451416015625, -233.10162353515625, -161.75186157226562, -90.402099609375, -19.052330017089844, 52.29743957519531, 123.647216796875, 194.99697875976562, 266.34674072265625, 337.696533203125, 409.0462951660156, 480.39605712890625, 551.745849609375, 623.0955810546875, 694.4453735351562, 765.795166015625, 837.1448974609375, 908.4946899414062, 979.844482421875, 1051.1942138671875, 1122.5439453125, 1193.893798828125, 1265.2435302734375, 1336.59326171875, 1407.943115234375, 1479.2928466796875, 1550.642578125, 1621.992431640625, 1693.3421630859375, 1764.6920166015625, 1836.041748046875, 1907.3914794921875, 1978.7412109375, 2050.091064453125, 2121.44091796875, 2192.79052734375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 1.0, 5.0, 6.0, 8.0, 14.0, 14.0, 17.0, 28.0, 46.0, 50.0, 82.0, 127.0, 152.0, 240.0, 405.0, 589.0, 968.0, 1453.0, 2354.0, 3848.0, 6569.0, 11784.0, 22641.0, 47996.0, 137289.0, 843552.0, 2771360.0, 221554.0, 63832.0, 26600.0, 13072.0, 7207.0, 4245.0, 2476.0, 1452.0, 845.0, 523.0, 318.0, 214.0, 125.0, 76.0, 52.0, 31.0, 17.0, 12.0, 9.0, 5.0, 7.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-64.625, -62.78662109375, -60.9482421875, -59.10986328125, -57.271484375, -55.43310546875, -53.5947265625, -51.75634765625, -49.91796875, -48.07958984375, -46.2412109375, -44.40283203125, -42.564453125, -40.72607421875, -38.8876953125, -37.04931640625, -35.2109375, -33.37255859375, -31.5341796875, -29.69580078125, -27.857421875, -26.01904296875, -24.1806640625, -22.34228515625, -20.50390625, -18.66552734375, -16.8271484375, -14.98876953125, -13.150390625, -11.31201171875, -9.4736328125, -7.63525390625, -5.796875, -3.95849609375, -2.1201171875, -0.28173828125, 1.556640625, 3.39501953125, 5.2333984375, 7.07177734375, 8.91015625, 10.74853515625, 12.5869140625, 14.42529296875, 16.263671875, 18.10205078125, 19.9404296875, 21.77880859375, 23.6171875, 25.45556640625, 27.2939453125, 29.13232421875, 30.970703125, 32.80908203125, 34.6474609375, 36.48583984375, 38.32421875, 40.16259765625, 42.0009765625, 43.83935546875, 45.677734375, 47.51611328125, 49.3544921875, 51.19287109375, 53.03125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 2.0, 7.0, 11.0, 13.0, 29.0, 30.0, 40.0, 59.0, 62.0, 98.0, 110.0, 116.0, 99.0, 90.0, 56.0, 50.0, 30.0, 17.0, 20.0, 10.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.494140625, -3.39459228515625, -3.2950439453125, -3.19549560546875, -3.095947265625, -2.99639892578125, -2.8968505859375, -2.79730224609375, -2.69775390625, -2.59820556640625, -2.4986572265625, -2.39910888671875, -2.299560546875, -2.20001220703125, -2.1004638671875, -2.00091552734375, -1.9013671875, -1.80181884765625, -1.7022705078125, -1.60272216796875, -1.503173828125, -1.40362548828125, -1.3040771484375, -1.20452880859375, -1.10498046875, -1.00543212890625, -0.9058837890625, -0.80633544921875, -0.706787109375, -0.60723876953125, -0.5076904296875, -0.40814208984375, -0.30859375, -0.20904541015625, -0.1094970703125, -0.00994873046875, 0.089599609375, 0.18914794921875, 0.2886962890625, 0.38824462890625, 0.48779296875, 0.58734130859375, 0.6868896484375, 0.78643798828125, 0.885986328125, 0.98553466796875, 1.0850830078125, 1.18463134765625, 1.2841796875, 1.38372802734375, 1.4832763671875, 1.58282470703125, 1.682373046875, 1.78192138671875, 1.8814697265625, 1.98101806640625, 2.08056640625, 2.18011474609375, 2.2796630859375, 2.37921142578125, 2.478759765625, 2.57830810546875, 2.6778564453125, 2.77740478515625, 2.876953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 12.0, 14.0, 21.0, 39.0, 41.0, 94.0, 106.0, 160.0, 238.0, 400.0, 629.0, 1066.0, 1823.0, 3646.0, 7537.0, 18319.0, 48716.0, 148731.0, 570236.0, 2405466.0, 708703.0, 179679.0, 58367.0, 21610.0, 9199.0, 4211.0, 2116.0, 1225.0, 696.0, 405.0, 259.0, 167.0, 113.0, 78.0, 46.0, 35.0, 30.0, 12.0, 11.0, 10.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-54.3125, -52.6943359375, -51.076171875, -49.4580078125, -47.83984375, -46.2216796875, -44.603515625, -42.9853515625, -41.3671875, -39.7490234375, -38.130859375, -36.5126953125, -34.89453125, -33.2763671875, -31.658203125, -30.0400390625, -28.421875, -26.8037109375, -25.185546875, -23.5673828125, -21.94921875, -20.3310546875, -18.712890625, -17.0947265625, -15.4765625, -13.8583984375, -12.240234375, -10.6220703125, -9.00390625, -7.3857421875, -5.767578125, -4.1494140625, -2.53125, -0.9130859375, 0.705078125, 2.3232421875, 3.94140625, 5.5595703125, 7.177734375, 8.7958984375, 10.4140625, 12.0322265625, 13.650390625, 15.2685546875, 16.88671875, 18.5048828125, 20.123046875, 21.7412109375, 23.359375, 24.9775390625, 26.595703125, 28.2138671875, 29.83203125, 31.4501953125, 33.068359375, 34.6865234375, 36.3046875, 37.9228515625, 39.541015625, 41.1591796875, 42.77734375, 44.3955078125, 46.013671875, 47.6318359375, 49.25]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 9.0, 0.0, 10.0, 10.0, 17.0, 16.0, 32.0, 53.0, 68.0, 92.0, 118.0, 149.0, 251.0, 297.0, 424.0, 713.0, 436.0, 318.0, 262.0, 181.0, 158.0, 127.0, 92.0, 53.0, 51.0, 37.0, 21.0, 21.0, 14.0, 10.0, 11.0, 4.0, 3.0, 7.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.4453125, -14.013671875, -13.58203125, -13.150390625, -12.71875, -12.287109375, -11.85546875, -11.423828125, -10.9921875, -10.560546875, -10.12890625, -9.697265625, -9.265625, -8.833984375, -8.40234375, -7.970703125, -7.5390625, -7.107421875, -6.67578125, -6.244140625, -5.8125, -5.380859375, -4.94921875, -4.517578125, -4.0859375, -3.654296875, -3.22265625, -2.791015625, -2.359375, -1.927734375, -1.49609375, -1.064453125, -0.6328125, -0.201171875, 0.23046875, 0.662109375, 1.09375, 1.525390625, 1.95703125, 2.388671875, 2.8203125, 3.251953125, 3.68359375, 4.115234375, 4.546875, 4.978515625, 5.41015625, 5.841796875, 6.2734375, 6.705078125, 7.13671875, 7.568359375, 8.0, 8.431640625, 8.86328125, 9.294921875, 9.7265625, 10.158203125, 10.58984375, 11.021484375, 11.453125, 11.884765625, 12.31640625, 12.748046875, 13.1796875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 16.0, 47.0, 124.0, 280.0, 285.0, 138.0, 63.0, 22.0, 17.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-395.7984619140625, -379.9058837890625, -364.0133361816406, -348.1207580566406, -332.2281799316406, -316.33563232421875, -300.44305419921875, -284.55047607421875, -268.65789794921875, -252.7653350830078, -236.8727569580078, -220.98019409179688, -205.08761596679688, -189.19505310058594, -173.302490234375, -157.409912109375, -141.51734924316406, -125.6247787475586, -109.73220825195312, -93.83964538574219, -77.94706726074219, -62.05450439453125, -46.16193389892578, -30.269363403320312, -14.376792907714844, 1.5157766342163086, 17.40834617614746, 33.3009147644043, 49.193485260009766, 65.08605194091797, 80.97862243652344, 96.8711929321289, 112.76376342773438, 128.6563262939453, 144.5489044189453, 160.44146728515625, 176.33404541015625, 192.2266082763672, 208.11917114257812, 224.01174926757812, 239.90432739257812, 255.79689025878906, 271.689453125, 287.58203125, 303.474609375, 319.3671875, 335.2597351074219, 351.1523132324219, 367.04486083984375, 382.93743896484375, 398.8299865722656, 414.7225646972656, 430.6151428222656, 446.5076904296875, 462.4002685546875, 478.2928466796875, 494.1854248046875, 510.0780029296875, 525.9705810546875, 541.8631591796875, 557.7556762695312, 573.6482543945312, 589.5408325195312, 605.4334106445312, 621.3259887695312]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 11.0, 13.0, 13.0, 27.0, 23.0, 39.0, 50.0, 39.0, 60.0, 59.0, 52.0, 56.0, 59.0, 59.0, 57.0, 58.0, 64.0, 52.0, 30.0, 44.0, 30.0, 19.0, 20.0, 12.0, 14.0, 5.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-125.65234375, -121.87139892578125, -118.0904541015625, -114.30950164794922, -110.52855682373047, -106.74761199951172, -102.96665954589844, -99.18571472167969, -95.40476989746094, -91.62382507324219, -87.84288024902344, -84.06192779541016, -80.2809829711914, -76.50003814697266, -72.71908569335938, -68.93814086914062, -65.15719604492188, -61.376251220703125, -57.59530258178711, -53.814353942871094, -50.033409118652344, -46.252464294433594, -42.47151565551758, -38.69056701660156, -34.90962219238281, -31.12867546081543, -27.347728729248047, -23.566781997680664, -19.78583526611328, -16.0048885345459, -12.223941802978516, -8.442995071411133, -4.662055969238281, -0.8811092376708984, 2.8998374938964844, 6.680784225463867, 10.46173095703125, 14.242677688598633, 18.023624420166016, 21.8045711517334, 25.58551788330078, 29.366464614868164, 33.14741134643555, 36.92835998535156, 40.70930480957031, 44.49024963378906, 48.27119827270508, 52.052146911621094, 55.833091735839844, 59.614036560058594, 63.39498519897461, 67.17593383789062, 70.95687866210938, 74.73782348632812, 78.51876831054688, 82.29972076416016, 86.0806655883789, 89.86161041259766, 93.64256286621094, 97.42350769042969, 101.20445251464844, 104.98539733886719, 108.76634216308594, 112.54729461669922, 116.32823944091797]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 7.0, 5.0, 8.0, 9.0, 17.0, 18.0, 20.0, 22.0, 34.0, 52.0, 98.0, 140.0, 212.0, 394.0, 883.0, 2281.0, 7240.0, 31933.0, 219958.0, 664303.0, 95930.0, 17323.0, 4568.0, 1560.0, 645.0, 301.0, 182.0, 109.0, 79.0, 49.0, 30.0, 33.0, 22.0, 18.0, 16.0, 9.0, 13.0, 10.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-51.5625, -50.10205078125, -48.6416015625, -47.18115234375, -45.720703125, -44.26025390625, -42.7998046875, -41.33935546875, -39.87890625, -38.41845703125, -36.9580078125, -35.49755859375, -34.037109375, -32.57666015625, -31.1162109375, -29.65576171875, -28.1953125, -26.73486328125, -25.2744140625, -23.81396484375, -22.353515625, -20.89306640625, -19.4326171875, -17.97216796875, -16.51171875, -15.05126953125, -13.5908203125, -12.13037109375, -10.669921875, -9.20947265625, -7.7490234375, -6.28857421875, -4.828125, -3.36767578125, -1.9072265625, -0.44677734375, 1.013671875, 2.47412109375, 3.9345703125, 5.39501953125, 6.85546875, 8.31591796875, 9.7763671875, 11.23681640625, 12.697265625, 14.15771484375, 15.6181640625, 17.07861328125, 18.5390625, 19.99951171875, 21.4599609375, 22.92041015625, 24.380859375, 25.84130859375, 27.3017578125, 28.76220703125, 30.22265625, 31.68310546875, 33.1435546875, 34.60400390625, 36.064453125, 37.52490234375, 38.9853515625, 40.44580078125, 41.90625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 4.0, 14.0, 20.0, 38.0, 62.0, 87.0, 124.0, 131.0, 126.0, 115.0, 104.0, 72.0, 33.0, 31.0, 19.0, 12.0, 7.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.649169921875, -4.40771484375, -4.166259765625, -3.9248046875, -3.683349609375, -3.44189453125, -3.200439453125, -2.958984375, -2.717529296875, -2.47607421875, -2.234619140625, -1.9931640625, -1.751708984375, -1.51025390625, -1.268798828125, -1.02734375, -0.785888671875, -0.54443359375, -0.302978515625, -0.0615234375, 0.179931640625, 0.42138671875, 0.662841796875, 0.904296875, 1.145751953125, 1.38720703125, 1.628662109375, 1.8701171875, 2.111572265625, 2.35302734375, 2.594482421875, 2.8359375, 3.077392578125, 3.31884765625, 3.560302734375, 3.8017578125, 4.043212890625, 4.28466796875, 4.526123046875, 4.767578125, 5.009033203125, 5.25048828125, 5.491943359375, 5.7333984375, 5.974853515625, 6.21630859375, 6.457763671875, 6.69921875, 6.940673828125, 7.18212890625, 7.423583984375, 7.6650390625, 7.906494140625, 8.14794921875, 8.389404296875, 8.630859375, 8.872314453125, 9.11376953125, 9.355224609375, 9.5966796875, 9.838134765625, 10.07958984375, 10.321044921875, 10.5625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 11.0, 9.0, 11.0, 9.0, 13.0, 36.0, 50.0, 54.0, 85.0, 135.0, 213.0, 328.0, 568.0, 961.0, 1502.0, 2986.0, 5711.0, 11842.0, 27104.0, 72878.0, 246813.0, 451202.0, 142374.0, 46946.0, 18568.0, 8672.0, 4167.0, 2223.0, 1282.0, 705.0, 393.0, 251.0, 166.0, 92.0, 71.0, 43.0, 30.0, 18.0, 13.0, 4.0, 6.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.890625, -27.0771484375, -26.263671875, -25.4501953125, -24.63671875, -23.8232421875, -23.009765625, -22.1962890625, -21.3828125, -20.5693359375, -19.755859375, -18.9423828125, -18.12890625, -17.3154296875, -16.501953125, -15.6884765625, -14.875, -14.0615234375, -13.248046875, -12.4345703125, -11.62109375, -10.8076171875, -9.994140625, -9.1806640625, -8.3671875, -7.5537109375, -6.740234375, -5.9267578125, -5.11328125, -4.2998046875, -3.486328125, -2.6728515625, -1.859375, -1.0458984375, -0.232421875, 0.5810546875, 1.39453125, 2.2080078125, 3.021484375, 3.8349609375, 4.6484375, 5.4619140625, 6.275390625, 7.0888671875, 7.90234375, 8.7158203125, 9.529296875, 10.3427734375, 11.15625, 11.9697265625, 12.783203125, 13.5966796875, 14.41015625, 15.2236328125, 16.037109375, 16.8505859375, 17.6640625, 18.4775390625, 19.291015625, 20.1044921875, 20.91796875, 21.7314453125, 22.544921875, 23.3583984375, 24.171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 8.0, 12.0, 12.0, 19.0, 22.0, 33.0, 42.0, 48.0, 34.0, 52.0, 49.0, 55.0, 55.0, 59.0, 46.0, 58.0, 66.0, 42.0, 60.0, 30.0, 29.0, 35.0, 18.0, 28.0, 20.0, 15.0, 12.0, 9.0, 7.0, 5.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.25, -22.402587890625, -21.55517578125, -20.707763671875, -19.8603515625, -19.012939453125, -18.16552734375, -17.318115234375, -16.470703125, -15.623291015625, -14.77587890625, -13.928466796875, -13.0810546875, -12.233642578125, -11.38623046875, -10.538818359375, -9.69140625, -8.843994140625, -7.99658203125, -7.149169921875, -6.3017578125, -5.454345703125, -4.60693359375, -3.759521484375, -2.912109375, -2.064697265625, -1.21728515625, -0.369873046875, 0.4775390625, 1.324951171875, 2.17236328125, 3.019775390625, 3.8671875, 4.714599609375, 5.56201171875, 6.409423828125, 7.2568359375, 8.104248046875, 8.95166015625, 9.799072265625, 10.646484375, 11.493896484375, 12.34130859375, 13.188720703125, 14.0361328125, 14.883544921875, 15.73095703125, 16.578369140625, 17.42578125, 18.273193359375, 19.12060546875, 19.968017578125, 20.8154296875, 21.662841796875, 22.51025390625, 23.357666015625, 24.205078125, 25.052490234375, 25.89990234375, 26.747314453125, 27.5947265625, 28.442138671875, 29.28955078125, 30.136962890625, 30.984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 4.0, 16.0, 21.0, 14.0, 30.0, 36.0, 66.0, 73.0, 118.0, 168.0, 364.0, 583.0, 1083.0, 2217.0, 4904.0, 12541.0, 40369.0, 183660.0, 563533.0, 177964.0, 39024.0, 12239.0, 4822.0, 2059.0, 1077.0, 587.0, 320.0, 219.0, 151.0, 96.0, 43.0, 33.0, 27.0, 13.0, 15.0, 8.0, 8.0, 7.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-25.109375, -24.359619140625, -23.60986328125, -22.860107421875, -22.1103515625, -21.360595703125, -20.61083984375, -19.861083984375, -19.111328125, -18.361572265625, -17.61181640625, -16.862060546875, -16.1123046875, -15.362548828125, -14.61279296875, -13.863037109375, -13.11328125, -12.363525390625, -11.61376953125, -10.864013671875, -10.1142578125, -9.364501953125, -8.61474609375, -7.864990234375, -7.115234375, -6.365478515625, -5.61572265625, -4.865966796875, -4.1162109375, -3.366455078125, -2.61669921875, -1.866943359375, -1.1171875, -0.367431640625, 0.38232421875, 1.132080078125, 1.8818359375, 2.631591796875, 3.38134765625, 4.131103515625, 4.880859375, 5.630615234375, 6.38037109375, 7.130126953125, 7.8798828125, 8.629638671875, 9.37939453125, 10.129150390625, 10.87890625, 11.628662109375, 12.37841796875, 13.128173828125, 13.8779296875, 14.627685546875, 15.37744140625, 16.127197265625, 16.876953125, 17.626708984375, 18.37646484375, 19.126220703125, 19.8759765625, 20.625732421875, 21.37548828125, 22.125244140625, 22.875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 2.0, 7.0, 7.0, 10.0, 13.0, 10.0, 20.0, 23.0, 47.0, 40.0, 45.0, 63.0, 78.0, 88.0, 78.0, 91.0, 78.0, 73.0, 46.0, 40.0, 24.0, 26.0, 27.0, 12.0, 14.0, 10.0, 7.0, 9.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010595321655273438, -0.001018241047859192, -0.00097694993019104, -0.0009356588125228882, -0.0008943676948547363, -0.0008530765771865845, -0.0008117854595184326, -0.0007704943418502808, -0.0007292032241821289, -0.000687912106513977, -0.0006466209888458252, -0.0006053298711776733, -0.0005640387535095215, -0.0005227476358413696, -0.0004814565181732178, -0.0004401654005050659, -0.00039887428283691406, -0.0003575831651687622, -0.00031629204750061035, -0.0002750009298324585, -0.00023370981216430664, -0.00019241869449615479, -0.00015112757682800293, -0.00010983645915985107, -6.854534149169922e-05, -2.7254223823547363e-05, 1.4036893844604492e-05, 5.532801151275635e-05, 9.66191291809082e-05, 0.00013791024684906006, 0.00017920136451721191, 0.00022049248218536377, 0.0002617835998535156, 0.0003030747175216675, 0.00034436583518981934, 0.0003856569528579712, 0.00042694807052612305, 0.0004682391881942749, 0.0005095303058624268, 0.0005508214235305786, 0.0005921125411987305, 0.0006334036588668823, 0.0006746947765350342, 0.000715985894203186, 0.0007572770118713379, 0.0007985681295394897, 0.0008398592472076416, 0.0008811503648757935, 0.0009224414825439453, 0.0009637326002120972, 0.001005023717880249, 0.0010463148355484009, 0.0010876059532165527, 0.0011288970708847046, 0.0011701881885528564, 0.0012114793062210083, 0.0012527704238891602, 0.001294061541557312, 0.0013353526592254639, 0.0013766437768936157, 0.0014179348945617676, 0.0014592260122299194, 0.0015005171298980713, 0.0015418082475662231, 0.001583099365234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 9.0, 16.0, 14.0, 26.0, 37.0, 47.0, 82.0, 121.0, 219.0, 402.0, 708.0, 1374.0, 3218.0, 8486.0, 26476.0, 110768.0, 494135.0, 311670.0, 63025.0, 17089.0, 5687.0, 2442.0, 1121.0, 601.0, 304.0, 171.0, 111.0, 65.0, 39.0, 34.0, 22.0, 12.0, 8.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.03125, -22.307373046875, -21.58349609375, -20.859619140625, -20.1357421875, -19.411865234375, -18.68798828125, -17.964111328125, -17.240234375, -16.516357421875, -15.79248046875, -15.068603515625, -14.3447265625, -13.620849609375, -12.89697265625, -12.173095703125, -11.44921875, -10.725341796875, -10.00146484375, -9.277587890625, -8.5537109375, -7.829833984375, -7.10595703125, -6.382080078125, -5.658203125, -4.934326171875, -4.21044921875, -3.486572265625, -2.7626953125, -2.038818359375, -1.31494140625, -0.591064453125, 0.1328125, 0.856689453125, 1.58056640625, 2.304443359375, 3.0283203125, 3.752197265625, 4.47607421875, 5.199951171875, 5.923828125, 6.647705078125, 7.37158203125, 8.095458984375, 8.8193359375, 9.543212890625, 10.26708984375, 10.990966796875, 11.71484375, 12.438720703125, 13.16259765625, 13.886474609375, 14.6103515625, 15.334228515625, 16.05810546875, 16.781982421875, 17.505859375, 18.229736328125, 18.95361328125, 19.677490234375, 20.4013671875, 21.125244140625, 21.84912109375, 22.572998046875, 23.296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 4.0, 4.0, 8.0, 11.0, 10.0, 12.0, 19.0, 38.0, 33.0, 48.0, 68.0, 64.0, 57.0, 70.0, 65.0, 84.0, 81.0, 64.0, 50.0, 37.0, 39.0, 40.0, 32.0, 18.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5390625, -9.2041015625, -8.869140625, -8.5341796875, -8.19921875, -7.8642578125, -7.529296875, -7.1943359375, -6.859375, -6.5244140625, -6.189453125, -5.8544921875, -5.51953125, -5.1845703125, -4.849609375, -4.5146484375, -4.1796875, -3.8447265625, -3.509765625, -3.1748046875, -2.83984375, -2.5048828125, -2.169921875, -1.8349609375, -1.5, -1.1650390625, -0.830078125, -0.4951171875, -0.16015625, 0.1748046875, 0.509765625, 0.8447265625, 1.1796875, 1.5146484375, 1.849609375, 2.1845703125, 2.51953125, 2.8544921875, 3.189453125, 3.5244140625, 3.859375, 4.1943359375, 4.529296875, 4.8642578125, 5.19921875, 5.5341796875, 5.869140625, 6.2041015625, 6.5390625, 6.8740234375, 7.208984375, 7.5439453125, 7.87890625, 8.2138671875, 8.548828125, 8.8837890625, 9.21875, 9.5537109375, 9.888671875, 10.2236328125, 10.55859375, 10.8935546875, 11.228515625, 11.5634765625, 11.8984375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 7.0, 7.0, 18.0, 40.0, 56.0, 141.0, 227.0, 227.0, 115.0, 68.0, 30.0, 20.0, 14.0, 3.0, 8.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.4768829345703, -195.0966339111328, -184.71636962890625, -174.33612060546875, -163.9558563232422, -153.5756072998047, -143.19534301757812, -132.81509399414062, -122.4348373413086, -112.05458068847656, -101.67432403564453, -91.2940673828125, -80.913818359375, -70.53355407714844, -60.15330505371094, -49.773048400878906, -39.392791748046875, -29.012535095214844, -18.632280349731445, -8.252025604248047, 2.1282310485839844, 12.508487701416016, 22.88874053955078, 33.26899719238281, 43.649253845214844, 54.029510498046875, 64.4097671508789, 74.79002380371094, 85.17027282714844, 95.550537109375, 105.9307861328125, 116.31104278564453, 126.69131469726562, 137.07156372070312, 147.4518280029297, 157.8320770263672, 168.21234130859375, 178.59259033203125, 188.97283935546875, 199.3531036376953, 209.73336791992188, 220.11361694335938, 230.49388122558594, 240.87413024902344, 251.25439453125, 261.6346435546875, 272.014892578125, 282.3951416015625, 292.775390625, 303.1556396484375, 313.535888671875, 323.9161682128906, 334.2964172363281, 344.6766662597656, 355.0569152832031, 365.43719482421875, 375.81744384765625, 386.19769287109375, 396.57794189453125, 406.9582214355469, 417.3384704589844, 427.7187194824219, 438.0989685058594, 448.479248046875, 458.8594970703125]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 6.0, 7.0, 8.0, 17.0, 18.0, 56.0, 69.0, 119.0, 139.0, 174.0, 134.0, 97.0, 41.0, 30.0, 23.0, 16.0, 12.0, 5.0, 8.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-405.77960205078125, -393.95550537109375, -382.13140869140625, -370.30731201171875, -358.48321533203125, -346.65911865234375, -334.83502197265625, -323.01092529296875, -311.18682861328125, -299.36273193359375, -287.53863525390625, -275.71453857421875, -263.89044189453125, -252.06634521484375, -240.2422637939453, -228.4181671142578, -216.59408569335938, -204.76998901367188, -192.94589233398438, -181.12179565429688, -169.29769897460938, -157.47360229492188, -145.64952087402344, -133.82542419433594, -122.00132751464844, -110.17723083496094, -98.35313415527344, -86.52904510498047, -74.70494842529297, -62.88085174560547, -51.0567626953125, -39.232666015625, -27.4085693359375, -15.584474563598633, -3.7603797912597656, 8.063713073730469, 19.88780975341797, 31.71190643310547, 43.53599548339844, 55.36009216308594, 67.18418884277344, 79.00828552246094, 90.83238220214844, 102.6564712524414, 114.4805679321289, 126.3046646118164, 138.12875366210938, 149.95285034179688, 161.77694702148438, 173.60104370117188, 185.42514038085938, 197.24923706054688, 209.07333374023438, 220.89743041992188, 232.7215118408203, 244.5456085205078, 256.36968994140625, 268.19378662109375, 280.01788330078125, 291.84197998046875, 303.66607666015625, 315.49017333984375, 327.31427001953125, 339.13836669921875, 350.96246337890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 9.0, 13.0, 13.0, 21.0, 36.0, 62.0, 94.0, 146.0, 232.0, 452.0, 849.0, 1666.0, 3657.0, 9032.0, 29492.0, 165049.0, 3784712.0, 155120.0, 27674.0, 8902.0, 3492.0, 1623.0, 826.0, 422.0, 261.0, 155.0, 88.0, 70.0, 39.0, 18.0, 11.0, 11.0, 8.0, 10.0, 8.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-108.5625, -104.4638671875, -100.365234375, -96.2666015625, -92.16796875, -88.0693359375, -83.970703125, -79.8720703125, -75.7734375, -71.6748046875, -67.576171875, -63.4775390625, -59.37890625, -55.2802734375, -51.181640625, -47.0830078125, -42.984375, -38.8857421875, -34.787109375, -30.6884765625, -26.58984375, -22.4912109375, -18.392578125, -14.2939453125, -10.1953125, -6.0966796875, -1.998046875, 2.1005859375, 6.19921875, 10.2978515625, 14.396484375, 18.4951171875, 22.59375, 26.6923828125, 30.791015625, 34.8896484375, 38.98828125, 43.0869140625, 47.185546875, 51.2841796875, 55.3828125, 59.4814453125, 63.580078125, 67.6787109375, 71.77734375, 75.8759765625, 79.974609375, 84.0732421875, 88.171875, 92.2705078125, 96.369140625, 100.4677734375, 104.56640625, 108.6650390625, 112.763671875, 116.8623046875, 120.9609375, 125.0595703125, 129.158203125, 133.2568359375, 137.35546875, 141.4541015625, 145.552734375, 149.6513671875, 153.75]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 9.0, 8.0, 12.0, 17.0, 37.0, 24.0, 51.0, 68.0, 63.0, 72.0, 79.0, 82.0, 75.0, 81.0, 75.0, 65.0, 43.0, 38.0, 24.0, 19.0, 17.0, 8.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.96856689453125, -4.8160400390625, -4.66351318359375, -4.510986328125, -4.35845947265625, -4.2059326171875, -4.05340576171875, -3.90087890625, -3.74835205078125, -3.5958251953125, -3.44329833984375, -3.290771484375, -3.13824462890625, -2.9857177734375, -2.83319091796875, -2.6806640625, -2.52813720703125, -2.3756103515625, -2.22308349609375, -2.070556640625, -1.91802978515625, -1.7655029296875, -1.61297607421875, -1.46044921875, -1.30792236328125, -1.1553955078125, -1.00286865234375, -0.850341796875, -0.69781494140625, -0.5452880859375, -0.39276123046875, -0.240234375, -0.08770751953125, 0.0648193359375, 0.21734619140625, 0.369873046875, 0.52239990234375, 0.6749267578125, 0.82745361328125, 0.97998046875, 1.13250732421875, 1.2850341796875, 1.43756103515625, 1.590087890625, 1.74261474609375, 1.8951416015625, 2.04766845703125, 2.2001953125, 2.35272216796875, 2.5052490234375, 2.65777587890625, 2.810302734375, 2.96282958984375, 3.1153564453125, 3.26788330078125, 3.42041015625, 3.57293701171875, 3.7254638671875, 3.87799072265625, 4.030517578125, 4.18304443359375, 4.3355712890625, 4.48809814453125, 4.640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 4.0, 9.0, 6.0, 17.0, 21.0, 30.0, 36.0, 70.0, 82.0, 110.0, 161.0, 278.0, 457.0, 683.0, 1169.0, 2094.0, 3751.0, 7322.0, 14622.0, 31833.0, 78664.0, 261681.0, 3023380.0, 557711.0, 123569.0, 45608.0, 19946.0, 9664.0, 5020.0, 2636.0, 1472.0, 868.0, 471.0, 305.0, 183.0, 100.0, 79.0, 52.0, 44.0, 28.0, 15.0, 12.0, 4.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.625, -77.3310546875, -75.037109375, -72.7431640625, -70.44921875, -68.1552734375, -65.861328125, -63.5673828125, -61.2734375, -58.9794921875, -56.685546875, -54.3916015625, -52.09765625, -49.8037109375, -47.509765625, -45.2158203125, -42.921875, -40.6279296875, -38.333984375, -36.0400390625, -33.74609375, -31.4521484375, -29.158203125, -26.8642578125, -24.5703125, -22.2763671875, -19.982421875, -17.6884765625, -15.39453125, -13.1005859375, -10.806640625, -8.5126953125, -6.21875, -3.9248046875, -1.630859375, 0.6630859375, 2.95703125, 5.2509765625, 7.544921875, 9.8388671875, 12.1328125, 14.4267578125, 16.720703125, 19.0146484375, 21.30859375, 23.6025390625, 25.896484375, 28.1904296875, 30.484375, 32.7783203125, 35.072265625, 37.3662109375, 39.66015625, 41.9541015625, 44.248046875, 46.5419921875, 48.8359375, 51.1298828125, 53.423828125, 55.7177734375, 58.01171875, 60.3056640625, 62.599609375, 64.8935546875, 67.1875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 6.0, 8.0, 4.0, 12.0, 18.0, 24.0, 28.0, 30.0, 38.0, 46.0, 86.0, 104.0, 143.0, 219.0, 506.0, 1686.0, 388.0, 194.0, 144.0, 88.0, 65.0, 59.0, 31.0, 34.0, 27.0, 22.0, 11.0, 13.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.84375, -12.45849609375, -12.0732421875, -11.68798828125, -11.302734375, -10.91748046875, -10.5322265625, -10.14697265625, -9.76171875, -9.37646484375, -8.9912109375, -8.60595703125, -8.220703125, -7.83544921875, -7.4501953125, -7.06494140625, -6.6796875, -6.29443359375, -5.9091796875, -5.52392578125, -5.138671875, -4.75341796875, -4.3681640625, -3.98291015625, -3.59765625, -3.21240234375, -2.8271484375, -2.44189453125, -2.056640625, -1.67138671875, -1.2861328125, -0.90087890625, -0.515625, -0.13037109375, 0.2548828125, 0.64013671875, 1.025390625, 1.41064453125, 1.7958984375, 2.18115234375, 2.56640625, 2.95166015625, 3.3369140625, 3.72216796875, 4.107421875, 4.49267578125, 4.8779296875, 5.26318359375, 5.6484375, 6.03369140625, 6.4189453125, 6.80419921875, 7.189453125, 7.57470703125, 7.9599609375, 8.34521484375, 8.73046875, 9.11572265625, 9.5009765625, 9.88623046875, 10.271484375, 10.65673828125, 11.0419921875, 11.42724609375, 11.8125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 2.0, 6.0, 7.0, 15.0, 38.0, 74.0, 153.0, 175.0, 241.0, 161.0, 82.0, 27.0, 14.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-146.32127380371094, -141.4709930419922, -136.62069702148438, -131.77041625976562, -126.92013549804688, -122.06985473632812, -117.21956634521484, -112.36927795410156, -107.51899719238281, -102.66871643066406, -97.81842803955078, -92.9681396484375, -88.11785888671875, -83.267578125, -78.41728973388672, -73.56700134277344, -68.71672058105469, -63.86643600463867, -59.016151428222656, -54.16586685180664, -49.315582275390625, -44.46529769897461, -39.615013122558594, -34.76472854614258, -29.914443969726562, -25.064159393310547, -20.21387481689453, -15.363590240478516, -10.5133056640625, -5.663021087646484, -0.8127365112304688, 4.037548065185547, 8.8878173828125, 13.738101959228516, 18.58838653564453, 23.438671112060547, 28.288955688476562, 33.13924026489258, 37.989524841308594, 42.83980941772461, 47.690093994140625, 52.54037857055664, 57.390663146972656, 62.24094772338867, 67.09123229980469, 71.94151306152344, 76.79180145263672, 81.64208984375, 86.49237060546875, 91.3426513671875, 96.19293975830078, 101.04322814941406, 105.89350891113281, 110.74378967285156, 115.59407806396484, 120.44436645507812, 125.29464721679688, 130.14492797851562, 134.99520874023438, 139.8455047607422, 144.69578552246094, 149.5460662841797, 154.3963623046875, 159.24664306640625, 164.096923828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 6.0, 7.0, 5.0, 11.0, 13.0, 15.0, 26.0, 27.0, 36.0, 47.0, 50.0, 70.0, 49.0, 80.0, 72.0, 79.0, 47.0, 71.0, 44.0, 46.0, 38.0, 38.0, 34.0, 22.0, 16.0, 22.0, 10.0, 9.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.88868713378906, -76.93315887451172, -74.9776382446289, -73.02210998535156, -71.06658172607422, -69.11105346679688, -67.15553283691406, -65.20000457763672, -63.244476318359375, -61.2889518737793, -59.33342361450195, -57.377899169921875, -55.42237091064453, -53.46684646606445, -51.511322021484375, -49.55579376220703, -47.60026931762695, -45.644744873046875, -43.68921661376953, -41.73369216918945, -39.77816390991211, -37.82263946533203, -35.86711120605469, -33.91158676147461, -31.9560604095459, -30.000534057617188, -28.045007705688477, -26.089481353759766, -24.133956909179688, -22.178428649902344, -20.222904205322266, -18.267377853393555, -16.311851501464844, -14.356325149536133, -12.400798797607422, -10.445273399353027, -8.489747047424316, -6.5342206954956055, -4.578695297241211, -2.6231689453125, -0.6676425933837891, 1.2878835201263428, 3.2434096336364746, 5.198935508728027, 7.154461860656738, 9.10998821258545, 11.065513610839844, 13.021039962768555, 14.976566314697266, 16.932092666625977, 18.887619018554688, 20.843143463134766, 22.79867172241211, 24.754196166992188, 26.7097225189209, 28.66524887084961, 30.62077522277832, 32.57630157470703, 34.53182601928711, 36.48735427856445, 38.44287872314453, 40.398406982421875, 42.35393142700195, 44.30945587158203, 46.264984130859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 4.0, 7.0, 9.0, 12.0, 16.0, 36.0, 24.0, 56.0, 94.0, 147.0, 239.0, 551.0, 1480.0, 4683.0, 21491.0, 229595.0, 719825.0, 57255.0, 8920.0, 2364.0, 867.0, 358.0, 184.0, 101.0, 69.0, 51.0, 31.0, 14.0, 13.0, 14.0, 10.0, 1.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-100.5625, -97.123046875, -93.68359375, -90.244140625, -86.8046875, -83.365234375, -79.92578125, -76.486328125, -73.046875, -69.607421875, -66.16796875, -62.728515625, -59.2890625, -55.849609375, -52.41015625, -48.970703125, -45.53125, -42.091796875, -38.65234375, -35.212890625, -31.7734375, -28.333984375, -24.89453125, -21.455078125, -18.015625, -14.576171875, -11.13671875, -7.697265625, -4.2578125, -0.818359375, 2.62109375, 6.060546875, 9.5, 12.939453125, 16.37890625, 19.818359375, 23.2578125, 26.697265625, 30.13671875, 33.576171875, 37.015625, 40.455078125, 43.89453125, 47.333984375, 50.7734375, 54.212890625, 57.65234375, 61.091796875, 64.53125, 67.970703125, 71.41015625, 74.849609375, 78.2890625, 81.728515625, 85.16796875, 88.607421875, 92.046875, 95.486328125, 98.92578125, 102.365234375, 105.8046875, 109.244140625, 112.68359375, 116.123046875, 119.5625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 10.0, 14.0, 20.0, 30.0, 54.0, 96.0, 113.0, 124.0, 121.0, 126.0, 95.0, 81.0, 52.0, 37.0, 14.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.8125, -13.53778076171875, -13.2630615234375, -12.98834228515625, -12.713623046875, -12.43890380859375, -12.1641845703125, -11.88946533203125, -11.61474609375, -11.34002685546875, -11.0653076171875, -10.79058837890625, -10.515869140625, -10.24114990234375, -9.9664306640625, -9.69171142578125, -9.4169921875, -9.14227294921875, -8.8675537109375, -8.59283447265625, -8.318115234375, -8.04339599609375, -7.7686767578125, -7.49395751953125, -7.21923828125, -6.94451904296875, -6.6697998046875, -6.39508056640625, -6.120361328125, -5.84564208984375, -5.5709228515625, -5.29620361328125, -5.021484375, -4.74676513671875, -4.4720458984375, -4.19732666015625, -3.922607421875, -3.64788818359375, -3.3731689453125, -3.09844970703125, -2.82373046875, -2.54901123046875, -2.2742919921875, -1.99957275390625, -1.724853515625, -1.45013427734375, -1.1754150390625, -0.90069580078125, -0.6259765625, -0.35125732421875, -0.0765380859375, 0.19818115234375, 0.472900390625, 0.74761962890625, 1.0223388671875, 1.29705810546875, 1.57177734375, 1.84649658203125, 2.1212158203125, 2.39593505859375, 2.670654296875, 2.94537353515625, 3.2200927734375, 3.49481201171875, 3.76953125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 14.0, 11.0, 20.0, 27.0, 51.0, 81.0, 133.0, 234.0, 448.0, 792.0, 1547.0, 3252.0, 7497.0, 19305.0, 60427.0, 262051.0, 503816.0, 129967.0, 35976.0, 12751.0, 5194.0, 2460.0, 1160.0, 546.0, 328.0, 176.0, 108.0, 51.0, 41.0, 32.0, 10.0, 11.0, 8.0, 9.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.4375, -43.0166015625, -41.595703125, -40.1748046875, -38.75390625, -37.3330078125, -35.912109375, -34.4912109375, -33.0703125, -31.6494140625, -30.228515625, -28.8076171875, -27.38671875, -25.9658203125, -24.544921875, -23.1240234375, -21.703125, -20.2822265625, -18.861328125, -17.4404296875, -16.01953125, -14.5986328125, -13.177734375, -11.7568359375, -10.3359375, -8.9150390625, -7.494140625, -6.0732421875, -4.65234375, -3.2314453125, -1.810546875, -0.3896484375, 1.03125, 2.4521484375, 3.873046875, 5.2939453125, 6.71484375, 8.1357421875, 9.556640625, 10.9775390625, 12.3984375, 13.8193359375, 15.240234375, 16.6611328125, 18.08203125, 19.5029296875, 20.923828125, 22.3447265625, 23.765625, 25.1865234375, 26.607421875, 28.0283203125, 29.44921875, 30.8701171875, 32.291015625, 33.7119140625, 35.1328125, 36.5537109375, 37.974609375, 39.3955078125, 40.81640625, 42.2373046875, 43.658203125, 45.0791015625, 46.5]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 19.0, 9.0, 21.0, 24.0, 38.0, 29.0, 38.0, 47.0, 44.0, 48.0, 52.0, 48.0, 72.0, 53.0, 55.0, 50.0, 45.0, 61.0, 35.0, 32.0, 35.0, 23.0, 22.0, 22.0, 15.0, 8.0, 8.0, 8.0, 7.0, 4.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.921875, -23.25, -22.578125, -21.90625, -21.234375, -20.5625, -19.890625, -19.21875, -18.546875, -17.875, -17.203125, -16.53125, -15.859375, -15.1875, -14.515625, -13.84375, -13.171875, -12.5, -11.828125, -11.15625, -10.484375, -9.8125, -9.140625, -8.46875, -7.796875, -7.125, -6.453125, -5.78125, -5.109375, -4.4375, -3.765625, -3.09375, -2.421875, -1.75, -1.078125, -0.40625, 0.265625, 0.9375, 1.609375, 2.28125, 2.953125, 3.625, 4.296875, 4.96875, 5.640625, 6.3125, 6.984375, 7.65625, 8.328125, 9.0, 9.671875, 10.34375, 11.015625, 11.6875, 12.359375, 13.03125, 13.703125, 14.375, 15.046875, 15.71875, 16.390625, 17.0625, 17.734375, 18.40625, 19.078125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 12.0, 16.0, 12.0, 22.0, 37.0, 52.0, 63.0, 106.0, 169.0, 228.0, 409.0, 568.0, 977.0, 1706.0, 3320.0, 6286.0, 12852.0, 28253.0, 67327.0, 166395.0, 327169.0, 247656.0, 104060.0, 42785.0, 18903.0, 8772.0, 4510.0, 2382.0, 1391.0, 787.0, 440.0, 277.0, 195.0, 114.0, 99.0, 48.0, 45.0, 27.0, 19.0, 13.0, 14.0, 14.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-28.296875, -27.482421875, -26.66796875, -25.853515625, -25.0390625, -24.224609375, -23.41015625, -22.595703125, -21.78125, -20.966796875, -20.15234375, -19.337890625, -18.5234375, -17.708984375, -16.89453125, -16.080078125, -15.265625, -14.451171875, -13.63671875, -12.822265625, -12.0078125, -11.193359375, -10.37890625, -9.564453125, -8.75, -7.935546875, -7.12109375, -6.306640625, -5.4921875, -4.677734375, -3.86328125, -3.048828125, -2.234375, -1.419921875, -0.60546875, 0.208984375, 1.0234375, 1.837890625, 2.65234375, 3.466796875, 4.28125, 5.095703125, 5.91015625, 6.724609375, 7.5390625, 8.353515625, 9.16796875, 9.982421875, 10.796875, 11.611328125, 12.42578125, 13.240234375, 14.0546875, 14.869140625, 15.68359375, 16.498046875, 17.3125, 18.126953125, 18.94140625, 19.755859375, 20.5703125, 21.384765625, 22.19921875, 23.013671875, 23.828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 13.0, 10.0, 19.0, 18.0, 30.0, 57.0, 62.0, 81.0, 113.0, 101.0, 103.0, 117.0, 62.0, 55.0, 44.0, 21.0, 20.0, 8.0, 4.0, 13.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022125244140625, -0.0021327435970306396, -0.0020529627799987793, -0.001973181962966919, -0.0018934011459350586, -0.0018136203289031982, -0.0017338395118713379, -0.0016540586948394775, -0.0015742778778076172, -0.0014944970607757568, -0.0014147162437438965, -0.0013349354267120361, -0.0012551546096801758, -0.0011753737926483154, -0.001095592975616455, -0.0010158121585845947, -0.0009360313415527344, -0.000856250524520874, -0.0007764697074890137, -0.0006966888904571533, -0.000616908073425293, -0.0005371272563934326, -0.00045734643936157227, -0.0003775656223297119, -0.00029778480529785156, -0.0002180039882659912, -0.00013822317123413086, -5.844235420227051e-05, 2.1338462829589844e-05, 0.0001011192798614502, 0.00018090009689331055, 0.0002606809139251709, 0.00034046173095703125, 0.0004202425479888916, 0.000500023365020752, 0.0005798041820526123, 0.0006595849990844727, 0.000739365816116333, 0.0008191466331481934, 0.0008989274501800537, 0.000978708267211914, 0.0010584890842437744, 0.0011382699012756348, 0.0012180507183074951, 0.0012978315353393555, 0.0013776123523712158, 0.0014573931694030762, 0.0015371739864349365, 0.0016169548034667969, 0.0016967356204986572, 0.0017765164375305176, 0.001856297254562378, 0.0019360780715942383, 0.0020158588886260986, 0.002095639705657959, 0.0021754205226898193, 0.0022552013397216797, 0.00233498215675354, 0.0024147629737854004, 0.0024945437908172607, 0.002574324607849121, 0.0026541054248809814, 0.002733886241912842, 0.002813667058944702, 0.0028934478759765625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 18.0, 18.0, 26.0, 28.0, 32.0, 70.0, 145.0, 188.0, 287.0, 522.0, 984.0, 1990.0, 4013.0, 9315.0, 23482.0, 66652.0, 204381.0, 400655.0, 219737.0, 72051.0, 24893.0, 10016.0, 4440.0, 2083.0, 1018.0, 620.0, 307.0, 189.0, 142.0, 68.0, 47.0, 29.0, 19.0, 18.0, 15.0, 8.0, 6.0, 12.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-33.21875, -32.19775390625, -31.1767578125, -30.15576171875, -29.134765625, -28.11376953125, -27.0927734375, -26.07177734375, -25.05078125, -24.02978515625, -23.0087890625, -21.98779296875, -20.966796875, -19.94580078125, -18.9248046875, -17.90380859375, -16.8828125, -15.86181640625, -14.8408203125, -13.81982421875, -12.798828125, -11.77783203125, -10.7568359375, -9.73583984375, -8.71484375, -7.69384765625, -6.6728515625, -5.65185546875, -4.630859375, -3.60986328125, -2.5888671875, -1.56787109375, -0.546875, 0.47412109375, 1.4951171875, 2.51611328125, 3.537109375, 4.55810546875, 5.5791015625, 6.60009765625, 7.62109375, 8.64208984375, 9.6630859375, 10.68408203125, 11.705078125, 12.72607421875, 13.7470703125, 14.76806640625, 15.7890625, 16.81005859375, 17.8310546875, 18.85205078125, 19.873046875, 20.89404296875, 21.9150390625, 22.93603515625, 23.95703125, 24.97802734375, 25.9990234375, 27.02001953125, 28.041015625, 29.06201171875, 30.0830078125, 31.10400390625, 32.125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 2.0, 8.0, 12.0, 9.0, 16.0, 26.0, 34.0, 23.0, 44.0, 46.0, 51.0, 52.0, 56.0, 67.0, 77.0, 72.0, 88.0, 49.0, 52.0, 39.0, 35.0, 26.0, 20.0, 17.0, 13.0, 15.0, 10.0, 4.0, 8.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.4765625, -13.0728759765625, -12.669189453125, -12.2655029296875, -11.86181640625, -11.4581298828125, -11.054443359375, -10.6507568359375, -10.2470703125, -9.8433837890625, -9.439697265625, -9.0360107421875, -8.63232421875, -8.2286376953125, -7.824951171875, -7.4212646484375, -7.017578125, -6.6138916015625, -6.210205078125, -5.8065185546875, -5.40283203125, -4.9991455078125, -4.595458984375, -4.1917724609375, -3.7880859375, -3.3843994140625, -2.980712890625, -2.5770263671875, -2.17333984375, -1.7696533203125, -1.365966796875, -0.9622802734375, -0.55859375, -0.1549072265625, 0.248779296875, 0.6524658203125, 1.05615234375, 1.4598388671875, 1.863525390625, 2.2672119140625, 2.6708984375, 3.0745849609375, 3.478271484375, 3.8819580078125, 4.28564453125, 4.6893310546875, 5.093017578125, 5.4967041015625, 5.900390625, 6.3040771484375, 6.707763671875, 7.1114501953125, 7.51513671875, 7.9188232421875, 8.322509765625, 8.7261962890625, 9.1298828125, 9.5335693359375, 9.937255859375, 10.3409423828125, 10.74462890625, 11.1483154296875, 11.552001953125, 11.9556884765625, 12.359375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 18.0, 23.0, 30.0, 43.0, 67.0, 110.0, 122.0, 126.0, 118.0, 106.0, 80.0, 38.0, 24.0, 21.0, 20.0, 10.0, 8.0, 7.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-189.30255126953125, -182.3919219970703, -175.48130798339844, -168.5706787109375, -161.66004943847656, -154.74942016601562, -147.83880615234375, -140.9281768798828, -134.01754760742188, -127.10692596435547, -120.19629669189453, -113.28567504882812, -106.37504577636719, -99.46442413330078, -92.55380249023438, -85.64317321777344, -78.73255157470703, -71.82192993164062, -64.91130065917969, -58.00067901611328, -51.090049743652344, -44.17942810058594, -37.268802642822266, -30.358177185058594, -23.447551727294922, -16.53692626953125, -9.626301765441895, -2.715677261352539, 4.194948196411133, 11.105571746826172, 18.016197204589844, 24.926822662353516, 31.837448120117188, 38.74807357788086, 45.65869903564453, 52.56932067871094, 59.479949951171875, 66.39057159423828, 73.30119323730469, 80.21182250976562, 87.12245178222656, 94.03307342529297, 100.9437026977539, 107.85432434082031, 114.76495361328125, 121.67557525634766, 128.58619689941406, 135.496826171875, 142.40744018554688, 149.3180694580078, 156.2286834716797, 163.13931274414062, 170.04994201660156, 176.9605712890625, 183.87118530273438, 190.7818145751953, 197.69244384765625, 204.6030731201172, 211.51368713378906, 218.42431640625, 225.33494567871094, 232.24557495117188, 239.15618896484375, 246.0668182373047, 252.97744750976562]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 7.0, 6.0, 12.0, 8.0, 22.0, 21.0, 30.0, 26.0, 45.0, 51.0, 55.0, 61.0, 70.0, 77.0, 85.0, 49.0, 62.0, 58.0, 59.0, 37.0, 37.0, 32.0, 13.0, 21.0, 15.0, 13.0, 6.0, 9.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-164.29312133789062, -159.32205200195312, -154.35098266601562, -149.37991333007812, -144.40882873535156, -139.43775939941406, -134.46669006347656, -129.49562072753906, -124.52455139160156, -119.55348205566406, -114.58240509033203, -109.61133575439453, -104.64026641845703, -99.669189453125, -94.6981201171875, -89.72705078125, -84.75597381591797, -79.78490447998047, -74.81382751464844, -69.84275817871094, -64.87168884277344, -59.90061569213867, -54.929542541503906, -49.958473205566406, -44.98740005493164, -40.016326904296875, -35.045257568359375, -30.07418441772461, -25.103113174438477, -20.132041931152344, -15.160968780517578, -10.189899444580078, -5.2188262939453125, -0.24775457382202148, 4.7233171463012695, 9.694389343261719, 14.665460586547852, 19.636531829833984, 24.60760498046875, 29.57867431640625, 34.549747467041016, 39.52082061767578, 44.49188995361328, 49.46296310424805, 54.43403625488281, 59.40510559082031, 64.37617492675781, 69.34724426269531, 74.31832122802734, 79.28939056396484, 84.26046752929688, 89.23153686523438, 94.20260620117188, 99.17367553710938, 104.1447525024414, 109.1158218383789, 114.08689880371094, 119.05796813964844, 124.02904510498047, 129.0001220703125, 133.97119140625, 138.9422607421875, 143.913330078125, 148.8843994140625, 153.85546875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 11.0, 12.0, 18.0, 12.0, 22.0, 25.0, 32.0, 57.0, 90.0, 145.0, 298.0, 476.0, 1134.0, 2666.0, 7890.0, 28807.0, 175520.0, 3787183.0, 151580.0, 26788.0, 7202.0, 2429.0, 979.0, 429.0, 224.0, 93.0, 59.0, 38.0, 21.0, 14.0, 12.0, 8.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.875, -211.900390625, -205.92578125, -199.951171875, -193.9765625, -188.001953125, -182.02734375, -176.052734375, -170.078125, -164.103515625, -158.12890625, -152.154296875, -146.1796875, -140.205078125, -134.23046875, -128.255859375, -122.28125, -116.306640625, -110.33203125, -104.357421875, -98.3828125, -92.408203125, -86.43359375, -80.458984375, -74.484375, -68.509765625, -62.53515625, -56.560546875, -50.5859375, -44.611328125, -38.63671875, -32.662109375, -26.6875, -20.712890625, -14.73828125, -8.763671875, -2.7890625, 3.185546875, 9.16015625, 15.134765625, 21.109375, 27.083984375, 33.05859375, 39.033203125, 45.0078125, 50.982421875, 56.95703125, 62.931640625, 68.90625, 74.880859375, 80.85546875, 86.830078125, 92.8046875, 98.779296875, 104.75390625, 110.728515625, 116.703125, 122.677734375, 128.65234375, 134.626953125, 140.6015625, 146.576171875, 152.55078125, 158.525390625, 164.5]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 15.0, 10.0, 22.0, 20.0, 36.0, 41.0, 56.0, 71.0, 95.0, 78.0, 80.0, 72.0, 92.0, 66.0, 66.0, 49.0, 40.0, 35.0, 19.0, 23.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.47119140625, -7.2822265625, -7.09326171875, -6.904296875, -6.71533203125, -6.5263671875, -6.33740234375, -6.1484375, -5.95947265625, -5.7705078125, -5.58154296875, -5.392578125, -5.20361328125, -5.0146484375, -4.82568359375, -4.63671875, -4.44775390625, -4.2587890625, -4.06982421875, -3.880859375, -3.69189453125, -3.5029296875, -3.31396484375, -3.125, -2.93603515625, -2.7470703125, -2.55810546875, -2.369140625, -2.18017578125, -1.9912109375, -1.80224609375, -1.61328125, -1.42431640625, -1.2353515625, -1.04638671875, -0.857421875, -0.66845703125, -0.4794921875, -0.29052734375, -0.1015625, 0.08740234375, 0.2763671875, 0.46533203125, 0.654296875, 0.84326171875, 1.0322265625, 1.22119140625, 1.41015625, 1.59912109375, 1.7880859375, 1.97705078125, 2.166015625, 2.35498046875, 2.5439453125, 2.73291015625, 2.921875, 3.11083984375, 3.2998046875, 3.48876953125, 3.677734375, 3.86669921875, 4.0556640625, 4.24462890625, 4.43359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 7.0, 6.0, 17.0, 17.0, 23.0, 31.0, 35.0, 71.0, 113.0, 244.0, 461.0, 1527.0, 8387.0, 85562.0, 3874086.0, 205582.0, 14554.0, 2261.0, 649.0, 255.0, 141.0, 82.0, 54.0, 29.0, 19.0, 18.0, 17.0, 6.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-382.25, -371.81640625, -361.3828125, -350.94921875, -340.515625, -330.08203125, -319.6484375, -309.21484375, -298.78125, -288.34765625, -277.9140625, -267.48046875, -257.046875, -246.61328125, -236.1796875, -225.74609375, -215.3125, -204.87890625, -194.4453125, -184.01171875, -173.578125, -163.14453125, -152.7109375, -142.27734375, -131.84375, -121.41015625, -110.9765625, -100.54296875, -90.109375, -79.67578125, -69.2421875, -58.80859375, -48.375, -37.94140625, -27.5078125, -17.07421875, -6.640625, 3.79296875, 14.2265625, 24.66015625, 35.09375, 45.52734375, 55.9609375, 66.39453125, 76.828125, 87.26171875, 97.6953125, 108.12890625, 118.5625, 128.99609375, 139.4296875, 149.86328125, 160.296875, 170.73046875, 181.1640625, 191.59765625, 202.03125, 212.46484375, 222.8984375, 233.33203125, 243.765625, 254.19921875, 264.6328125, 275.06640625, 285.5]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 4.0, 7.0, 12.0, 23.0, 22.0, 43.0, 40.0, 65.0, 82.0, 125.0, 181.0, 389.0, 1777.0, 537.0, 243.0, 132.0, 98.0, 62.0, 66.0, 39.0, 28.0, 20.0, 21.0, 10.0, 12.0, 3.0, 8.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.75, -13.192626953125, -12.63525390625, -12.077880859375, -11.5205078125, -10.963134765625, -10.40576171875, -9.848388671875, -9.291015625, -8.733642578125, -8.17626953125, -7.618896484375, -7.0615234375, -6.504150390625, -5.94677734375, -5.389404296875, -4.83203125, -4.274658203125, -3.71728515625, -3.159912109375, -2.6025390625, -2.045166015625, -1.48779296875, -0.930419921875, -0.373046875, 0.184326171875, 0.74169921875, 1.299072265625, 1.8564453125, 2.413818359375, 2.97119140625, 3.528564453125, 4.0859375, 4.643310546875, 5.20068359375, 5.758056640625, 6.3154296875, 6.872802734375, 7.43017578125, 7.987548828125, 8.544921875, 9.102294921875, 9.65966796875, 10.217041015625, 10.7744140625, 11.331787109375, 11.88916015625, 12.446533203125, 13.00390625, 13.561279296875, 14.11865234375, 14.676025390625, 15.2333984375, 15.790771484375, 16.34814453125, 16.905517578125, 17.462890625, 18.020263671875, 18.57763671875, 19.135009765625, 19.6923828125, 20.249755859375, 20.80712890625, 21.364501953125, 21.921875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 17.0, 20.0, 43.0, 57.0, 120.0, 209.0, 216.0, 138.0, 86.0, 39.0, 32.0, 13.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-316.38458251953125, -308.3214416503906, -300.2582702636719, -292.19512939453125, -284.1319580078125, -276.0688171386719, -268.00567626953125, -259.9425048828125, -251.87936401367188, -243.8162078857422, -235.7530517578125, -227.68991088867188, -219.6267547607422, -211.5635986328125, -203.50045776367188, -195.4373016357422, -187.3741455078125, -179.3109893798828, -171.24783325195312, -163.1846923828125, -155.1215362548828, -147.05838012695312, -138.9952392578125, -130.9320831298828, -122.86892700195312, -114.80577087402344, -106.74262237548828, -98.67947387695312, -90.61631774902344, -82.55316162109375, -74.4900131225586, -66.42686462402344, -58.36372375488281, -50.30057144165039, -42.23741912841797, -34.17426681518555, -26.111114501953125, -18.047962188720703, -9.984809875488281, -1.9216575622558594, 6.1414947509765625, 14.204647064208984, 22.267799377441406, 30.330951690673828, 38.39410400390625, 46.45725631713867, 54.520408630371094, 62.583560943603516, 70.64671325683594, 78.70986938476562, 86.77301788330078, 94.83616638183594, 102.89932250976562, 110.96247863769531, 119.02562713623047, 127.08877563476562, 135.1519317626953, 143.215087890625, 151.27822875976562, 159.3413848876953, 167.404541015625, 175.4676971435547, 183.53085327148438, 191.593994140625, 199.6571502685547]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 13.0, 10.0, 15.0, 21.0, 20.0, 35.0, 32.0, 36.0, 39.0, 37.0, 50.0, 63.0, 51.0, 62.0, 44.0, 52.0, 60.0, 58.0, 35.0, 52.0, 42.0, 44.0, 30.0, 22.0, 20.0, 10.0, 9.0, 10.0, 8.0, 7.0, 6.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.41670989990234, -61.7652702331543, -59.113826751708984, -56.46238708496094, -53.810943603515625, -51.15950393676758, -48.50806427001953, -45.85662078857422, -43.20518112182617, -40.553741455078125, -37.90229797363281, -35.250858306884766, -32.59941864013672, -29.947975158691406, -27.29653549194336, -24.64509391784668, -21.99365234375, -19.34221076965332, -16.69076919555664, -14.039329528808594, -11.387887954711914, -8.736446380615234, -6.085005760192871, -3.433565139770508, -0.7821235656738281, 1.8693175315856934, 4.520758628845215, 7.172199726104736, 9.823640823364258, 12.475082397460938, 15.1265230178833, 17.777963638305664, 20.429405212402344, 23.080846786499023, 25.732288360595703, 28.38372802734375, 31.03516960144043, 33.68661117553711, 36.338050842285156, 38.98949432373047, 41.640933990478516, 44.29237365722656, 46.943817138671875, 49.59525680541992, 52.24669647216797, 54.89813995361328, 57.54957962036133, 60.201019287109375, 62.85246276855469, 65.50390625, 68.15534210205078, 70.8067855834961, 73.4582290649414, 76.10966491699219, 78.7611083984375, 81.41255187988281, 84.06399536132812, 86.71543884277344, 89.36687469482422, 92.01831817626953, 94.66976165771484, 97.32119750976562, 99.97264099121094, 102.62408447265625, 105.27552032470703]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 8.0, 12.0, 18.0, 20.0, 25.0, 49.0, 67.0, 114.0, 247.0, 384.0, 831.0, 1915.0, 4795.0, 12682.0, 35827.0, 110398.0, 324619.0, 361004.0, 129366.0, 42233.0, 14370.0, 5396.0, 2165.0, 898.0, 468.0, 242.0, 141.0, 86.0, 57.0, 31.0, 24.0, 15.0, 9.0, 14.0, 9.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.3125, -78.6083984375, -75.904296875, -73.2001953125, -70.49609375, -67.7919921875, -65.087890625, -62.3837890625, -59.6796875, -56.9755859375, -54.271484375, -51.5673828125, -48.86328125, -46.1591796875, -43.455078125, -40.7509765625, -38.046875, -35.3427734375, -32.638671875, -29.9345703125, -27.23046875, -24.5263671875, -21.822265625, -19.1181640625, -16.4140625, -13.7099609375, -11.005859375, -8.3017578125, -5.59765625, -2.8935546875, -0.189453125, 2.5146484375, 5.21875, 7.9228515625, 10.626953125, 13.3310546875, 16.03515625, 18.7392578125, 21.443359375, 24.1474609375, 26.8515625, 29.5556640625, 32.259765625, 34.9638671875, 37.66796875, 40.3720703125, 43.076171875, 45.7802734375, 48.484375, 51.1884765625, 53.892578125, 56.5966796875, 59.30078125, 62.0048828125, 64.708984375, 67.4130859375, 70.1171875, 72.8212890625, 75.525390625, 78.2294921875, 80.93359375, 83.6376953125, 86.341796875, 89.0458984375, 91.75]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 2.0, 9.0, 6.0, 12.0, 9.0, 16.0, 18.0, 20.0, 22.0, 23.0, 22.0, 21.0, 25.0, 25.0, 43.0, 35.0, 48.0, 38.0, 44.0, 50.0, 46.0, 34.0, 47.0, 39.0, 30.0, 30.0, 34.0, 34.0, 34.0, 27.0, 26.0, 12.0, 17.0, 23.0, 19.0, 12.0, 7.0, 10.0, 6.0, 1.0, 4.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.48828125, -3.380340576171875, -3.27239990234375, -3.164459228515625, -3.0565185546875, -2.948577880859375, -2.84063720703125, -2.732696533203125, -2.624755859375, -2.516815185546875, -2.40887451171875, -2.300933837890625, -2.1929931640625, -2.085052490234375, -1.97711181640625, -1.869171142578125, -1.76123046875, -1.653289794921875, -1.54534912109375, -1.437408447265625, -1.3294677734375, -1.221527099609375, -1.11358642578125, -1.005645751953125, -0.897705078125, -0.789764404296875, -0.68182373046875, -0.573883056640625, -0.4659423828125, -0.358001708984375, -0.25006103515625, -0.142120361328125, -0.0341796875, 0.073760986328125, 0.18170166015625, 0.289642333984375, 0.3975830078125, 0.505523681640625, 0.61346435546875, 0.721405029296875, 0.829345703125, 0.937286376953125, 1.04522705078125, 1.153167724609375, 1.2611083984375, 1.369049072265625, 1.47698974609375, 1.584930419921875, 1.69287109375, 1.800811767578125, 1.90875244140625, 2.016693115234375, 2.1246337890625, 2.232574462890625, 2.34051513671875, 2.448455810546875, 2.556396484375, 2.664337158203125, 2.77227783203125, 2.880218505859375, 2.9881591796875, 3.096099853515625, 3.20404052734375, 3.311981201171875, 3.419921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 12.0, 13.0, 22.0, 21.0, 40.0, 47.0, 53.0, 82.0, 95.0, 155.0, 243.0, 393.0, 580.0, 1030.0, 1868.0, 3735.0, 8054.0, 19713.0, 56165.0, 175335.0, 388269.0, 257308.0, 84984.0, 28473.0, 11223.0, 4815.0, 2418.0, 1288.0, 770.0, 413.0, 279.0, 185.0, 137.0, 78.0, 51.0, 59.0, 25.0, 27.0, 24.0, 17.0, 7.0, 11.0, 4.0, 6.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-83.25, -80.7783203125, -78.306640625, -75.8349609375, -73.36328125, -70.8916015625, -68.419921875, -65.9482421875, -63.4765625, -61.0048828125, -58.533203125, -56.0615234375, -53.58984375, -51.1181640625, -48.646484375, -46.1748046875, -43.703125, -41.2314453125, -38.759765625, -36.2880859375, -33.81640625, -31.3447265625, -28.873046875, -26.4013671875, -23.9296875, -21.4580078125, -18.986328125, -16.5146484375, -14.04296875, -11.5712890625, -9.099609375, -6.6279296875, -4.15625, -1.6845703125, 0.787109375, 3.2587890625, 5.73046875, 8.2021484375, 10.673828125, 13.1455078125, 15.6171875, 18.0888671875, 20.560546875, 23.0322265625, 25.50390625, 27.9755859375, 30.447265625, 32.9189453125, 35.390625, 37.8623046875, 40.333984375, 42.8056640625, 45.27734375, 47.7490234375, 50.220703125, 52.6923828125, 55.1640625, 57.6357421875, 60.107421875, 62.5791015625, 65.05078125, 67.5224609375, 69.994140625, 72.4658203125, 74.9375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 10.0, 8.0, 8.0, 10.0, 12.0, 14.0, 19.0, 22.0, 24.0, 36.0, 43.0, 32.0, 47.0, 38.0, 50.0, 43.0, 45.0, 46.0, 50.0, 51.0, 41.0, 43.0, 55.0, 39.0, 35.0, 28.0, 22.0, 28.0, 17.0, 16.0, 12.0, 11.0, 6.0, 5.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.203125, -25.39111328125, -24.5791015625, -23.76708984375, -22.955078125, -22.14306640625, -21.3310546875, -20.51904296875, -19.70703125, -18.89501953125, -18.0830078125, -17.27099609375, -16.458984375, -15.64697265625, -14.8349609375, -14.02294921875, -13.2109375, -12.39892578125, -11.5869140625, -10.77490234375, -9.962890625, -9.15087890625, -8.3388671875, -7.52685546875, -6.71484375, -5.90283203125, -5.0908203125, -4.27880859375, -3.466796875, -2.65478515625, -1.8427734375, -1.03076171875, -0.21875, 0.59326171875, 1.4052734375, 2.21728515625, 3.029296875, 3.84130859375, 4.6533203125, 5.46533203125, 6.27734375, 7.08935546875, 7.9013671875, 8.71337890625, 9.525390625, 10.33740234375, 11.1494140625, 11.96142578125, 12.7734375, 13.58544921875, 14.3974609375, 15.20947265625, 16.021484375, 16.83349609375, 17.6455078125, 18.45751953125, 19.26953125, 20.08154296875, 20.8935546875, 21.70556640625, 22.517578125, 23.32958984375, 24.1416015625, 24.95361328125, 25.765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 14.0, 10.0, 14.0, 28.0, 41.0, 48.0, 99.0, 124.0, 168.0, 287.0, 484.0, 743.0, 1253.0, 2360.0, 4509.0, 9927.0, 25080.0, 75969.0, 250952.0, 410753.0, 177121.0, 53602.0, 18700.0, 7724.0, 3742.0, 1963.0, 1100.0, 596.0, 407.0, 232.0, 159.0, 85.0, 84.0, 38.0, 27.0, 27.0, 18.0, 19.0, 2.0, 8.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.375, -45.81396484375, -44.2529296875, -42.69189453125, -41.130859375, -39.56982421875, -38.0087890625, -36.44775390625, -34.88671875, -33.32568359375, -31.7646484375, -30.20361328125, -28.642578125, -27.08154296875, -25.5205078125, -23.95947265625, -22.3984375, -20.83740234375, -19.2763671875, -17.71533203125, -16.154296875, -14.59326171875, -13.0322265625, -11.47119140625, -9.91015625, -8.34912109375, -6.7880859375, -5.22705078125, -3.666015625, -2.10498046875, -0.5439453125, 1.01708984375, 2.578125, 4.13916015625, 5.7001953125, 7.26123046875, 8.822265625, 10.38330078125, 11.9443359375, 13.50537109375, 15.06640625, 16.62744140625, 18.1884765625, 19.74951171875, 21.310546875, 22.87158203125, 24.4326171875, 25.99365234375, 27.5546875, 29.11572265625, 30.6767578125, 32.23779296875, 33.798828125, 35.35986328125, 36.9208984375, 38.48193359375, 40.04296875, 41.60400390625, 43.1650390625, 44.72607421875, 46.287109375, 47.84814453125, 49.4091796875, 50.97021484375, 52.53125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 13.0, 11.0, 21.0, 27.0, 23.0, 24.0, 23.0, 50.0, 58.0, 65.0, 80.0, 79.0, 70.0, 65.0, 80.0, 56.0, 42.0, 53.0, 27.0, 24.0, 14.0, 14.0, 13.0, 8.0, 7.0, 7.0, 4.0, 6.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004486083984375, -0.004313051700592041, -0.004140019416809082, -0.003966987133026123, -0.003793954849243164, -0.003620922565460205, -0.003447890281677246, -0.003274857997894287, -0.003101825714111328, -0.002928793430328369, -0.00275576114654541, -0.002582728862762451, -0.002409696578979492, -0.002236664295196533, -0.0020636320114135742, -0.0018905997276306152, -0.0017175674438476562, -0.0015445351600646973, -0.0013715028762817383, -0.0011984705924987793, -0.0010254383087158203, -0.0008524060249328613, -0.0006793737411499023, -0.0005063414573669434, -0.0003333091735839844, -0.0001602768898010254, 1.2755393981933594e-05, 0.00018578767776489258, 0.00035881996154785156, 0.0005318522453308105, 0.0007048845291137695, 0.0008779168128967285, 0.0010509490966796875, 0.0012239813804626465, 0.0013970136642456055, 0.0015700459480285645, 0.0017430782318115234, 0.0019161105155944824, 0.0020891427993774414, 0.0022621750831604004, 0.0024352073669433594, 0.0026082396507263184, 0.0027812719345092773, 0.0029543042182922363, 0.0031273365020751953, 0.0033003687858581543, 0.0034734010696411133, 0.0036464333534240723, 0.0038194656372070312, 0.00399249792098999, 0.004165530204772949, 0.004338562488555908, 0.004511594772338867, 0.004684627056121826, 0.004857659339904785, 0.005030691623687744, 0.005203723907470703, 0.005376756191253662, 0.005549788475036621, 0.00572282075881958, 0.005895853042602539, 0.006068885326385498, 0.006241917610168457, 0.006414949893951416, 0.006587982177734375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 15.0, 14.0, 25.0, 40.0, 75.0, 88.0, 158.0, 249.0, 427.0, 744.0, 1331.0, 2837.0, 6596.0, 19086.0, 74046.0, 357691.0, 445870.0, 99796.0, 24600.0, 8070.0, 3276.0, 1473.0, 794.0, 444.0, 271.0, 172.0, 107.0, 67.0, 51.0, 31.0, 24.0, 13.0, 9.0, 15.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-71.9375, -69.6962890625, -67.455078125, -65.2138671875, -62.97265625, -60.7314453125, -58.490234375, -56.2490234375, -54.0078125, -51.7666015625, -49.525390625, -47.2841796875, -45.04296875, -42.8017578125, -40.560546875, -38.3193359375, -36.078125, -33.8369140625, -31.595703125, -29.3544921875, -27.11328125, -24.8720703125, -22.630859375, -20.3896484375, -18.1484375, -15.9072265625, -13.666015625, -11.4248046875, -9.18359375, -6.9423828125, -4.701171875, -2.4599609375, -0.21875, 2.0224609375, 4.263671875, 6.5048828125, 8.74609375, 10.9873046875, 13.228515625, 15.4697265625, 17.7109375, 19.9521484375, 22.193359375, 24.4345703125, 26.67578125, 28.9169921875, 31.158203125, 33.3994140625, 35.640625, 37.8818359375, 40.123046875, 42.3642578125, 44.60546875, 46.8466796875, 49.087890625, 51.3291015625, 53.5703125, 55.8115234375, 58.052734375, 60.2939453125, 62.53515625, 64.7763671875, 67.017578125, 69.2587890625, 71.5]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 7.0, 12.0, 16.0, 19.0, 16.0, 26.0, 38.0, 38.0, 42.0, 62.0, 77.0, 77.0, 62.0, 70.0, 65.0, 65.0, 48.0, 37.0, 37.0, 43.0, 30.0, 22.0, 16.0, 15.0, 13.0, 8.0, 9.0, 4.0, 5.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.494873046875, -22.66162109375, -21.828369140625, -20.9951171875, -20.161865234375, -19.32861328125, -18.495361328125, -17.662109375, -16.828857421875, -15.99560546875, -15.162353515625, -14.3291015625, -13.495849609375, -12.66259765625, -11.829345703125, -10.99609375, -10.162841796875, -9.32958984375, -8.496337890625, -7.6630859375, -6.829833984375, -5.99658203125, -5.163330078125, -4.330078125, -3.496826171875, -2.66357421875, -1.830322265625, -0.9970703125, -0.163818359375, 0.66943359375, 1.502685546875, 2.3359375, 3.169189453125, 4.00244140625, 4.835693359375, 5.6689453125, 6.502197265625, 7.33544921875, 8.168701171875, 9.001953125, 9.835205078125, 10.66845703125, 11.501708984375, 12.3349609375, 13.168212890625, 14.00146484375, 14.834716796875, 15.66796875, 16.501220703125, 17.33447265625, 18.167724609375, 19.0009765625, 19.834228515625, 20.66748046875, 21.500732421875, 22.333984375, 23.167236328125, 24.00048828125, 24.833740234375, 25.6669921875, 26.500244140625, 27.33349609375, 28.166748046875, 29.0]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 16.0, 32.0, 105.0, 214.0, 301.0, 193.0, 79.0, 33.0, 13.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1470.41015625, -1432.190673828125, -1393.97119140625, -1355.751708984375, -1317.5322265625, -1279.312744140625, -1241.09326171875, -1202.873779296875, -1164.654296875, -1126.434814453125, -1088.21533203125, -1049.995849609375, -1011.7763671875, -973.556884765625, -935.33740234375, -897.117919921875, -858.8983764648438, -820.6788940429688, -782.4594116210938, -744.2399291992188, -706.0204467773438, -667.8009643554688, -629.5814208984375, -591.3619384765625, -553.1424560546875, -514.9229736328125, -476.7034912109375, -438.4840087890625, -400.2645263671875, -362.0450439453125, -323.8255310058594, -285.6060485839844, -247.38665771484375, -209.16717529296875, -170.94769287109375, -132.7281951904297, -94.50871276855469, -56.28923034667969, -18.069732666015625, 20.149749755859375, 58.369232177734375, 96.58871459960938, 134.80819702148438, 173.02769470214844, 211.24717712402344, 249.46665954589844, 287.6861572265625, 325.9056396484375, 364.1251220703125, 402.3446044921875, 440.5640869140625, 478.7835693359375, 517.0030517578125, 555.2225341796875, 593.4420166015625, 631.6614990234375, 669.8809814453125, 708.1004638671875, 746.3199462890625, 784.5394287109375, 822.7589111328125, 860.9783935546875, 899.1978759765625, 937.4173583984375, 975.6369018554688]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 6.0, 4.0, 10.0, 7.0, 18.0, 20.0, 26.0, 25.0, 25.0, 32.0, 31.0, 42.0, 52.0, 59.0, 62.0, 53.0, 48.0, 45.0, 71.0, 44.0, 40.0, 44.0, 30.0, 23.0, 24.0, 29.0, 29.0, 23.0, 23.0, 12.0, 12.0, 7.0, 4.0, 3.0, 6.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-203.62213134765625, -196.8587646484375, -190.0954132080078, -183.33204650878906, -176.5686798095703, -169.80532836914062, -163.04196166992188, -156.27859497070312, -149.51522827148438, -142.75186157226562, -135.98851013183594, -129.2251434326172, -122.46177673339844, -115.69841766357422, -108.93505859375, -102.17169189453125, -95.40834045410156, -88.64498138427734, -81.8816146850586, -75.11825561523438, -68.35488891601562, -61.591529846191406, -54.82817077636719, -48.0648078918457, -41.30144500732422, -34.538082122802734, -27.774721145629883, -21.01136016845703, -14.247997283935547, -7.4846343994140625, -0.7212753295898438, 6.042087554931641, 12.805450439453125, 19.56881332397461, 26.33217430114746, 33.09553527832031, 39.8588981628418, 46.62226104736328, 53.3856201171875, 60.148983001708984, 66.91234588623047, 73.67570495605469, 80.43907165527344, 87.20243072509766, 93.96578979492188, 100.72915649414062, 107.49251556396484, 114.25587463378906, 121.01924133300781, 127.78260040283203, 134.54595947265625, 141.309326171875, 148.07269287109375, 154.8360595703125, 161.5994110107422, 168.36277770996094, 175.12612915039062, 181.88949584960938, 188.65284729003906, 195.4162139892578, 202.17958068847656, 208.94293212890625, 215.706298828125, 222.46966552734375, 229.2330322265625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 10.0, 15.0, 28.0, 43.0, 60.0, 124.0, 235.0, 485.0, 1254.0, 4032.0, 17650.0, 118734.0, 3780884.0, 234246.0, 27670.0, 5799.0, 1662.0, 650.0, 291.0, 136.0, 83.0, 60.0, 37.0, 27.0, 20.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.0, -290.3671875, -281.734375, -273.1015625, -264.46875, -255.8359375, -247.203125, -238.5703125, -229.9375, -221.3046875, -212.671875, -204.0390625, -195.40625, -186.7734375, -178.140625, -169.5078125, -160.875, -152.2421875, -143.609375, -134.9765625, -126.34375, -117.7109375, -109.078125, -100.4453125, -91.8125, -83.1796875, -74.546875, -65.9140625, -57.28125, -48.6484375, -40.015625, -31.3828125, -22.75, -14.1171875, -5.484375, 3.1484375, 11.78125, 20.4140625, 29.046875, 37.6796875, 46.3125, 54.9453125, 63.578125, 72.2109375, 80.84375, 89.4765625, 98.109375, 106.7421875, 115.375, 124.0078125, 132.640625, 141.2734375, 149.90625, 158.5390625, 167.171875, 175.8046875, 184.4375, 193.0703125, 201.703125, 210.3359375, 218.96875, 227.6015625, 236.234375, 244.8671875, 253.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 11.0, 17.0, 20.0, 20.0, 41.0, 32.0, 43.0, 48.0, 59.0, 63.0, 69.0, 68.0, 84.0, 67.0, 56.0, 56.0, 65.0, 34.0, 30.0, 34.0, 20.0, 16.0, 5.0, 11.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.118896484375, -7.87841796875, -7.637939453125, -7.3974609375, -7.156982421875, -6.91650390625, -6.676025390625, -6.435546875, -6.195068359375, -5.95458984375, -5.714111328125, -5.4736328125, -5.233154296875, -4.99267578125, -4.752197265625, -4.51171875, -4.271240234375, -4.03076171875, -3.790283203125, -3.5498046875, -3.309326171875, -3.06884765625, -2.828369140625, -2.587890625, -2.347412109375, -2.10693359375, -1.866455078125, -1.6259765625, -1.385498046875, -1.14501953125, -0.904541015625, -0.6640625, -0.423583984375, -0.18310546875, 0.057373046875, 0.2978515625, 0.538330078125, 0.77880859375, 1.019287109375, 1.259765625, 1.500244140625, 1.74072265625, 1.981201171875, 2.2216796875, 2.462158203125, 2.70263671875, 2.943115234375, 3.18359375, 3.424072265625, 3.66455078125, 3.905029296875, 4.1455078125, 4.385986328125, 4.62646484375, 4.866943359375, 5.107421875, 5.347900390625, 5.58837890625, 5.828857421875, 6.0693359375, 6.309814453125, 6.55029296875, 6.790771484375, 7.03125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 4.0, 13.0, 11.0, 23.0, 34.0, 41.0, 43.0, 53.0, 63.0, 141.0, 1038.0, 46760.0, 4092839.0, 51779.0, 1032.0, 140.0, 59.0, 50.0, 38.0, 30.0, 19.0, 20.0, 21.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-646.0, -625.5, -605.0, -584.5, -564.0, -543.5, -523.0, -502.5, -482.0, -461.5, -441.0, -420.5, -400.0, -379.5, -359.0, -338.5, -318.0, -297.5, -277.0, -256.5, -236.0, -215.5, -195.0, -174.5, -154.0, -133.5, -113.0, -92.5, -72.0, -51.5, -31.0, -10.5, 10.0, 30.5, 51.0, 71.5, 92.0, 112.5, 133.0, 153.5, 174.0, 194.5, 215.0, 235.5, 256.0, 276.5, 297.0, 317.5, 338.0, 358.5, 379.0, 399.5, 420.0, 440.5, 461.0, 481.5, 502.0, 522.5, 543.0, 563.5, 584.0, 604.5, 625.0, 645.5, 666.0]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 11.0, 14.0, 19.0, 53.0, 80.0, 133.0, 202.0, 442.0, 2026.0, 544.0, 251.0, 121.0, 77.0, 47.0, 31.0, 7.0, 12.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-68.1875, -66.8408203125, -65.494140625, -64.1474609375, -62.80078125, -61.4541015625, -60.107421875, -58.7607421875, -57.4140625, -56.0673828125, -54.720703125, -53.3740234375, -52.02734375, -50.6806640625, -49.333984375, -47.9873046875, -46.640625, -45.2939453125, -43.947265625, -42.6005859375, -41.25390625, -39.9072265625, -38.560546875, -37.2138671875, -35.8671875, -34.5205078125, -33.173828125, -31.8271484375, -30.48046875, -29.1337890625, -27.787109375, -26.4404296875, -25.09375, -23.7470703125, -22.400390625, -21.0537109375, -19.70703125, -18.3603515625, -17.013671875, -15.6669921875, -14.3203125, -12.9736328125, -11.626953125, -10.2802734375, -8.93359375, -7.5869140625, -6.240234375, -4.8935546875, -3.546875, -2.2001953125, -0.853515625, 0.4931640625, 1.83984375, 3.1865234375, 4.533203125, 5.8798828125, 7.2265625, 8.5732421875, 9.919921875, 11.2666015625, 12.61328125, 13.9599609375, 15.306640625, 16.6533203125, 18.0]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 2.0, 8.0, 14.0, 16.0, 30.0, 36.0, 59.0, 128.0, 166.0, 155.0, 135.0, 113.0, 56.0, 35.0, 20.0, 15.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.4701232910156, -302.81158447265625, -293.1530456542969, -283.4945068359375, -273.83599853515625, -264.1774597167969, -254.5189208984375, -244.86038208007812, -235.20184326171875, -225.54330444335938, -215.884765625, -206.2262420654297, -196.5677032470703, -186.90916442871094, -177.25064086914062, -167.59210205078125, -157.93356323242188, -148.2750244140625, -138.61648559570312, -128.9579620361328, -119.29942321777344, -109.64088439941406, -99.98235321044922, -90.32382202148438, -80.665283203125, -71.00674438476562, -61.34821319580078, -51.68967819213867, -42.03114318847656, -32.37260818481445, -22.714073181152344, -13.0555419921875, -3.39697265625, 6.261562347412109, 15.920097351074219, 25.578632354736328, 35.23716735839844, 44.89570236206055, 54.554237365722656, 64.2127685546875, 73.87130737304688, 83.52984619140625, 93.1883773803711, 102.84690856933594, 112.50544738769531, 122.16398620605469, 131.822509765625, 141.48104858398438, 151.13958740234375, 160.79812622070312, 170.4566650390625, 180.1151885986328, 189.7737274169922, 199.43226623535156, 209.09078979492188, 218.74932861328125, 228.40786743164062, 238.06640625, 247.72494506835938, 257.38348388671875, 267.0419921875, 276.7005310058594, 286.35906982421875, 296.0176086425781, 305.6761474609375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 8.0, 9.0, 18.0, 19.0, 21.0, 15.0, 19.0, 28.0, 32.0, 32.0, 38.0, 26.0, 39.0, 49.0, 41.0, 39.0, 36.0, 56.0, 41.0, 51.0, 44.0, 38.0, 37.0, 36.0, 34.0, 23.0, 19.0, 31.0, 19.0, 19.0, 12.0, 8.0, 9.0, 11.0, 7.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.92109680175781, -91.05319213867188, -88.1852798461914, -85.31737518310547, -82.44947052001953, -79.58155822753906, -76.71365356445312, -73.84574890136719, -70.97783660888672, -68.10993194580078, -65.24201965332031, -62.374114990234375, -59.50620651245117, -56.63829803466797, -53.77039337158203, -50.90248489379883, -48.03458023071289, -45.16667175292969, -42.29876708984375, -39.43085861206055, -36.562950134277344, -33.695045471191406, -30.827136993408203, -27.959228515625, -25.09132194519043, -22.22341537475586, -19.355506896972656, -16.487600326538086, -13.6196928024292, -10.751785278320312, -7.883878707885742, -5.015970230102539, -2.1480636596679688, 0.7198436260223389, 3.5877509117126465, 6.455657958984375, 9.323565483093262, 12.191473007202148, 15.059379577636719, 17.927288055419922, 20.795194625854492, 23.663101196289062, 26.531009674072266, 29.398916244506836, 32.266822814941406, 35.13473129272461, 38.00263977050781, 40.87054443359375, 43.73845291137695, 46.606361389160156, 49.474266052246094, 52.3421745300293, 55.2100830078125, 58.07798767089844, 60.94589614868164, 63.813804626464844, 66.68170928955078, 69.54961395263672, 72.41752624511719, 75.28543090820312, 78.15333557128906, 81.02124786376953, 83.88915252685547, 86.75706481933594, 89.62496948242188]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 7.0, 4.0, 12.0, 8.0, 13.0, 10.0, 21.0, 31.0, 32.0, 35.0, 51.0, 43.0, 59.0, 117.0, 169.0, 208.0, 393.0, 562.0, 1005.0, 2185.0, 5319.0, 15819.0, 51559.0, 172017.0, 395784.0, 272897.0, 88400.0, 26555.0, 8553.0, 3206.0, 1394.0, 705.0, 402.0, 269.0, 217.0, 118.0, 101.0, 65.0, 32.0, 38.0, 14.0, 27.0, 16.0, 19.0, 14.0, 10.0, 14.0, 2.0, 6.0, 8.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-93.0, -89.97265625, -86.9453125, -83.91796875, -80.890625, -77.86328125, -74.8359375, -71.80859375, -68.78125, -65.75390625, -62.7265625, -59.69921875, -56.671875, -53.64453125, -50.6171875, -47.58984375, -44.5625, -41.53515625, -38.5078125, -35.48046875, -32.453125, -29.42578125, -26.3984375, -23.37109375, -20.34375, -17.31640625, -14.2890625, -11.26171875, -8.234375, -5.20703125, -2.1796875, 0.84765625, 3.875, 6.90234375, 9.9296875, 12.95703125, 15.984375, 19.01171875, 22.0390625, 25.06640625, 28.09375, 31.12109375, 34.1484375, 37.17578125, 40.203125, 43.23046875, 46.2578125, 49.28515625, 52.3125, 55.33984375, 58.3671875, 61.39453125, 64.421875, 67.44921875, 70.4765625, 73.50390625, 76.53125, 79.55859375, 82.5859375, 85.61328125, 88.640625, 91.66796875, 94.6953125, 97.72265625, 100.75]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 22.0, 15.0, 20.0, 40.0, 40.0, 53.0, 62.0, 73.0, 81.0, 81.0, 84.0, 57.0, 62.0, 61.0, 51.0, 54.0, 38.0, 24.0, 25.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.4453125, -10.16302490234375, -9.8807373046875, -9.59844970703125, -9.316162109375, -9.03387451171875, -8.7515869140625, -8.46929931640625, -8.18701171875, -7.90472412109375, -7.6224365234375, -7.34014892578125, -7.057861328125, -6.77557373046875, -6.4932861328125, -6.21099853515625, -5.9287109375, -5.64642333984375, -5.3641357421875, -5.08184814453125, -4.799560546875, -4.51727294921875, -4.2349853515625, -3.95269775390625, -3.67041015625, -3.38812255859375, -3.1058349609375, -2.82354736328125, -2.541259765625, -2.25897216796875, -1.9766845703125, -1.69439697265625, -1.412109375, -1.12982177734375, -0.8475341796875, -0.56524658203125, -0.282958984375, -0.00067138671875, 0.2816162109375, 0.56390380859375, 0.84619140625, 1.12847900390625, 1.4107666015625, 1.69305419921875, 1.975341796875, 2.25762939453125, 2.5399169921875, 2.82220458984375, 3.1044921875, 3.38677978515625, 3.6690673828125, 3.95135498046875, 4.233642578125, 4.51593017578125, 4.7982177734375, 5.08050537109375, 5.36279296875, 5.64508056640625, 5.9273681640625, 6.20965576171875, 6.491943359375, 6.77423095703125, 7.0565185546875, 7.33880615234375, 7.62109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 9.0, 12.0, 14.0, 10.0, 15.0, 24.0, 44.0, 51.0, 66.0, 94.0, 121.0, 184.0, 280.0, 394.0, 706.0, 1229.0, 2109.0, 4405.0, 10240.0, 28022.0, 89022.0, 280058.0, 395228.0, 158831.0, 47895.0, 15910.0, 6498.0, 3015.0, 1549.0, 884.0, 531.0, 327.0, 219.0, 158.0, 116.0, 75.0, 45.0, 43.0, 29.0, 22.0, 19.0, 14.0, 13.0, 8.0, 10.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.8125, -79.0146484375, -76.216796875, -73.4189453125, -70.62109375, -67.8232421875, -65.025390625, -62.2275390625, -59.4296875, -56.6318359375, -53.833984375, -51.0361328125, -48.23828125, -45.4404296875, -42.642578125, -39.8447265625, -37.046875, -34.2490234375, -31.451171875, -28.6533203125, -25.85546875, -23.0576171875, -20.259765625, -17.4619140625, -14.6640625, -11.8662109375, -9.068359375, -6.2705078125, -3.47265625, -0.6748046875, 2.123046875, 4.9208984375, 7.71875, 10.5166015625, 13.314453125, 16.1123046875, 18.91015625, 21.7080078125, 24.505859375, 27.3037109375, 30.1015625, 32.8994140625, 35.697265625, 38.4951171875, 41.29296875, 44.0908203125, 46.888671875, 49.6865234375, 52.484375, 55.2822265625, 58.080078125, 60.8779296875, 63.67578125, 66.4736328125, 69.271484375, 72.0693359375, 74.8671875, 77.6650390625, 80.462890625, 83.2607421875, 86.05859375, 88.8564453125, 91.654296875, 94.4521484375, 97.25]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 8.0, 4.0, 9.0, 18.0, 15.0, 20.0, 21.0, 29.0, 40.0, 37.0, 42.0, 48.0, 49.0, 46.0, 46.0, 44.0, 53.0, 55.0, 58.0, 56.0, 50.0, 44.0, 41.0, 22.0, 30.0, 20.0, 15.0, 12.0, 14.0, 18.0, 9.0, 7.0, 11.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.3125, -43.98583984375, -42.6591796875, -41.33251953125, -40.005859375, -38.67919921875, -37.3525390625, -36.02587890625, -34.69921875, -33.37255859375, -32.0458984375, -30.71923828125, -29.392578125, -28.06591796875, -26.7392578125, -25.41259765625, -24.0859375, -22.75927734375, -21.4326171875, -20.10595703125, -18.779296875, -17.45263671875, -16.1259765625, -14.79931640625, -13.47265625, -12.14599609375, -10.8193359375, -9.49267578125, -8.166015625, -6.83935546875, -5.5126953125, -4.18603515625, -2.859375, -1.53271484375, -0.2060546875, 1.12060546875, 2.447265625, 3.77392578125, 5.1005859375, 6.42724609375, 7.75390625, 9.08056640625, 10.4072265625, 11.73388671875, 13.060546875, 14.38720703125, 15.7138671875, 17.04052734375, 18.3671875, 19.69384765625, 21.0205078125, 22.34716796875, 23.673828125, 25.00048828125, 26.3271484375, 27.65380859375, 28.98046875, 30.30712890625, 31.6337890625, 32.96044921875, 34.287109375, 35.61376953125, 36.9404296875, 38.26708984375, 39.59375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 11.0, 9.0, 10.0, 23.0, 27.0, 65.0, 60.0, 107.0, 174.0, 334.0, 505.0, 1033.0, 2116.0, 4920.0, 13181.0, 47280.0, 246643.0, 542931.0, 142172.0, 30163.0, 9360.0, 3635.0, 1735.0, 837.0, 440.0, 289.0, 169.0, 113.0, 71.0, 41.0, 33.0, 12.0, 11.0, 11.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.5, -59.330078125, -57.16015625, -54.990234375, -52.8203125, -50.650390625, -48.48046875, -46.310546875, -44.140625, -41.970703125, -39.80078125, -37.630859375, -35.4609375, -33.291015625, -31.12109375, -28.951171875, -26.78125, -24.611328125, -22.44140625, -20.271484375, -18.1015625, -15.931640625, -13.76171875, -11.591796875, -9.421875, -7.251953125, -5.08203125, -2.912109375, -0.7421875, 1.427734375, 3.59765625, 5.767578125, 7.9375, 10.107421875, 12.27734375, 14.447265625, 16.6171875, 18.787109375, 20.95703125, 23.126953125, 25.296875, 27.466796875, 29.63671875, 31.806640625, 33.9765625, 36.146484375, 38.31640625, 40.486328125, 42.65625, 44.826171875, 46.99609375, 49.166015625, 51.3359375, 53.505859375, 55.67578125, 57.845703125, 60.015625, 62.185546875, 64.35546875, 66.525390625, 68.6953125, 70.865234375, 73.03515625, 75.205078125, 77.375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 3.0, 2.0, 12.0, 6.0, 11.0, 24.0, 18.0, 30.0, 31.0, 46.0, 45.0, 68.0, 91.0, 82.0, 88.0, 94.0, 79.0, 61.0, 46.0, 39.0, 30.0, 19.0, 19.0, 13.0, 7.0, 5.0, 9.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.007282257080078125, -0.007073700428009033, -0.006865143775939941, -0.00665658712387085, -0.006448030471801758, -0.006239473819732666, -0.006030917167663574, -0.005822360515594482, -0.005613803863525391, -0.005405247211456299, -0.005196690559387207, -0.004988133907318115, -0.0047795772552490234, -0.004571020603179932, -0.00436246395111084, -0.004153907299041748, -0.003945350646972656, -0.0037367939949035645, -0.0035282373428344727, -0.003319680690765381, -0.003111124038696289, -0.0029025673866271973, -0.0026940107345581055, -0.0024854540824890137, -0.002276897430419922, -0.00206834077835083, -0.0018597841262817383, -0.0016512274742126465, -0.0014426708221435547, -0.0012341141700744629, -0.001025557518005371, -0.0008170008659362793, -0.0006084442138671875, -0.0003998875617980957, -0.0001913309097290039, 1.722574234008789e-05, 0.0002257823944091797, 0.0004343390464782715, 0.0006428956985473633, 0.0008514523506164551, 0.0010600090026855469, 0.0012685656547546387, 0.0014771223068237305, 0.0016856789588928223, 0.001894235610961914, 0.002102792263031006, 0.0023113489151000977, 0.0025199055671691895, 0.0027284622192382812, 0.002937018871307373, 0.003145575523376465, 0.0033541321754455566, 0.0035626888275146484, 0.0037712454795837402, 0.003979802131652832, 0.004188358783721924, 0.004396915435791016, 0.004605472087860107, 0.004814028739929199, 0.005022585391998291, 0.005231142044067383, 0.005439698696136475, 0.005648255348205566, 0.005856812000274658, 0.00606536865234375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 12.0, 15.0, 13.0, 30.0, 33.0, 58.0, 59.0, 108.0, 141.0, 263.0, 464.0, 823.0, 1778.0, 3951.0, 10939.0, 45178.0, 407615.0, 500281.0, 55592.0, 12545.0, 4438.0, 1928.0, 905.0, 508.0, 284.0, 188.0, 112.0, 92.0, 55.0, 35.0, 20.0, 12.0, 12.0, 10.0, 8.0, 7.0, 8.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-100.625, -97.384765625, -94.14453125, -90.904296875, -87.6640625, -84.423828125, -81.18359375, -77.943359375, -74.703125, -71.462890625, -68.22265625, -64.982421875, -61.7421875, -58.501953125, -55.26171875, -52.021484375, -48.78125, -45.541015625, -42.30078125, -39.060546875, -35.8203125, -32.580078125, -29.33984375, -26.099609375, -22.859375, -19.619140625, -16.37890625, -13.138671875, -9.8984375, -6.658203125, -3.41796875, -0.177734375, 3.0625, 6.302734375, 9.54296875, 12.783203125, 16.0234375, 19.263671875, 22.50390625, 25.744140625, 28.984375, 32.224609375, 35.46484375, 38.705078125, 41.9453125, 45.185546875, 48.42578125, 51.666015625, 54.90625, 58.146484375, 61.38671875, 64.626953125, 67.8671875, 71.107421875, 74.34765625, 77.587890625, 80.828125, 84.068359375, 87.30859375, 90.548828125, 93.7890625, 97.029296875, 100.26953125, 103.509765625, 106.75]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 7.0, 8.0, 15.0, 16.0, 26.0, 29.0, 40.0, 49.0, 76.0, 81.0, 75.0, 88.0, 89.0, 65.0, 66.0, 49.0, 40.0, 29.0, 29.0, 26.0, 9.0, 11.0, 6.0, 6.0, 13.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.0625, -30.890625, -29.71875, -28.546875, -27.375, -26.203125, -25.03125, -23.859375, -22.6875, -21.515625, -20.34375, -19.171875, -18.0, -16.828125, -15.65625, -14.484375, -13.3125, -12.140625, -10.96875, -9.796875, -8.625, -7.453125, -6.28125, -5.109375, -3.9375, -2.765625, -1.59375, -0.421875, 0.75, 1.921875, 3.09375, 4.265625, 5.4375, 6.609375, 7.78125, 8.953125, 10.125, 11.296875, 12.46875, 13.640625, 14.8125, 15.984375, 17.15625, 18.328125, 19.5, 20.671875, 21.84375, 23.015625, 24.1875, 25.359375, 26.53125, 27.703125, 28.875, 30.046875, 31.21875, 32.390625, 33.5625, 34.734375, 35.90625, 37.078125, 38.25, 39.421875, 40.59375, 41.765625, 42.9375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 18.0, 31.0, 58.0, 93.0, 150.0, 174.0, 159.0, 111.0, 70.0, 40.0, 30.0, 21.0, 11.0, 2.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-744.619873046875, -722.4520263671875, -700.2841796875, -678.1163330078125, -655.9485473632812, -633.7807006835938, -611.6128540039062, -589.4450073242188, -567.2772216796875, -545.109375, -522.9415283203125, -500.7737121582031, -478.60589599609375, -456.43804931640625, -434.27020263671875, -412.10235595703125, -389.93450927734375, -367.76666259765625, -345.5988464355469, -323.4309997558594, -301.26318359375, -279.0953369140625, -256.927490234375, -234.75965881347656, -212.59182739257812, -190.4239959716797, -168.25616455078125, -146.08831787109375, -123.92048645019531, -101.75265502929688, -79.58480834960938, -57.41697692871094, -35.2491455078125, -13.081310272216797, 9.086524963378906, 31.254364013671875, 53.42219543457031, 75.59002685546875, 97.75787353515625, 119.92570495605469, 142.09353637695312, 164.26136779785156, 186.42919921875, 208.5970458984375, 230.76487731933594, 252.93270874023438, 275.1005554199219, 297.26837158203125, 319.43621826171875, 341.60406494140625, 363.7718811035156, 385.9397277832031, 408.1075439453125, 430.275390625, 452.4432373046875, 474.611083984375, 496.7789001464844, 518.9467163085938, 541.1145629882812, 563.2824096679688, 585.4502563476562, 607.6180419921875, 629.785888671875, 651.9537353515625, 674.12158203125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 8.0, 6.0, 6.0, 5.0, 15.0, 13.0, 14.0, 16.0, 11.0, 23.0, 28.0, 27.0, 32.0, 28.0, 33.0, 40.0, 36.0, 50.0, 27.0, 42.0, 51.0, 41.0, 60.0, 41.0, 34.0, 32.0, 32.0, 34.0, 36.0, 21.0, 22.0, 19.0, 18.0, 23.0, 14.0, 10.0, 11.0, 7.0, 5.0, 3.0, 6.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-232.5243682861328, -225.1221466064453, -217.71990966796875, -210.31768798828125, -202.91546630859375, -195.5132293701172, -188.1110076904297, -180.70877075195312, -173.30654907226562, -165.90432739257812, -158.50209045410156, -151.09986877441406, -143.69764709472656, -136.29541015625, -128.8931884765625, -121.49095916748047, -114.08873748779297, -106.68650817871094, -99.28428649902344, -91.8820571899414, -84.47982788085938, -77.07760620117188, -69.67537689208984, -62.27314758300781, -54.87092208862305, -47.46869659423828, -40.06646728515625, -32.664241790771484, -25.262014389038086, -17.859786987304688, -10.457561492919922, -3.0553321838378906, 4.346893310546875, 11.749120712280273, 19.151348114013672, 26.553573608398438, 33.95580291748047, 41.358028411865234, 48.76025390625, 56.16248321533203, 63.5647087097168, 70.96693420410156, 78.3691635131836, 85.77139282226562, 93.17361450195312, 100.57584381103516, 107.97807312011719, 115.38029479980469, 122.78252410888672, 130.18475341796875, 137.58697509765625, 144.98919677734375, 152.3914337158203, 159.7936553955078, 167.19589233398438, 174.59811401367188, 182.00033569335938, 189.40255737304688, 196.80479431152344, 204.20701599121094, 211.60923767089844, 219.011474609375, 226.4136962890625, 233.81591796875, 241.21815490722656]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 9.0, 13.0, 20.0, 21.0, 33.0, 40.0, 66.0, 74.0, 130.0, 214.0, 391.0, 745.0, 1764.0, 5203.0, 18679.0, 92572.0, 3562875.0, 444953.0, 48180.0, 11725.0, 3655.0, 1389.0, 637.0, 318.0, 193.0, 120.0, 84.0, 65.0, 25.0, 21.0, 20.0, 11.0, 8.0, 6.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.875, -146.4140625, -140.953125, -135.4921875, -130.03125, -124.5703125, -119.109375, -113.6484375, -108.1875, -102.7265625, -97.265625, -91.8046875, -86.34375, -80.8828125, -75.421875, -69.9609375, -64.5, -59.0390625, -53.578125, -48.1171875, -42.65625, -37.1953125, -31.734375, -26.2734375, -20.8125, -15.3515625, -9.890625, -4.4296875, 1.03125, 6.4921875, 11.953125, 17.4140625, 22.875, 28.3359375, 33.796875, 39.2578125, 44.71875, 50.1796875, 55.640625, 61.1015625, 66.5625, 72.0234375, 77.484375, 82.9453125, 88.40625, 93.8671875, 99.328125, 104.7890625, 110.25, 115.7109375, 121.171875, 126.6328125, 132.09375, 137.5546875, 143.015625, 148.4765625, 153.9375, 159.3984375, 164.859375, 170.3203125, 175.78125, 181.2421875, 186.703125, 192.1640625, 197.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 11.0, 8.0, 22.0, 19.0, 28.0, 25.0, 29.0, 31.0, 47.0, 58.0, 63.0, 56.0, 63.0, 49.0, 59.0, 59.0, 52.0, 39.0, 44.0, 39.0, 41.0, 40.0, 18.0, 17.0, 21.0, 12.0, 14.0, 10.0, 8.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51953125, -6.25701904296875, -5.9945068359375, -5.73199462890625, -5.469482421875, -5.20697021484375, -4.9444580078125, -4.68194580078125, -4.41943359375, -4.15692138671875, -3.8944091796875, -3.63189697265625, -3.369384765625, -3.10687255859375, -2.8443603515625, -2.58184814453125, -2.3193359375, -2.05682373046875, -1.7943115234375, -1.53179931640625, -1.269287109375, -1.00677490234375, -0.7442626953125, -0.48175048828125, -0.21923828125, 0.04327392578125, 0.3057861328125, 0.56829833984375, 0.830810546875, 1.09332275390625, 1.3558349609375, 1.61834716796875, 1.880859375, 2.14337158203125, 2.4058837890625, 2.66839599609375, 2.930908203125, 3.19342041015625, 3.4559326171875, 3.71844482421875, 3.98095703125, 4.24346923828125, 4.5059814453125, 4.76849365234375, 5.031005859375, 5.29351806640625, 5.5560302734375, 5.81854248046875, 6.0810546875, 6.34356689453125, 6.6060791015625, 6.86859130859375, 7.131103515625, 7.39361572265625, 7.6561279296875, 7.91864013671875, 8.18115234375, 8.44366455078125, 8.7061767578125, 8.96868896484375, 9.231201171875, 9.49371337890625, 9.7562255859375, 10.01873779296875, 10.28125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 14.0, 22.0, 28.0, 45.0, 92.0, 155.0, 295.0, 605.0, 1322.0, 3476.0, 12025.0, 54005.0, 409514.0, 3497753.0, 173002.0, 30179.0, 7385.0, 2396.0, 888.0, 443.0, 234.0, 165.0, 93.0, 54.0, 25.0, 21.0, 12.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-178.25, -173.056640625, -167.86328125, -162.669921875, -157.4765625, -152.283203125, -147.08984375, -141.896484375, -136.703125, -131.509765625, -126.31640625, -121.123046875, -115.9296875, -110.736328125, -105.54296875, -100.349609375, -95.15625, -89.962890625, -84.76953125, -79.576171875, -74.3828125, -69.189453125, -63.99609375, -58.802734375, -53.609375, -48.416015625, -43.22265625, -38.029296875, -32.8359375, -27.642578125, -22.44921875, -17.255859375, -12.0625, -6.869140625, -1.67578125, 3.517578125, 8.7109375, 13.904296875, 19.09765625, 24.291015625, 29.484375, 34.677734375, 39.87109375, 45.064453125, 50.2578125, 55.451171875, 60.64453125, 65.837890625, 71.03125, 76.224609375, 81.41796875, 86.611328125, 91.8046875, 96.998046875, 102.19140625, 107.384765625, 112.578125, 117.771484375, 122.96484375, 128.158203125, 133.3515625, 138.544921875, 143.73828125, 148.931640625, 154.125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 9.0, 14.0, 15.0, 20.0, 13.0, 26.0, 32.0, 43.0, 53.0, 72.0, 71.0, 104.0, 199.0, 301.0, 631.0, 1336.0, 371.0, 206.0, 130.0, 96.0, 67.0, 49.0, 29.0, 31.0, 25.0, 27.0, 12.0, 14.0, 12.0, 12.0, 7.0, 10.0, 7.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.4794921875, -18.833984375, -18.1884765625, -17.54296875, -16.8974609375, -16.251953125, -15.6064453125, -14.9609375, -14.3154296875, -13.669921875, -13.0244140625, -12.37890625, -11.7333984375, -11.087890625, -10.4423828125, -9.796875, -9.1513671875, -8.505859375, -7.8603515625, -7.21484375, -6.5693359375, -5.923828125, -5.2783203125, -4.6328125, -3.9873046875, -3.341796875, -2.6962890625, -2.05078125, -1.4052734375, -0.759765625, -0.1142578125, 0.53125, 1.1767578125, 1.822265625, 2.4677734375, 3.11328125, 3.7587890625, 4.404296875, 5.0498046875, 5.6953125, 6.3408203125, 6.986328125, 7.6318359375, 8.27734375, 8.9228515625, 9.568359375, 10.2138671875, 10.859375, 11.5048828125, 12.150390625, 12.7958984375, 13.44140625, 14.0869140625, 14.732421875, 15.3779296875, 16.0234375, 16.6689453125, 17.314453125, 17.9599609375, 18.60546875, 19.2509765625, 19.896484375, 20.5419921875, 21.1875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 7.0, 11.0, 21.0, 31.0, 71.0, 141.0, 169.0, 203.0, 155.0, 105.0, 40.0, 31.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-408.87091064453125, -399.2136535644531, -389.556396484375, -379.8991394042969, -370.24188232421875, -360.5846252441406, -350.9273681640625, -341.27008056640625, -331.61285400390625, -321.9555969238281, -312.29833984375, -302.6410827636719, -292.98382568359375, -283.3265686035156, -273.6693115234375, -264.01202392578125, -254.35476684570312, -244.697509765625, -235.04025268554688, -225.38299560546875, -215.72573852539062, -206.0684814453125, -196.4112091064453, -186.7539520263672, -177.09669494628906, -167.43943786621094, -157.7821807861328, -148.1249237060547, -138.4676513671875, -128.81039428710938, -119.15313720703125, -109.49588012695312, -99.83863830566406, -90.18138122558594, -80.52412414550781, -70.86685943603516, -61.20960235595703, -51.552345275878906, -41.895084381103516, -32.237823486328125, -22.58056640625, -12.923307418823242, -3.2660484313964844, 6.391210556030273, 16.04846954345703, 25.705726623535156, 35.36298751831055, 45.02024841308594, 54.67750549316406, 64.33476257324219, 73.99201965332031, 83.64928436279297, 93.3065414428711, 102.96379852294922, 112.62106323242188, 122.2783203125, 131.93557739257812, 141.59283447265625, 151.25009155273438, 160.9073486328125, 170.56460571289062, 180.22186279296875, 189.87913513183594, 199.53639221191406, 209.1936492919922]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 12.0, 14.0, 19.0, 21.0, 28.0, 24.0, 32.0, 28.0, 36.0, 39.0, 44.0, 32.0, 46.0, 51.0, 62.0, 46.0, 53.0, 44.0, 55.0, 39.0, 40.0, 32.0, 34.0, 24.0, 25.0, 32.0, 19.0, 10.0, 9.0, 6.0, 5.0, 8.0, 5.0, 5.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.48548126220703, -94.37825012207031, -91.27101135253906, -88.16378021240234, -85.05654907226562, -81.9493179321289, -78.84207916259766, -75.73484802246094, -72.62761688232422, -69.5203857421875, -66.41314697265625, -63.30591583251953, -60.19868469238281, -57.09144973754883, -53.984214782714844, -50.876983642578125, -47.76974868774414, -44.662513732910156, -41.55528259277344, -38.44804763793945, -35.340816497802734, -32.23358154296875, -29.1263484954834, -26.019115447998047, -22.911882400512695, -19.804649353027344, -16.697416305541992, -13.590182304382324, -10.482949256896973, -7.375716209411621, -4.268482208251953, -1.1612491607666016, 1.94598388671875, 5.053216934204102, 8.160449981689453, 11.267683982849121, 14.374917030334473, 17.48215103149414, 20.589384078979492, 23.696617126464844, 26.803850173950195, 29.911083221435547, 33.01831817626953, 36.12554931640625, 39.232784271240234, 42.34001541137695, 45.44725036621094, 48.554481506347656, 51.66171646118164, 54.768951416015625, 57.876182556152344, 60.98341751098633, 64.09065246582031, 67.19788360595703, 70.30511474609375, 73.412353515625, 76.51958465576172, 79.62681579589844, 82.73405456542969, 85.8412857055664, 88.94851684570312, 92.05574798583984, 95.1629867553711, 98.27021789550781, 101.37744903564453]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 9.0, 7.0, 12.0, 24.0, 29.0, 36.0, 44.0, 80.0, 97.0, 187.0, 370.0, 729.0, 1826.0, 5809.0, 23604.0, 112616.0, 442906.0, 355471.0, 79904.0, 17403.0, 4425.0, 1475.0, 637.0, 339.0, 142.0, 107.0, 72.0, 49.0, 30.0, 33.0, 19.0, 17.0, 9.0, 10.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-106.5, -103.052734375, -99.60546875, -96.158203125, -92.7109375, -89.263671875, -85.81640625, -82.369140625, -78.921875, -75.474609375, -72.02734375, -68.580078125, -65.1328125, -61.685546875, -58.23828125, -54.791015625, -51.34375, -47.896484375, -44.44921875, -41.001953125, -37.5546875, -34.107421875, -30.66015625, -27.212890625, -23.765625, -20.318359375, -16.87109375, -13.423828125, -9.9765625, -6.529296875, -3.08203125, 0.365234375, 3.8125, 7.259765625, 10.70703125, 14.154296875, 17.6015625, 21.048828125, 24.49609375, 27.943359375, 31.390625, 34.837890625, 38.28515625, 41.732421875, 45.1796875, 48.626953125, 52.07421875, 55.521484375, 58.96875, 62.416015625, 65.86328125, 69.310546875, 72.7578125, 76.205078125, 79.65234375, 83.099609375, 86.546875, 89.994140625, 93.44140625, 96.888671875, 100.3359375, 103.783203125, 107.23046875, 110.677734375, 114.125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 9.0, 18.0, 20.0, 24.0, 29.0, 27.0, 49.0, 62.0, 61.0, 57.0, 79.0, 75.0, 62.0, 70.0, 53.0, 41.0, 48.0, 43.0, 38.0, 28.0, 24.0, 25.0, 9.0, 12.0, 12.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.3404541015625, -6.024658203125, -5.7088623046875, -5.39306640625, -5.0772705078125, -4.761474609375, -4.4456787109375, -4.1298828125, -3.8140869140625, -3.498291015625, -3.1824951171875, -2.86669921875, -2.5509033203125, -2.235107421875, -1.9193115234375, -1.603515625, -1.2877197265625, -0.971923828125, -0.6561279296875, -0.34033203125, -0.0245361328125, 0.291259765625, 0.6070556640625, 0.9228515625, 1.2386474609375, 1.554443359375, 1.8702392578125, 2.18603515625, 2.5018310546875, 2.817626953125, 3.1334228515625, 3.44921875, 3.7650146484375, 4.080810546875, 4.3966064453125, 4.71240234375, 5.0281982421875, 5.343994140625, 5.6597900390625, 5.9755859375, 6.2913818359375, 6.607177734375, 6.9229736328125, 7.23876953125, 7.5545654296875, 7.870361328125, 8.1861572265625, 8.501953125, 8.8177490234375, 9.133544921875, 9.4493408203125, 9.76513671875, 10.0809326171875, 10.396728515625, 10.7125244140625, 11.0283203125, 11.3441162109375, 11.659912109375, 11.9757080078125, 12.29150390625, 12.6072998046875, 12.923095703125, 13.2388916015625, 13.5546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 7.0, 12.0, 17.0, 20.0, 26.0, 32.0, 39.0, 52.0, 95.0, 97.0, 166.0, 214.0, 282.0, 432.0, 722.0, 1126.0, 1977.0, 3682.0, 7771.0, 18165.0, 46038.0, 120128.0, 275163.0, 315712.0, 153348.0, 60382.0, 22889.0, 9415.0, 4556.0, 2261.0, 1253.0, 781.0, 504.0, 362.0, 256.0, 152.0, 115.0, 84.0, 53.0, 45.0, 41.0, 25.0, 16.0, 16.0, 9.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.0, -55.1083984375, -53.216796875, -51.3251953125, -49.43359375, -47.5419921875, -45.650390625, -43.7587890625, -41.8671875, -39.9755859375, -38.083984375, -36.1923828125, -34.30078125, -32.4091796875, -30.517578125, -28.6259765625, -26.734375, -24.8427734375, -22.951171875, -21.0595703125, -19.16796875, -17.2763671875, -15.384765625, -13.4931640625, -11.6015625, -9.7099609375, -7.818359375, -5.9267578125, -4.03515625, -2.1435546875, -0.251953125, 1.6396484375, 3.53125, 5.4228515625, 7.314453125, 9.2060546875, 11.09765625, 12.9892578125, 14.880859375, 16.7724609375, 18.6640625, 20.5556640625, 22.447265625, 24.3388671875, 26.23046875, 28.1220703125, 30.013671875, 31.9052734375, 33.796875, 35.6884765625, 37.580078125, 39.4716796875, 41.36328125, 43.2548828125, 45.146484375, 47.0380859375, 48.9296875, 50.8212890625, 52.712890625, 54.6044921875, 56.49609375, 58.3876953125, 60.279296875, 62.1708984375, 64.0625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 4.0, 9.0, 12.0, 11.0, 16.0, 14.0, 25.0, 24.0, 36.0, 27.0, 29.0, 27.0, 29.0, 38.0, 37.0, 34.0, 46.0, 42.0, 45.0, 33.0, 45.0, 36.0, 52.0, 50.0, 33.0, 31.0, 26.0, 22.0, 25.0, 24.0, 22.0, 16.0, 8.0, 19.0, 13.0, 10.0, 9.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.53125, -34.4462890625, -33.361328125, -32.2763671875, -31.19140625, -30.1064453125, -29.021484375, -27.9365234375, -26.8515625, -25.7666015625, -24.681640625, -23.5966796875, -22.51171875, -21.4267578125, -20.341796875, -19.2568359375, -18.171875, -17.0869140625, -16.001953125, -14.9169921875, -13.83203125, -12.7470703125, -11.662109375, -10.5771484375, -9.4921875, -8.4072265625, -7.322265625, -6.2373046875, -5.15234375, -4.0673828125, -2.982421875, -1.8974609375, -0.8125, 0.2724609375, 1.357421875, 2.4423828125, 3.52734375, 4.6123046875, 5.697265625, 6.7822265625, 7.8671875, 8.9521484375, 10.037109375, 11.1220703125, 12.20703125, 13.2919921875, 14.376953125, 15.4619140625, 16.546875, 17.6318359375, 18.716796875, 19.8017578125, 20.88671875, 21.9716796875, 23.056640625, 24.1416015625, 25.2265625, 26.3115234375, 27.396484375, 28.4814453125, 29.56640625, 30.6513671875, 31.736328125, 32.8212890625, 33.90625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 5.0, 8.0, 10.0, 14.0, 23.0, 35.0, 26.0, 78.0, 90.0, 140.0, 255.0, 429.0, 736.0, 1453.0, 3241.0, 8216.0, 24285.0, 87013.0, 360229.0, 412861.0, 104176.0, 28494.0, 9488.0, 3588.0, 1627.0, 813.0, 440.0, 260.0, 170.0, 112.0, 73.0, 40.0, 31.0, 31.0, 20.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.11328125, -33.9453125, -32.77734375, -31.609375, -30.44140625, -29.2734375, -28.10546875, -26.9375, -25.76953125, -24.6015625, -23.43359375, -22.265625, -21.09765625, -19.9296875, -18.76171875, -17.59375, -16.42578125, -15.2578125, -14.08984375, -12.921875, -11.75390625, -10.5859375, -9.41796875, -8.25, -7.08203125, -5.9140625, -4.74609375, -3.578125, -2.41015625, -1.2421875, -0.07421875, 1.09375, 2.26171875, 3.4296875, 4.59765625, 5.765625, 6.93359375, 8.1015625, 9.26953125, 10.4375, 11.60546875, 12.7734375, 13.94140625, 15.109375, 16.27734375, 17.4453125, 18.61328125, 19.78125, 20.94921875, 22.1171875, 23.28515625, 24.453125, 25.62109375, 26.7890625, 27.95703125, 29.125, 30.29296875, 31.4609375, 32.62890625, 33.796875, 34.96484375, 36.1328125, 37.30078125, 38.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 5.0, 6.0, 9.0, 13.0, 19.0, 25.0, 57.0, 63.0, 94.0, 112.0, 121.0, 128.0, 84.0, 73.0, 53.0, 35.0, 28.0, 20.0, 10.0, 13.0, 10.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00714111328125, -0.006935596466064453, -0.006730079650878906, -0.006524562835693359, -0.0063190460205078125, -0.006113529205322266, -0.005908012390136719, -0.005702495574951172, -0.005496978759765625, -0.005291461944580078, -0.005085945129394531, -0.004880428314208984, -0.0046749114990234375, -0.004469394683837891, -0.004263877868652344, -0.004058361053466797, -0.00385284423828125, -0.003647327423095703, -0.0034418106079101562, -0.0032362937927246094, -0.0030307769775390625, -0.0028252601623535156, -0.0026197433471679688, -0.002414226531982422, -0.002208709716796875, -0.002003192901611328, -0.0017976760864257812, -0.0015921592712402344, -0.0013866424560546875, -0.0011811256408691406, -0.0009756088256835938, -0.0007700920104980469, -0.0005645751953125, -0.0003590583801269531, -0.00015354156494140625, 5.1975250244140625e-05, 0.0002574920654296875, 0.0004630088806152344, 0.0006685256958007812, 0.0008740425109863281, 0.001079559326171875, 0.0012850761413574219, 0.0014905929565429688, 0.0016961097717285156, 0.0019016265869140625, 0.0021071434020996094, 0.0023126602172851562, 0.002518177032470703, 0.00272369384765625, 0.002929210662841797, 0.0031347274780273438, 0.0033402442932128906, 0.0035457611083984375, 0.0037512779235839844, 0.003956794738769531, 0.004162311553955078, 0.004367828369140625, 0.004573345184326172, 0.004778861999511719, 0.004984378814697266, 0.0051898956298828125, 0.005395412445068359, 0.005600929260253906, 0.005806446075439453, 0.006011962890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 14.0, 10.0, 25.0, 24.0, 44.0, 63.0, 96.0, 146.0, 264.0, 449.0, 741.0, 1500.0, 3378.0, 8956.0, 31288.0, 157999.0, 603846.0, 186862.0, 35584.0, 10026.0, 3606.0, 1626.0, 820.0, 451.0, 267.0, 145.0, 84.0, 60.0, 43.0, 36.0, 22.0, 15.0, 15.0, 9.0, 9.0, 0.0, 6.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.03125, -51.49609375, -49.9609375, -48.42578125, -46.890625, -45.35546875, -43.8203125, -42.28515625, -40.75, -39.21484375, -37.6796875, -36.14453125, -34.609375, -33.07421875, -31.5390625, -30.00390625, -28.46875, -26.93359375, -25.3984375, -23.86328125, -22.328125, -20.79296875, -19.2578125, -17.72265625, -16.1875, -14.65234375, -13.1171875, -11.58203125, -10.046875, -8.51171875, -6.9765625, -5.44140625, -3.90625, -2.37109375, -0.8359375, 0.69921875, 2.234375, 3.76953125, 5.3046875, 6.83984375, 8.375, 9.91015625, 11.4453125, 12.98046875, 14.515625, 16.05078125, 17.5859375, 19.12109375, 20.65625, 22.19140625, 23.7265625, 25.26171875, 26.796875, 28.33203125, 29.8671875, 31.40234375, 32.9375, 34.47265625, 36.0078125, 37.54296875, 39.078125, 40.61328125, 42.1484375, 43.68359375, 45.21875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 10.0, 8.0, 14.0, 7.0, 14.0, 27.0, 23.0, 30.0, 35.0, 56.0, 54.0, 70.0, 73.0, 93.0, 82.0, 93.0, 53.0, 57.0, 44.0, 24.0, 21.0, 16.0, 13.0, 13.0, 16.0, 7.0, 10.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.265625, -18.54248046875, -17.8193359375, -17.09619140625, -16.373046875, -15.64990234375, -14.9267578125, -14.20361328125, -13.48046875, -12.75732421875, -12.0341796875, -11.31103515625, -10.587890625, -9.86474609375, -9.1416015625, -8.41845703125, -7.6953125, -6.97216796875, -6.2490234375, -5.52587890625, -4.802734375, -4.07958984375, -3.3564453125, -2.63330078125, -1.91015625, -1.18701171875, -0.4638671875, 0.25927734375, 0.982421875, 1.70556640625, 2.4287109375, 3.15185546875, 3.875, 4.59814453125, 5.3212890625, 6.04443359375, 6.767578125, 7.49072265625, 8.2138671875, 8.93701171875, 9.66015625, 10.38330078125, 11.1064453125, 11.82958984375, 12.552734375, 13.27587890625, 13.9990234375, 14.72216796875, 15.4453125, 16.16845703125, 16.8916015625, 17.61474609375, 18.337890625, 19.06103515625, 19.7841796875, 20.50732421875, 21.23046875, 21.95361328125, 22.6767578125, 23.39990234375, 24.123046875, 24.84619140625, 25.5693359375, 26.29248046875, 27.015625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 13.0, 14.0, 32.0, 53.0, 120.0, 183.0, 194.0, 172.0, 104.0, 61.0, 28.0, 16.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-304.243896484375, -281.3418273925781, -258.4397277832031, -235.53765869140625, -212.63558959960938, -189.73350524902344, -166.8314208984375, -143.92935180664062, -121.02726745605469, -98.12519073486328, -75.22311401367188, -52.32102966308594, -29.41895294189453, -6.516876220703125, 16.385208129882812, 39.28727722167969, 62.189361572265625, 85.09143829345703, 107.99351501464844, 130.89559936523438, 153.79766845703125, 176.6997528076172, 199.60183715820312, 222.50390625, 245.40599060058594, 268.3080749511719, 291.21014404296875, 314.11224365234375, 337.0143127441406, 359.9163818359375, 382.8184814453125, 405.72052001953125, 428.62261962890625, 451.5246887207031, 474.4267883300781, 497.328857421875, 520.23095703125, 543.1329956054688, 566.0350952148438, 588.9371337890625, 611.8392333984375, 634.7413330078125, 657.6433715820312, 680.5454711914062, 703.4475708007812, 726.349609375, 749.251708984375, 772.15380859375, 795.055908203125, 817.9580078125, 840.8600463867188, 863.7621459960938, 886.6642456054688, 909.5662841796875, 932.4683837890625, 955.3704833984375, 978.2725219726562, 1001.1746215820312, 1024.07666015625, 1046.978759765625, 1069.880859375, 1092.782958984375, 1115.68505859375, 1138.5870361328125, 1161.4891357421875]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 12.0, 15.0, 13.0, 12.0, 17.0, 14.0, 23.0, 25.0, 24.0, 42.0, 29.0, 39.0, 43.0, 53.0, 45.0, 64.0, 55.0, 65.0, 49.0, 46.0, 33.0, 42.0, 48.0, 29.0, 29.0, 25.0, 26.0, 12.0, 18.0, 8.0, 8.0, 11.0, 10.0, 0.0, 2.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-292.1956787109375, -284.10540771484375, -276.0151062011719, -267.9248352050781, -259.83453369140625, -251.74424743652344, -243.65396118164062, -235.56369018554688, -227.473388671875, -219.3831024169922, -211.29281616210938, -203.20252990722656, -195.11224365234375, -187.02195739746094, -178.93167114257812, -170.84140014648438, -162.75111389160156, -154.66082763671875, -146.57054138183594, -138.48025512695312, -130.3899688720703, -122.2996826171875, -114.20940399169922, -106.1191177368164, -98.0288314819336, -89.93854522705078, -81.84825897216797, -73.75798034667969, -65.66769409179688, -57.5774040222168, -49.48712158203125, -41.39683532714844, -33.306549072265625, -25.216262817382812, -17.125978469848633, -9.035694122314453, -0.9454078674316406, 7.144878387451172, 15.235160827636719, 23.32544708251953, 31.415733337402344, 39.506019592285156, 47.59630584716797, 55.686588287353516, 63.77687454223633, 71.86715698242188, 79.95744323730469, 88.0477294921875, 96.13801574707031, 104.22830200195312, 112.31858825683594, 120.40887451171875, 128.49916076660156, 136.58944702148438, 144.67971801757812, 152.77001953125, 160.86029052734375, 168.95057678222656, 177.04086303710938, 185.1311492919922, 193.221435546875, 201.3117218017578, 209.40200805664062, 217.49227905273438, 225.58258056640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 11.0, 12.0, 18.0, 33.0, 40.0, 62.0, 92.0, 172.0, 260.0, 509.0, 1203.0, 2976.0, 8841.0, 34060.0, 246768.0, 3776784.0, 93582.0, 19125.0, 5749.0, 2061.0, 880.0, 385.0, 242.0, 147.0, 75.0, 65.0, 36.0, 23.0, 14.0, 15.0, 11.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-153.625, -149.7158203125, -145.806640625, -141.8974609375, -137.98828125, -134.0791015625, -130.169921875, -126.2607421875, -122.3515625, -118.4423828125, -114.533203125, -110.6240234375, -106.71484375, -102.8056640625, -98.896484375, -94.9873046875, -91.078125, -87.1689453125, -83.259765625, -79.3505859375, -75.44140625, -71.5322265625, -67.623046875, -63.7138671875, -59.8046875, -55.8955078125, -51.986328125, -48.0771484375, -44.16796875, -40.2587890625, -36.349609375, -32.4404296875, -28.53125, -24.6220703125, -20.712890625, -16.8037109375, -12.89453125, -8.9853515625, -5.076171875, -1.1669921875, 2.7421875, 6.6513671875, 10.560546875, 14.4697265625, 18.37890625, 22.2880859375, 26.197265625, 30.1064453125, 34.015625, 37.9248046875, 41.833984375, 45.7431640625, 49.65234375, 53.5615234375, 57.470703125, 61.3798828125, 65.2890625, 69.1982421875, 73.107421875, 77.0166015625, 80.92578125, 84.8349609375, 88.744140625, 92.6533203125, 96.5625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 10.0, 8.0, 9.0, 22.0, 27.0, 31.0, 35.0, 45.0, 57.0, 43.0, 73.0, 62.0, 71.0, 80.0, 76.0, 59.0, 49.0, 53.0, 48.0, 34.0, 23.0, 24.0, 18.0, 10.0, 9.0, 8.0, 8.0, 9.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.52911376953125, -6.1871337890625, -5.84515380859375, -5.503173828125, -5.16119384765625, -4.8192138671875, -4.47723388671875, -4.13525390625, -3.79327392578125, -3.4512939453125, -3.10931396484375, -2.767333984375, -2.42535400390625, -2.0833740234375, -1.74139404296875, -1.3994140625, -1.05743408203125, -0.7154541015625, -0.37347412109375, -0.031494140625, 0.31048583984375, 0.6524658203125, 0.99444580078125, 1.33642578125, 1.67840576171875, 2.0203857421875, 2.36236572265625, 2.704345703125, 3.04632568359375, 3.3883056640625, 3.73028564453125, 4.072265625, 4.41424560546875, 4.7562255859375, 5.09820556640625, 5.440185546875, 5.78216552734375, 6.1241455078125, 6.46612548828125, 6.80810546875, 7.15008544921875, 7.4920654296875, 7.83404541015625, 8.176025390625, 8.51800537109375, 8.8599853515625, 9.20196533203125, 9.5439453125, 9.88592529296875, 10.2279052734375, 10.56988525390625, 10.911865234375, 11.25384521484375, 11.5958251953125, 11.93780517578125, 12.27978515625, 12.62176513671875, 12.9637451171875, 13.30572509765625, 13.647705078125, 13.98968505859375, 14.3316650390625, 14.67364501953125, 15.015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 10.0, 16.0, 23.0, 29.0, 49.0, 72.0, 166.0, 321.0, 850.0, 2653.0, 11243.0, 66159.0, 3414334.0, 645085.0, 42444.0, 7654.0, 2003.0, 636.0, 258.0, 107.0, 65.0, 39.0, 27.0, 9.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.0, -179.01171875, -174.0234375, -169.03515625, -164.046875, -159.05859375, -154.0703125, -149.08203125, -144.09375, -139.10546875, -134.1171875, -129.12890625, -124.140625, -119.15234375, -114.1640625, -109.17578125, -104.1875, -99.19921875, -94.2109375, -89.22265625, -84.234375, -79.24609375, -74.2578125, -69.26953125, -64.28125, -59.29296875, -54.3046875, -49.31640625, -44.328125, -39.33984375, -34.3515625, -29.36328125, -24.375, -19.38671875, -14.3984375, -9.41015625, -4.421875, 0.56640625, 5.5546875, 10.54296875, 15.53125, 20.51953125, 25.5078125, 30.49609375, 35.484375, 40.47265625, 45.4609375, 50.44921875, 55.4375, 60.42578125, 65.4140625, 70.40234375, 75.390625, 80.37890625, 85.3671875, 90.35546875, 95.34375, 100.33203125, 105.3203125, 110.30859375, 115.296875, 120.28515625, 125.2734375, 130.26171875, 135.25]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 13.0, 13.0, 29.0, 35.0, 36.0, 79.0, 137.0, 355.0, 2153.0, 684.0, 204.0, 120.0, 92.0, 40.0, 25.0, 16.0, 17.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.6875, -47.623291015625, -46.55908203125, -45.494873046875, -44.4306640625, -43.366455078125, -42.30224609375, -41.238037109375, -40.173828125, -39.109619140625, -38.04541015625, -36.981201171875, -35.9169921875, -34.852783203125, -33.78857421875, -32.724365234375, -31.66015625, -30.595947265625, -29.53173828125, -28.467529296875, -27.4033203125, -26.339111328125, -25.27490234375, -24.210693359375, -23.146484375, -22.082275390625, -21.01806640625, -19.953857421875, -18.8896484375, -17.825439453125, -16.76123046875, -15.697021484375, -14.6328125, -13.568603515625, -12.50439453125, -11.440185546875, -10.3759765625, -9.311767578125, -8.24755859375, -7.183349609375, -6.119140625, -5.054931640625, -3.99072265625, -2.926513671875, -1.8623046875, -0.798095703125, 0.26611328125, 1.330322265625, 2.39453125, 3.458740234375, 4.52294921875, 5.587158203125, 6.6513671875, 7.715576171875, 8.77978515625, 9.843994140625, 10.908203125, 11.972412109375, 13.03662109375, 14.100830078125, 15.1650390625, 16.229248046875, 17.29345703125, 18.357666015625, 19.421875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 4.0, 6.0, 7.0, 17.0, 26.0, 32.0, 56.0, 70.0, 114.0, 151.0, 136.0, 135.0, 97.0, 53.0, 30.0, 18.0, 17.0, 10.0, 9.0, 1.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-214.3878936767578, -209.1502685546875, -203.91262817382812, -198.6750030517578, -193.4373779296875, -188.1997528076172, -182.96212768554688, -177.7244873046875, -172.4868621826172, -167.24923706054688, -162.0115966796875, -156.7739715576172, -151.53634643554688, -146.29872131347656, -141.06109619140625, -135.82345581054688, -130.58583068847656, -125.34820556640625, -120.1105728149414, -114.87294006347656, -109.63531494140625, -104.39768981933594, -99.1600570678711, -93.92242431640625, -88.68479919433594, -83.44717407226562, -78.20954132080078, -72.97190856933594, -67.73428344726562, -62.49665451049805, -57.25902557373047, -52.02139663696289, -46.78375244140625, -41.54612350463867, -36.308494567871094, -31.070865631103516, -25.833236694335938, -20.59560775756836, -15.357978820800781, -10.120349884033203, -4.882720947265625, 0.3549079895019531, 5.592536926269531, 10.83016586303711, 16.067794799804688, 21.305423736572266, 26.543052673339844, 31.780681610107422, 37.018310546875, 42.25593948364258, 47.493568420410156, 52.731197357177734, 57.96882629394531, 63.20645523071289, 68.44408416748047, 73.68171691894531, 78.91934204101562, 84.15696716308594, 89.39459991455078, 94.63223266601562, 99.86985778808594, 105.10748291015625, 110.3451156616211, 115.58274841308594, 120.82037353515625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 4.0, 12.0, 6.0, 10.0, 10.0, 18.0, 22.0, 20.0, 27.0, 28.0, 32.0, 47.0, 34.0, 51.0, 51.0, 41.0, 45.0, 52.0, 44.0, 60.0, 42.0, 46.0, 26.0, 27.0, 38.0, 33.0, 34.0, 19.0, 27.0, 19.0, 17.0, 7.0, 13.0, 12.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-84.69847106933594, -82.26068878173828, -79.82290649414062, -77.38512420654297, -74.94734191894531, -72.50955963134766, -70.07177734375, -67.63398742675781, -65.19621276855469, -62.75843048095703, -60.320648193359375, -57.88286590576172, -55.44508361816406, -53.007301330566406, -50.569515228271484, -48.13173294067383, -45.693946838378906, -43.25616455078125, -40.818382263183594, -38.38059997558594, -35.94281768798828, -33.505035400390625, -31.067249298095703, -28.629467010498047, -26.19168472290039, -23.753902435302734, -21.316120147705078, -18.87833595275879, -16.440553665161133, -14.002771377563477, -11.564988136291504, -9.127204895019531, -6.689422607421875, -4.2516398429870605, -1.813857078552246, 0.6239256858825684, 3.061708450317383, 5.499490737915039, 7.937273979187012, 10.375057220458984, 12.81283950805664, 15.250621795654297, 17.688404083251953, 20.126188278198242, 22.5639705657959, 25.001752853393555, 27.439537048339844, 29.8773193359375, 32.315101623535156, 34.75288391113281, 37.19066619873047, 39.628448486328125, 42.06623077392578, 44.50401306152344, 46.94179916381836, 49.379581451416016, 51.81736373901367, 54.25514602661133, 56.692928314208984, 59.13071060180664, 61.56849670410156, 64.00627899169922, 66.44406127929688, 68.88184356689453, 71.31962585449219]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 7.0, 6.0, 11.0, 11.0, 21.0, 24.0, 32.0, 34.0, 61.0, 83.0, 137.0, 249.0, 334.0, 656.0, 1348.0, 2852.0, 6764.0, 19141.0, 61319.0, 209655.0, 439890.0, 212006.0, 61926.0, 19262.0, 6763.0, 2827.0, 1355.0, 669.0, 387.0, 237.0, 155.0, 88.0, 65.0, 40.0, 35.0, 18.0, 24.0, 14.0, 12.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.6875, -76.0205078125, -73.353515625, -70.6865234375, -68.01953125, -65.3525390625, -62.685546875, -60.0185546875, -57.3515625, -54.6845703125, -52.017578125, -49.3505859375, -46.68359375, -44.0166015625, -41.349609375, -38.6826171875, -36.015625, -33.3486328125, -30.681640625, -28.0146484375, -25.34765625, -22.6806640625, -20.013671875, -17.3466796875, -14.6796875, -12.0126953125, -9.345703125, -6.6787109375, -4.01171875, -1.3447265625, 1.322265625, 3.9892578125, 6.65625, 9.3232421875, 11.990234375, 14.6572265625, 17.32421875, 19.9912109375, 22.658203125, 25.3251953125, 27.9921875, 30.6591796875, 33.326171875, 35.9931640625, 38.66015625, 41.3271484375, 43.994140625, 46.6611328125, 49.328125, 51.9951171875, 54.662109375, 57.3291015625, 59.99609375, 62.6630859375, 65.330078125, 67.9970703125, 70.6640625, 73.3310546875, 75.998046875, 78.6650390625, 81.33203125, 83.9990234375, 86.666015625, 89.3330078125, 92.0]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 7.0, 5.0, 15.0, 15.0, 13.0, 22.0, 25.0, 46.0, 44.0, 58.0, 57.0, 59.0, 74.0, 77.0, 85.0, 56.0, 60.0, 58.0, 48.0, 41.0, 43.0, 30.0, 20.0, 15.0, 10.0, 5.0, 7.0, 8.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.11126708984375, -5.7498779296875, -5.38848876953125, -5.027099609375, -4.66571044921875, -4.3043212890625, -3.94293212890625, -3.58154296875, -3.22015380859375, -2.8587646484375, -2.49737548828125, -2.135986328125, -1.77459716796875, -1.4132080078125, -1.05181884765625, -0.6904296875, -0.32904052734375, 0.0323486328125, 0.39373779296875, 0.755126953125, 1.11651611328125, 1.4779052734375, 1.83929443359375, 2.20068359375, 2.56207275390625, 2.9234619140625, 3.28485107421875, 3.646240234375, 4.00762939453125, 4.3690185546875, 4.73040771484375, 5.091796875, 5.45318603515625, 5.8145751953125, 6.17596435546875, 6.537353515625, 6.89874267578125, 7.2601318359375, 7.62152099609375, 7.98291015625, 8.34429931640625, 8.7056884765625, 9.06707763671875, 9.428466796875, 9.78985595703125, 10.1512451171875, 10.51263427734375, 10.8740234375, 11.23541259765625, 11.5968017578125, 11.95819091796875, 12.319580078125, 12.68096923828125, 13.0423583984375, 13.40374755859375, 13.76513671875, 14.12652587890625, 14.4879150390625, 14.84930419921875, 15.210693359375, 15.57208251953125, 15.9334716796875, 16.29486083984375, 16.65625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 12.0, 12.0, 12.0, 17.0, 21.0, 34.0, 46.0, 81.0, 106.0, 143.0, 197.0, 294.0, 411.0, 599.0, 947.0, 1567.0, 2872.0, 5802.0, 13245.0, 33511.0, 89191.0, 223958.0, 342798.0, 201187.0, 78171.0, 29512.0, 11574.0, 5358.0, 2635.0, 1491.0, 839.0, 558.0, 400.0, 279.0, 186.0, 153.0, 92.0, 59.0, 52.0, 40.0, 23.0, 23.0, 17.0, 14.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.40625, -49.65966796875, -47.9130859375, -46.16650390625, -44.419921875, -42.67333984375, -40.9267578125, -39.18017578125, -37.43359375, -35.68701171875, -33.9404296875, -32.19384765625, -30.447265625, -28.70068359375, -26.9541015625, -25.20751953125, -23.4609375, -21.71435546875, -19.9677734375, -18.22119140625, -16.474609375, -14.72802734375, -12.9814453125, -11.23486328125, -9.48828125, -7.74169921875, -5.9951171875, -4.24853515625, -2.501953125, -0.75537109375, 0.9912109375, 2.73779296875, 4.484375, 6.23095703125, 7.9775390625, 9.72412109375, 11.470703125, 13.21728515625, 14.9638671875, 16.71044921875, 18.45703125, 20.20361328125, 21.9501953125, 23.69677734375, 25.443359375, 27.18994140625, 28.9365234375, 30.68310546875, 32.4296875, 34.17626953125, 35.9228515625, 37.66943359375, 39.416015625, 41.16259765625, 42.9091796875, 44.65576171875, 46.40234375, 48.14892578125, 49.8955078125, 51.64208984375, 53.388671875, 55.13525390625, 56.8818359375, 58.62841796875, 60.375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 1.0, 10.0, 6.0, 9.0, 12.0, 17.0, 19.0, 16.0, 18.0, 23.0, 24.0, 16.0, 49.0, 31.0, 39.0, 35.0, 32.0, 44.0, 43.0, 34.0, 42.0, 51.0, 33.0, 45.0, 39.0, 32.0, 24.0, 33.0, 28.0, 32.0, 24.0, 21.0, 16.0, 22.0, 11.0, 14.0, 8.0, 9.0, 3.0, 7.0, 5.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-36.21875, -35.1708984375, -34.123046875, -33.0751953125, -32.02734375, -30.9794921875, -29.931640625, -28.8837890625, -27.8359375, -26.7880859375, -25.740234375, -24.6923828125, -23.64453125, -22.5966796875, -21.548828125, -20.5009765625, -19.453125, -18.4052734375, -17.357421875, -16.3095703125, -15.26171875, -14.2138671875, -13.166015625, -12.1181640625, -11.0703125, -10.0224609375, -8.974609375, -7.9267578125, -6.87890625, -5.8310546875, -4.783203125, -3.7353515625, -2.6875, -1.6396484375, -0.591796875, 0.4560546875, 1.50390625, 2.5517578125, 3.599609375, 4.6474609375, 5.6953125, 6.7431640625, 7.791015625, 8.8388671875, 9.88671875, 10.9345703125, 11.982421875, 13.0302734375, 14.078125, 15.1259765625, 16.173828125, 17.2216796875, 18.26953125, 19.3173828125, 20.365234375, 21.4130859375, 22.4609375, 23.5087890625, 24.556640625, 25.6044921875, 26.65234375, 27.7001953125, 28.748046875, 29.7958984375, 30.84375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 5.0, 17.0, 19.0, 24.0, 44.0, 70.0, 82.0, 134.0, 231.0, 391.0, 690.0, 1358.0, 3055.0, 10739.0, 448750.0, 564920.0, 11533.0, 3210.0, 1468.0, 743.0, 397.0, 252.0, 137.0, 91.0, 44.0, 43.0, 34.0, 18.0, 15.0, 5.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.75, -119.486328125, -115.22265625, -110.958984375, -106.6953125, -102.431640625, -98.16796875, -93.904296875, -89.640625, -85.376953125, -81.11328125, -76.849609375, -72.5859375, -68.322265625, -64.05859375, -59.794921875, -55.53125, -51.267578125, -47.00390625, -42.740234375, -38.4765625, -34.212890625, -29.94921875, -25.685546875, -21.421875, -17.158203125, -12.89453125, -8.630859375, -4.3671875, -0.103515625, 4.16015625, 8.423828125, 12.6875, 16.951171875, 21.21484375, 25.478515625, 29.7421875, 34.005859375, 38.26953125, 42.533203125, 46.796875, 51.060546875, 55.32421875, 59.587890625, 63.8515625, 68.115234375, 72.37890625, 76.642578125, 80.90625, 85.169921875, 89.43359375, 93.697265625, 97.9609375, 102.224609375, 106.48828125, 110.751953125, 115.015625, 119.279296875, 123.54296875, 127.806640625, 132.0703125, 136.333984375, 140.59765625, 144.861328125, 149.125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 25.0, 42.0, 119.0, 282.0, 293.0, 132.0, 44.0, 25.0, 12.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0218048095703125, -0.021214723587036133, -0.020624637603759766, -0.0200345516204834, -0.01944446563720703, -0.018854379653930664, -0.018264293670654297, -0.01767420768737793, -0.017084121704101562, -0.016494035720825195, -0.015903949737548828, -0.015313863754272461, -0.014723777770996094, -0.014133691787719727, -0.01354360580444336, -0.012953519821166992, -0.012363433837890625, -0.011773347854614258, -0.01118326187133789, -0.010593175888061523, -0.010003089904785156, -0.009413003921508789, -0.008822917938232422, -0.008232831954956055, -0.0076427459716796875, -0.00705265998840332, -0.006462574005126953, -0.005872488021850586, -0.005282402038574219, -0.0046923160552978516, -0.004102230072021484, -0.003512144088745117, -0.00292205810546875, -0.002331972122192383, -0.0017418861389160156, -0.0011518001556396484, -0.0005617141723632812, 2.8371810913085938e-05, 0.0006184577941894531, 0.0012085437774658203, 0.0017986297607421875, 0.0023887157440185547, 0.002978801727294922, 0.003568887710571289, 0.004158973693847656, 0.0047490596771240234, 0.005339145660400391, 0.005929231643676758, 0.006519317626953125, 0.007109403610229492, 0.007699489593505859, 0.008289575576782227, 0.008879661560058594, 0.009469747543334961, 0.010059833526611328, 0.010649919509887695, 0.011240005493164062, 0.01183009147644043, 0.012420177459716797, 0.013010263442993164, 0.013600349426269531, 0.014190435409545898, 0.014780521392822266, 0.015370607376098633, 0.015960693359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 14.0, 12.0, 22.0, 29.0, 39.0, 58.0, 97.0, 165.0, 315.0, 674.0, 1807.0, 7281.0, 568428.0, 459514.0, 6794.0, 1873.0, 699.0, 301.0, 163.0, 95.0, 59.0, 35.0, 18.0, 18.0, 4.0, 9.0, 3.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-219.0, -212.9140625, -206.828125, -200.7421875, -194.65625, -188.5703125, -182.484375, -176.3984375, -170.3125, -164.2265625, -158.140625, -152.0546875, -145.96875, -139.8828125, -133.796875, -127.7109375, -121.625, -115.5390625, -109.453125, -103.3671875, -97.28125, -91.1953125, -85.109375, -79.0234375, -72.9375, -66.8515625, -60.765625, -54.6796875, -48.59375, -42.5078125, -36.421875, -30.3359375, -24.25, -18.1640625, -12.078125, -5.9921875, 0.09375, 6.1796875, 12.265625, 18.3515625, 24.4375, 30.5234375, 36.609375, 42.6953125, 48.78125, 54.8671875, 60.953125, 67.0390625, 73.125, 79.2109375, 85.296875, 91.3828125, 97.46875, 103.5546875, 109.640625, 115.7265625, 121.8125, 127.8984375, 133.984375, 140.0703125, 146.15625, 152.2421875, 158.328125, 164.4140625, 170.5]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 2.0, 3.0, 4.0, 6.0, 16.0, 17.0, 40.0, 42.0, 80.0, 79.0, 152.0, 193.0, 137.0, 89.0, 59.0, 26.0, 18.0, 14.0, 6.0, 9.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-56.21875, -54.8837890625, -53.548828125, -52.2138671875, -50.87890625, -49.5439453125, -48.208984375, -46.8740234375, -45.5390625, -44.2041015625, -42.869140625, -41.5341796875, -40.19921875, -38.8642578125, -37.529296875, -36.1943359375, -34.859375, -33.5244140625, -32.189453125, -30.8544921875, -29.51953125, -28.1845703125, -26.849609375, -25.5146484375, -24.1796875, -22.8447265625, -21.509765625, -20.1748046875, -18.83984375, -17.5048828125, -16.169921875, -14.8349609375, -13.5, -12.1650390625, -10.830078125, -9.4951171875, -8.16015625, -6.8251953125, -5.490234375, -4.1552734375, -2.8203125, -1.4853515625, -0.150390625, 1.1845703125, 2.51953125, 3.8544921875, 5.189453125, 6.5244140625, 7.859375, 9.1943359375, 10.529296875, 11.8642578125, 13.19921875, 14.5341796875, 15.869140625, 17.2041015625, 18.5390625, 19.8740234375, 21.208984375, 22.5439453125, 23.87890625, 25.2138671875, 26.548828125, 27.8837890625, 29.21875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 7.0, 5.0, 9.0, 14.0, 20.0, 23.0, 52.0, 73.0, 92.0, 110.0, 117.0, 105.0, 107.0, 64.0, 57.0, 49.0, 30.0, 21.0, 12.0, 9.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-397.07916259765625, -382.76373291015625, -368.4482727050781, -354.1328430175781, -339.8173828125, -325.501953125, -311.1865234375, -296.87109375, -282.5556335449219, -268.2402038574219, -253.92474365234375, -239.60931396484375, -225.2938690185547, -210.97842407226562, -196.66299438476562, -182.34754943847656, -168.0321044921875, -153.71665954589844, -139.40121459960938, -125.08578491210938, -110.77033996582031, -96.45489501953125, -82.13945770263672, -67.82402038574219, -53.508575439453125, -39.19313430786133, -24.87769317626953, -10.562252044677734, 3.7531890869140625, 18.068634033203125, 32.384071350097656, 46.69950866699219, 61.01495361328125, 75.33039855957031, 89.64583587646484, 103.96127319335938, 118.27671813964844, 132.5921630859375, 146.9075927734375, 161.22303771972656, 175.53848266601562, 189.8539276123047, 204.16937255859375, 218.48480224609375, 232.8002471923828, 247.11569213867188, 261.4311218261719, 275.74658203125, 290.06201171875, 304.37744140625, 318.6929016113281, 333.0083312988281, 347.32379150390625, 361.63922119140625, 375.95465087890625, 390.27008056640625, 404.5855407714844, 418.9009704589844, 433.2164306640625, 447.5318603515625, 461.8472900390625, 476.1627502441406, 490.4781799316406, 504.79364013671875, 519.1090698242188]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 5.0, 3.0, 7.0, 7.0, 17.0, 14.0, 14.0, 20.0, 21.0, 24.0, 21.0, 29.0, 35.0, 41.0, 31.0, 52.0, 50.0, 44.0, 42.0, 35.0, 54.0, 46.0, 33.0, 53.0, 41.0, 26.0, 25.0, 32.0, 31.0, 16.0, 15.0, 23.0, 19.0, 23.0, 6.0, 11.0, 5.0, 5.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-210.11585998535156, -203.5716552734375, -197.0274658203125, -190.48326110839844, -183.93905639648438, -177.3948516845703, -170.85064697265625, -164.30645751953125, -157.7622528076172, -151.21804809570312, -144.67385864257812, -138.12965393066406, -131.58544921875, -125.04124450683594, -118.4970474243164, -111.95285034179688, -105.40864562988281, -98.86444091796875, -92.32024383544922, -85.77604675292969, -79.23184204101562, -72.68763732910156, -66.14344024658203, -59.599239349365234, -53.05503845214844, -46.51083755493164, -39.966636657714844, -33.42243576049805, -26.87823486328125, -20.334033966064453, -13.789833068847656, -7.245632171630859, -0.701446533203125, 5.842754364013672, 12.386955261230469, 18.931156158447266, 25.475357055664062, 32.01955795288086, 38.563758850097656, 45.10795974731445, 51.65216064453125, 58.19636154174805, 64.74056243896484, 71.28475952148438, 77.82896423339844, 84.3731689453125, 90.91736602783203, 97.46156311035156, 104.00576782226562, 110.54997253417969, 117.09416961669922, 123.63836669921875, 130.1825714111328, 136.72677612304688, 143.27096557617188, 149.81517028808594, 156.359375, 162.90357971191406, 169.44778442382812, 175.99197387695312, 182.5361785888672, 189.08038330078125, 195.62457275390625, 202.1687774658203, 208.71298217773438]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 14.0, 23.0, 27.0, 35.0, 70.0, 89.0, 131.0, 222.0, 415.0, 715.0, 1489.0, 3575.0, 9090.0, 28129.0, 122101.0, 3255549.0, 667685.0, 73701.0, 19239.0, 6573.0, 2699.0, 1244.0, 572.0, 332.0, 191.0, 116.0, 70.0, 42.0, 33.0, 24.0, 27.0, 17.0, 7.0, 5.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-104.125, -100.955078125, -97.78515625, -94.615234375, -91.4453125, -88.275390625, -85.10546875, -81.935546875, -78.765625, -75.595703125, -72.42578125, -69.255859375, -66.0859375, -62.916015625, -59.74609375, -56.576171875, -53.40625, -50.236328125, -47.06640625, -43.896484375, -40.7265625, -37.556640625, -34.38671875, -31.216796875, -28.046875, -24.876953125, -21.70703125, -18.537109375, -15.3671875, -12.197265625, -9.02734375, -5.857421875, -2.6875, 0.482421875, 3.65234375, 6.822265625, 9.9921875, 13.162109375, 16.33203125, 19.501953125, 22.671875, 25.841796875, 29.01171875, 32.181640625, 35.3515625, 38.521484375, 41.69140625, 44.861328125, 48.03125, 51.201171875, 54.37109375, 57.541015625, 60.7109375, 63.880859375, 67.05078125, 70.220703125, 73.390625, 76.560546875, 79.73046875, 82.900390625, 86.0703125, 89.240234375, 92.41015625, 95.580078125, 98.75]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 5.0, 7.0, 11.0, 14.0, 22.0, 19.0, 24.0, 31.0, 57.0, 42.0, 66.0, 70.0, 69.0, 81.0, 71.0, 68.0, 57.0, 59.0, 58.0, 48.0, 40.0, 28.0, 17.0, 9.0, 14.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.46875, -7.09228515625, -6.7158203125, -6.33935546875, -5.962890625, -5.58642578125, -5.2099609375, -4.83349609375, -4.45703125, -4.08056640625, -3.7041015625, -3.32763671875, -2.951171875, -2.57470703125, -2.1982421875, -1.82177734375, -1.4453125, -1.06884765625, -0.6923828125, -0.31591796875, 0.060546875, 0.43701171875, 0.8134765625, 1.18994140625, 1.56640625, 1.94287109375, 2.3193359375, 2.69580078125, 3.072265625, 3.44873046875, 3.8251953125, 4.20166015625, 4.578125, 4.95458984375, 5.3310546875, 5.70751953125, 6.083984375, 6.46044921875, 6.8369140625, 7.21337890625, 7.58984375, 7.96630859375, 8.3427734375, 8.71923828125, 9.095703125, 9.47216796875, 9.8486328125, 10.22509765625, 10.6015625, 10.97802734375, 11.3544921875, 11.73095703125, 12.107421875, 12.48388671875, 12.8603515625, 13.23681640625, 13.61328125, 13.98974609375, 14.3662109375, 14.74267578125, 15.119140625, 15.49560546875, 15.8720703125, 16.24853515625, 16.625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 5.0, 7.0, 9.0, 11.0, 13.0, 20.0, 27.0, 44.0, 63.0, 113.0, 199.0, 300.0, 589.0, 967.0, 2027.0, 4647.0, 11684.0, 36738.0, 151545.0, 2843751.0, 987045.0, 108110.0, 28555.0, 9918.0, 3993.0, 1773.0, 861.0, 457.0, 306.0, 165.0, 109.0, 74.0, 43.0, 37.0, 24.0, 14.0, 14.0, 4.0, 2.0, 4.0, 5.0, 9.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-109.875, -106.896484375, -103.91796875, -100.939453125, -97.9609375, -94.982421875, -92.00390625, -89.025390625, -86.046875, -83.068359375, -80.08984375, -77.111328125, -74.1328125, -71.154296875, -68.17578125, -65.197265625, -62.21875, -59.240234375, -56.26171875, -53.283203125, -50.3046875, -47.326171875, -44.34765625, -41.369140625, -38.390625, -35.412109375, -32.43359375, -29.455078125, -26.4765625, -23.498046875, -20.51953125, -17.541015625, -14.5625, -11.583984375, -8.60546875, -5.626953125, -2.6484375, 0.330078125, 3.30859375, 6.287109375, 9.265625, 12.244140625, 15.22265625, 18.201171875, 21.1796875, 24.158203125, 27.13671875, 30.115234375, 33.09375, 36.072265625, 39.05078125, 42.029296875, 45.0078125, 47.986328125, 50.96484375, 53.943359375, 56.921875, 59.900390625, 62.87890625, 65.857421875, 68.8359375, 71.814453125, 74.79296875, 77.771484375, 80.75]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 6.0, 12.0, 6.0, 13.0, 14.0, 21.0, 33.0, 38.0, 60.0, 98.0, 102.0, 173.0, 293.0, 659.0, 1335.0, 430.0, 230.0, 141.0, 89.0, 77.0, 48.0, 40.0, 26.0, 26.0, 32.0, 13.0, 13.0, 10.0, 9.0, 7.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.296875, -26.394287109375, -25.49169921875, -24.589111328125, -23.6865234375, -22.783935546875, -21.88134765625, -20.978759765625, -20.076171875, -19.173583984375, -18.27099609375, -17.368408203125, -16.4658203125, -15.563232421875, -14.66064453125, -13.758056640625, -12.85546875, -11.952880859375, -11.05029296875, -10.147705078125, -9.2451171875, -8.342529296875, -7.43994140625, -6.537353515625, -5.634765625, -4.732177734375, -3.82958984375, -2.927001953125, -2.0244140625, -1.121826171875, -0.21923828125, 0.683349609375, 1.5859375, 2.488525390625, 3.39111328125, 4.293701171875, 5.1962890625, 6.098876953125, 7.00146484375, 7.904052734375, 8.806640625, 9.709228515625, 10.61181640625, 11.514404296875, 12.4169921875, 13.319580078125, 14.22216796875, 15.124755859375, 16.02734375, 16.929931640625, 17.83251953125, 18.735107421875, 19.6376953125, 20.540283203125, 21.44287109375, 22.345458984375, 23.248046875, 24.150634765625, 25.05322265625, 25.955810546875, 26.8583984375, 27.760986328125, 28.66357421875, 29.566162109375, 30.46875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 11.0, 18.0, 45.0, 86.0, 184.0, 233.0, 188.0, 128.0, 53.0, 29.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-370.48114013671875, -355.9477844238281, -341.4144592285156, -326.881103515625, -312.3477783203125, -297.8144226074219, -283.28106689453125, -268.74774169921875, -254.21438598632812, -239.68104553222656, -225.147705078125, -210.61434936523438, -196.0810089111328, -181.54766845703125, -167.0143280029297, -152.48098754882812, -137.94764709472656, -123.414306640625, -108.8809585571289, -94.34761810302734, -79.81427001953125, -65.28092956542969, -50.747589111328125, -36.21424102783203, -21.68090057373047, -7.147557258605957, 7.385786056518555, 21.91912841796875, 36.45247268676758, 50.985816955566406, 65.51915740966797, 80.05250549316406, 94.58584594726562, 109.11918640136719, 123.65253448486328, 138.18588256835938, 152.71922302246094, 167.2525634765625, 181.78590393066406, 196.31924438476562, 210.85260009765625, 225.3859405517578, 239.91928100585938, 254.45263671875, 268.9859619140625, 283.5193176269531, 298.05267333984375, 312.58599853515625, 327.11932373046875, 341.6526794433594, 356.1860046386719, 370.7193603515625, 385.252685546875, 399.7860412597656, 414.31939697265625, 428.85272216796875, 443.3860778808594, 457.91943359375, 472.4527587890625, 486.9861145019531, 501.5194396972656, 516.0527954101562, 530.5861206054688, 545.1195068359375, 559.65283203125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 5.0, 9.0, 14.0, 14.0, 14.0, 19.0, 36.0, 36.0, 47.0, 46.0, 47.0, 51.0, 48.0, 55.0, 53.0, 47.0, 55.0, 58.0, 51.0, 34.0, 46.0, 26.0, 26.0, 28.0, 24.0, 26.0, 17.0, 13.0, 11.0, 11.0, 11.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.26533508300781, -112.77194213867188, -108.27854919433594, -103.78515625, -99.29176330566406, -94.79837036132812, -90.30496978759766, -85.81157684326172, -81.31818389892578, -76.82479095458984, -72.3313980102539, -67.83800506591797, -63.344608306884766, -58.85121536254883, -54.357818603515625, -49.86442565917969, -45.37103271484375, -40.87763977050781, -36.384246826171875, -31.890850067138672, -27.397457122802734, -22.904064178466797, -18.410669326782227, -13.917274475097656, -9.423881530761719, -4.930487632751465, -0.43709373474121094, 4.056300163269043, 8.549694061279297, 13.043087005615234, 17.536481857299805, 22.029876708984375, 26.52325439453125, 31.016647338867188, 35.510040283203125, 40.00343704223633, 44.496829986572266, 48.9902229309082, 53.483619689941406, 57.977012634277344, 62.47040557861328, 66.96379852294922, 71.45719146728516, 75.9505844116211, 80.44398498535156, 84.9373779296875, 89.43077087402344, 93.92416381835938, 98.41755676269531, 102.91094970703125, 107.40434265136719, 111.89773559570312, 116.39112854003906, 120.884521484375, 125.37792205810547, 129.87130737304688, 134.36471557617188, 138.8581085205078, 143.35150146484375, 147.8448944091797, 152.33828735351562, 156.83168029785156, 161.3250732421875, 165.8184814453125, 170.31185913085938]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 13.0, 14.0, 20.0, 40.0, 42.0, 85.0, 84.0, 198.0, 326.0, 600.0, 1395.0, 3709.0, 12213.0, 53330.0, 254996.0, 530899.0, 146864.0, 31266.0, 7822.0, 2489.0, 947.0, 479.0, 250.0, 145.0, 86.0, 61.0, 44.0, 29.0, 28.0, 13.0, 15.0, 6.0, 6.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-121.5625, -118.12109375, -114.6796875, -111.23828125, -107.796875, -104.35546875, -100.9140625, -97.47265625, -94.03125, -90.58984375, -87.1484375, -83.70703125, -80.265625, -76.82421875, -73.3828125, -69.94140625, -66.5, -63.05859375, -59.6171875, -56.17578125, -52.734375, -49.29296875, -45.8515625, -42.41015625, -38.96875, -35.52734375, -32.0859375, -28.64453125, -25.203125, -21.76171875, -18.3203125, -14.87890625, -11.4375, -7.99609375, -4.5546875, -1.11328125, 2.328125, 5.76953125, 9.2109375, 12.65234375, 16.09375, 19.53515625, 22.9765625, 26.41796875, 29.859375, 33.30078125, 36.7421875, 40.18359375, 43.625, 47.06640625, 50.5078125, 53.94921875, 57.390625, 60.83203125, 64.2734375, 67.71484375, 71.15625, 74.59765625, 78.0390625, 81.48046875, 84.921875, 88.36328125, 91.8046875, 95.24609375, 98.6875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 11.0, 8.0, 13.0, 26.0, 26.0, 32.0, 48.0, 67.0, 72.0, 79.0, 81.0, 85.0, 66.0, 63.0, 67.0, 58.0, 51.0, 46.0, 32.0, 29.0, 11.0, 16.0, 9.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.27130126953125, -6.8590087890625, -6.44671630859375, -6.034423828125, -5.62213134765625, -5.2098388671875, -4.79754638671875, -4.38525390625, -3.97296142578125, -3.5606689453125, -3.14837646484375, -2.736083984375, -2.32379150390625, -1.9114990234375, -1.49920654296875, -1.0869140625, -0.67462158203125, -0.2623291015625, 0.14996337890625, 0.562255859375, 0.97454833984375, 1.3868408203125, 1.79913330078125, 2.21142578125, 2.62371826171875, 3.0360107421875, 3.44830322265625, 3.860595703125, 4.27288818359375, 4.6851806640625, 5.09747314453125, 5.509765625, 5.92205810546875, 6.3343505859375, 6.74664306640625, 7.158935546875, 7.57122802734375, 7.9835205078125, 8.39581298828125, 8.80810546875, 9.22039794921875, 9.6326904296875, 10.04498291015625, 10.457275390625, 10.86956787109375, 11.2818603515625, 11.69415283203125, 12.1064453125, 12.51873779296875, 12.9310302734375, 13.34332275390625, 13.755615234375, 14.16790771484375, 14.5802001953125, 14.99249267578125, 15.40478515625, 15.81707763671875, 16.2293701171875, 16.64166259765625, 17.053955078125, 17.46624755859375, 17.8785400390625, 18.29083251953125, 18.703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 4.0, 5.0, 5.0, 11.0, 11.0, 12.0, 18.0, 39.0, 46.0, 67.0, 95.0, 103.0, 166.0, 252.0, 377.0, 580.0, 882.0, 1614.0, 2993.0, 5712.0, 12036.0, 26290.0, 59291.0, 129565.0, 259868.0, 279344.0, 145121.0, 66163.0, 29643.0, 13681.0, 6557.0, 3381.0, 1733.0, 956.0, 632.0, 405.0, 273.0, 164.0, 105.0, 97.0, 76.0, 49.0, 39.0, 30.0, 19.0, 13.0, 9.0, 9.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.90625, -45.52978515625, -44.1533203125, -42.77685546875, -41.400390625, -40.02392578125, -38.6474609375, -37.27099609375, -35.89453125, -34.51806640625, -33.1416015625, -31.76513671875, -30.388671875, -29.01220703125, -27.6357421875, -26.25927734375, -24.8828125, -23.50634765625, -22.1298828125, -20.75341796875, -19.376953125, -18.00048828125, -16.6240234375, -15.24755859375, -13.87109375, -12.49462890625, -11.1181640625, -9.74169921875, -8.365234375, -6.98876953125, -5.6123046875, -4.23583984375, -2.859375, -1.48291015625, -0.1064453125, 1.27001953125, 2.646484375, 4.02294921875, 5.3994140625, 6.77587890625, 8.15234375, 9.52880859375, 10.9052734375, 12.28173828125, 13.658203125, 15.03466796875, 16.4111328125, 17.78759765625, 19.1640625, 20.54052734375, 21.9169921875, 23.29345703125, 24.669921875, 26.04638671875, 27.4228515625, 28.79931640625, 30.17578125, 31.55224609375, 32.9287109375, 34.30517578125, 35.681640625, 37.05810546875, 38.4345703125, 39.81103515625, 41.1875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 9.0, 7.0, 14.0, 14.0, 16.0, 15.0, 25.0, 20.0, 22.0, 26.0, 32.0, 35.0, 42.0, 32.0, 39.0, 44.0, 38.0, 38.0, 51.0, 45.0, 42.0, 56.0, 41.0, 34.0, 34.0, 21.0, 31.0, 26.0, 24.0, 20.0, 13.0, 20.0, 9.0, 12.0, 13.0, 5.0, 6.0, 1.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.59375, -33.53076171875, -32.4677734375, -31.40478515625, -30.341796875, -29.27880859375, -28.2158203125, -27.15283203125, -26.08984375, -25.02685546875, -23.9638671875, -22.90087890625, -21.837890625, -20.77490234375, -19.7119140625, -18.64892578125, -17.5859375, -16.52294921875, -15.4599609375, -14.39697265625, -13.333984375, -12.27099609375, -11.2080078125, -10.14501953125, -9.08203125, -8.01904296875, -6.9560546875, -5.89306640625, -4.830078125, -3.76708984375, -2.7041015625, -1.64111328125, -0.578125, 0.48486328125, 1.5478515625, 2.61083984375, 3.673828125, 4.73681640625, 5.7998046875, 6.86279296875, 7.92578125, 8.98876953125, 10.0517578125, 11.11474609375, 12.177734375, 13.24072265625, 14.3037109375, 15.36669921875, 16.4296875, 17.49267578125, 18.5556640625, 19.61865234375, 20.681640625, 21.74462890625, 22.8076171875, 23.87060546875, 24.93359375, 25.99658203125, 27.0595703125, 28.12255859375, 29.185546875, 30.24853515625, 31.3115234375, 32.37451171875, 33.4375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 2.0, 7.0, 13.0, 15.0, 12.0, 30.0, 37.0, 56.0, 83.0, 161.0, 272.0, 499.0, 1035.0, 2188.0, 5638.0, 18987.0, 93666.0, 576461.0, 290134.0, 41869.0, 10708.0, 3577.0, 1472.0, 659.0, 375.0, 205.0, 135.0, 77.0, 41.0, 31.0, 37.0, 16.0, 10.0, 15.0, 7.0, 4.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-57.40625, -55.75537109375, -54.1044921875, -52.45361328125, -50.802734375, -49.15185546875, -47.5009765625, -45.85009765625, -44.19921875, -42.54833984375, -40.8974609375, -39.24658203125, -37.595703125, -35.94482421875, -34.2939453125, -32.64306640625, -30.9921875, -29.34130859375, -27.6904296875, -26.03955078125, -24.388671875, -22.73779296875, -21.0869140625, -19.43603515625, -17.78515625, -16.13427734375, -14.4833984375, -12.83251953125, -11.181640625, -9.53076171875, -7.8798828125, -6.22900390625, -4.578125, -2.92724609375, -1.2763671875, 0.37451171875, 2.025390625, 3.67626953125, 5.3271484375, 6.97802734375, 8.62890625, 10.27978515625, 11.9306640625, 13.58154296875, 15.232421875, 16.88330078125, 18.5341796875, 20.18505859375, 21.8359375, 23.48681640625, 25.1376953125, 26.78857421875, 28.439453125, 30.09033203125, 31.7412109375, 33.39208984375, 35.04296875, 36.69384765625, 38.3447265625, 39.99560546875, 41.646484375, 43.29736328125, 44.9482421875, 46.59912109375, 48.25]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 1.0, 9.0, 11.0, 19.0, 18.0, 23.0, 29.0, 44.0, 44.0, 64.0, 77.0, 87.0, 114.0, 104.0, 64.0, 62.0, 50.0, 35.0, 26.0, 25.0, 14.0, 13.0, 10.0, 13.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004863739013671875, -0.004704892635345459, -0.004546046257019043, -0.004387199878692627, -0.004228353500366211, -0.004069507122039795, -0.003910660743713379, -0.003751814365386963, -0.003592967987060547, -0.003434121608734131, -0.003275275230407715, -0.003116428852081299, -0.002957582473754883, -0.002798736095428467, -0.0026398897171020508, -0.0024810433387756348, -0.0023221969604492188, -0.0021633505821228027, -0.0020045042037963867, -0.0018456578254699707, -0.0016868114471435547, -0.0015279650688171387, -0.0013691186904907227, -0.0012102723121643066, -0.0010514259338378906, -0.0008925795555114746, -0.0007337331771850586, -0.0005748867988586426, -0.00041604042053222656, -0.00025719404220581055, -9.834766387939453e-05, 6.0498714447021484e-05, 0.0002193450927734375, 0.0003781914710998535, 0.0005370378494262695, 0.0006958842277526855, 0.0008547306060791016, 0.0010135769844055176, 0.0011724233627319336, 0.0013312697410583496, 0.0014901161193847656, 0.0016489624977111816, 0.0018078088760375977, 0.0019666552543640137, 0.0021255016326904297, 0.0022843480110168457, 0.0024431943893432617, 0.0026020407676696777, 0.0027608871459960938, 0.0029197335243225098, 0.0030785799026489258, 0.003237426280975342, 0.003396272659301758, 0.003555119037628174, 0.00371396541595459, 0.003872811794281006, 0.004031658172607422, 0.004190504550933838, 0.004349350929260254, 0.00450819730758667, 0.004667043685913086, 0.004825890064239502, 0.004984736442565918, 0.005143582820892334, 0.00530242919921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 12.0, 7.0, 12.0, 17.0, 13.0, 30.0, 64.0, 99.0, 163.0, 248.0, 491.0, 876.0, 1816.0, 4182.0, 12111.0, 50530.0, 389188.0, 499534.0, 65242.0, 14674.0, 4840.0, 2145.0, 1041.0, 504.0, 291.0, 136.0, 108.0, 55.0, 36.0, 32.0, 25.0, 14.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.09375, -57.359375, -55.625, -53.890625, -52.15625, -50.421875, -48.6875, -46.953125, -45.21875, -43.484375, -41.75, -40.015625, -38.28125, -36.546875, -34.8125, -33.078125, -31.34375, -29.609375, -27.875, -26.140625, -24.40625, -22.671875, -20.9375, -19.203125, -17.46875, -15.734375, -14.0, -12.265625, -10.53125, -8.796875, -7.0625, -5.328125, -3.59375, -1.859375, -0.125, 1.609375, 3.34375, 5.078125, 6.8125, 8.546875, 10.28125, 12.015625, 13.75, 15.484375, 17.21875, 18.953125, 20.6875, 22.421875, 24.15625, 25.890625, 27.625, 29.359375, 31.09375, 32.828125, 34.5625, 36.296875, 38.03125, 39.765625, 41.5, 43.234375, 44.96875, 46.703125, 48.4375, 50.171875, 51.90625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 10.0, 14.0, 16.0, 28.0, 34.0, 36.0, 59.0, 70.0, 78.0, 88.0, 100.0, 90.0, 74.0, 67.0, 49.0, 48.0, 30.0, 27.0, 15.0, 15.0, 11.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.125, -35.253662109375, -34.38232421875, -33.510986328125, -32.6396484375, -31.768310546875, -30.89697265625, -30.025634765625, -29.154296875, -28.282958984375, -27.41162109375, -26.540283203125, -25.6689453125, -24.797607421875, -23.92626953125, -23.054931640625, -22.18359375, -21.312255859375, -20.44091796875, -19.569580078125, -18.6982421875, -17.826904296875, -16.95556640625, -16.084228515625, -15.212890625, -14.341552734375, -13.47021484375, -12.598876953125, -11.7275390625, -10.856201171875, -9.98486328125, -9.113525390625, -8.2421875, -7.370849609375, -6.49951171875, -5.628173828125, -4.7568359375, -3.885498046875, -3.01416015625, -2.142822265625, -1.271484375, -0.400146484375, 0.47119140625, 1.342529296875, 2.2138671875, 3.085205078125, 3.95654296875, 4.827880859375, 5.69921875, 6.570556640625, 7.44189453125, 8.313232421875, 9.1845703125, 10.055908203125, 10.92724609375, 11.798583984375, 12.669921875, 13.541259765625, 14.41259765625, 15.283935546875, 16.1552734375, 17.026611328125, 17.89794921875, 18.769287109375, 19.640625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 17.0, 26.0, 52.0, 66.0, 119.0, 162.0, 180.0, 138.0, 95.0, 48.0, 39.0, 19.0, 10.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-852.5416259765625, -833.6793823242188, -814.817138671875, -795.9548950195312, -777.0926513671875, -758.2303466796875, -739.3681030273438, -720.505859375, -701.6436157226562, -682.7813720703125, -663.9191284179688, -645.056884765625, -626.194580078125, -607.3323364257812, -588.4700927734375, -569.6078491210938, -550.74560546875, -531.8833618164062, -513.0211181640625, -494.1588439941406, -475.2966003417969, -456.4343566894531, -437.57208251953125, -418.7098388671875, -399.84759521484375, -380.9853515625, -362.12310791015625, -343.2608337402344, -324.3985900878906, -305.5363464355469, -286.674072265625, -267.81182861328125, -248.94955444335938, -230.08731079101562, -211.2250518798828, -192.36279296875, -173.50054931640625, -154.6383056640625, -135.7760467529297, -116.91378784179688, -98.05154418945312, -79.18929290771484, -60.32704162597656, -41.46479034423828, -22.6025390625, -3.7402877807617188, 15.121963500976562, 33.984222412109375, 52.846466064453125, 71.7087173461914, 90.57096862792969, 109.43321990966797, 128.29547119140625, 147.15771484375, 166.0199737548828, 184.88223266601562, 203.74447631835938, 222.60671997070312, 241.46897888183594, 260.33123779296875, 279.1934814453125, 298.05572509765625, 316.91796875, 335.7802429199219, 354.6424865722656]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 10.0, 5.0, 6.0, 7.0, 14.0, 9.0, 8.0, 11.0, 21.0, 11.0, 21.0, 26.0, 22.0, 34.0, 32.0, 33.0, 40.0, 34.0, 52.0, 44.0, 52.0, 42.0, 44.0, 38.0, 39.0, 47.0, 30.0, 37.0, 17.0, 34.0, 22.0, 22.0, 18.0, 18.0, 20.0, 8.0, 13.0, 11.0, 8.0, 6.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-191.688232421875, -185.8914031982422, -180.09458923339844, -174.29776000976562, -168.5009307861328, -162.7041015625, -156.90728759765625, -151.11045837402344, -145.31362915039062, -139.5167999267578, -133.71998596191406, -127.92315673828125, -122.12632751464844, -116.32950592041016, -110.53268432617188, -104.73585510253906, -98.93904113769531, -93.14221954345703, -87.34539031982422, -81.54856872558594, -75.75173950195312, -69.95491790771484, -64.15809631347656, -58.361270904541016, -52.56444549560547, -46.76762008666992, -40.970794677734375, -35.173973083496094, -29.377147674560547, -23.580322265625, -17.78350067138672, -11.986675262451172, -6.1898345947265625, -0.39301013946533203, 5.403814315795898, 11.200637817382812, 16.99746322631836, 22.794288635253906, 28.591110229492188, 34.387935638427734, 40.18476104736328, 45.98158645629883, 51.778411865234375, 57.575233459472656, 63.3720588684082, 69.16888427734375, 74.96570587158203, 80.76252746582031, 86.55935668945312, 92.3561782836914, 98.15300750732422, 103.9498291015625, 109.74665832519531, 115.5434799194336, 121.34030151367188, 127.13713073730469, 132.9339599609375, 138.7307891845703, 144.52760314941406, 150.32443237304688, 156.1212615966797, 161.9180908203125, 167.71490478515625, 173.51173400878906, 179.3085479736328]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 12.0, 14.0, 21.0, 35.0, 63.0, 98.0, 161.0, 321.0, 573.0, 1355.0, 3469.0, 11218.0, 50221.0, 3011631.0, 1054122.0, 44816.0, 10219.0, 3312.0, 1328.0, 568.0, 305.0, 162.0, 79.0, 51.0, 42.0, 27.0, 11.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.875, -103.875, -99.875, -95.875, -91.875, -87.875, -83.875, -79.875, -75.875, -71.875, -67.875, -63.875, -59.875, -55.875, -51.875, -47.875, -43.875, -39.875, -35.875, -31.875, -27.875, -23.875, -19.875, -15.875, -11.875, -7.875, -3.875, 0.125, 4.125, 8.125, 12.125, 16.125, 20.125, 24.125, 28.125, 32.125, 36.125, 40.125, 44.125, 48.125, 52.125, 56.125, 60.125, 64.125, 68.125, 72.125, 76.125, 80.125, 84.125, 88.125, 92.125, 96.125, 100.125, 104.125, 108.125, 112.125, 116.125, 120.125, 124.125, 128.125, 132.125, 136.125, 140.125, 144.125, 148.125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 8.0, 7.0, 15.0, 17.0, 31.0, 41.0, 42.0, 51.0, 61.0, 86.0, 65.0, 80.0, 75.0, 72.0, 67.0, 58.0, 63.0, 54.0, 33.0, 19.0, 18.0, 16.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.765625, -7.354736328125, -6.94384765625, -6.532958984375, -6.1220703125, -5.711181640625, -5.30029296875, -4.889404296875, -4.478515625, -4.067626953125, -3.65673828125, -3.245849609375, -2.8349609375, -2.424072265625, -2.01318359375, -1.602294921875, -1.19140625, -0.780517578125, -0.36962890625, 0.041259765625, 0.4521484375, 0.863037109375, 1.27392578125, 1.684814453125, 2.095703125, 2.506591796875, 2.91748046875, 3.328369140625, 3.7392578125, 4.150146484375, 4.56103515625, 4.971923828125, 5.3828125, 5.793701171875, 6.20458984375, 6.615478515625, 7.0263671875, 7.437255859375, 7.84814453125, 8.259033203125, 8.669921875, 9.080810546875, 9.49169921875, 9.902587890625, 10.3134765625, 10.724365234375, 11.13525390625, 11.546142578125, 11.95703125, 12.367919921875, 12.77880859375, 13.189697265625, 13.6005859375, 14.011474609375, 14.42236328125, 14.833251953125, 15.244140625, 15.655029296875, 16.06591796875, 16.476806640625, 16.8876953125, 17.298583984375, 17.70947265625, 18.120361328125, 18.53125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 11.0, 11.0, 23.0, 15.0, 29.0, 39.0, 52.0, 92.0, 161.0, 273.0, 491.0, 1117.0, 3037.0, 9789.0, 41161.0, 274191.0, 3628035.0, 190397.0, 32450.0, 8272.0, 2554.0, 984.0, 448.0, 209.0, 131.0, 87.0, 69.0, 49.0, 31.0, 28.0, 16.0, 11.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.375, -120.1640625, -116.953125, -113.7421875, -110.53125, -107.3203125, -104.109375, -100.8984375, -97.6875, -94.4765625, -91.265625, -88.0546875, -84.84375, -81.6328125, -78.421875, -75.2109375, -72.0, -68.7890625, -65.578125, -62.3671875, -59.15625, -55.9453125, -52.734375, -49.5234375, -46.3125, -43.1015625, -39.890625, -36.6796875, -33.46875, -30.2578125, -27.046875, -23.8359375, -20.625, -17.4140625, -14.203125, -10.9921875, -7.78125, -4.5703125, -1.359375, 1.8515625, 5.0625, 8.2734375, 11.484375, 14.6953125, 17.90625, 21.1171875, 24.328125, 27.5390625, 30.75, 33.9609375, 37.171875, 40.3828125, 43.59375, 46.8046875, 50.015625, 53.2265625, 56.4375, 59.6484375, 62.859375, 66.0703125, 69.28125, 72.4921875, 75.703125, 78.9140625, 82.125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 9.0, 21.0, 30.0, 46.0, 54.0, 83.0, 180.0, 348.0, 1923.0, 770.0, 229.0, 125.0, 78.0, 63.0, 38.0, 21.0, 20.0, 9.0, 8.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.58349609375, -28.4794921875, -27.37548828125, -26.271484375, -25.16748046875, -24.0634765625, -22.95947265625, -21.85546875, -20.75146484375, -19.6474609375, -18.54345703125, -17.439453125, -16.33544921875, -15.2314453125, -14.12744140625, -13.0234375, -11.91943359375, -10.8154296875, -9.71142578125, -8.607421875, -7.50341796875, -6.3994140625, -5.29541015625, -4.19140625, -3.08740234375, -1.9833984375, -0.87939453125, 0.224609375, 1.32861328125, 2.4326171875, 3.53662109375, 4.640625, 5.74462890625, 6.8486328125, 7.95263671875, 9.056640625, 10.16064453125, 11.2646484375, 12.36865234375, 13.47265625, 14.57666015625, 15.6806640625, 16.78466796875, 17.888671875, 18.99267578125, 20.0966796875, 21.20068359375, 22.3046875, 23.40869140625, 24.5126953125, 25.61669921875, 26.720703125, 27.82470703125, 28.9287109375, 30.03271484375, 31.13671875, 32.24072265625, 33.3447265625, 34.44873046875, 35.552734375, 36.65673828125, 37.7607421875, 38.86474609375, 39.96875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 11.0, 48.0, 66.0, 163.0, 248.0, 218.0, 131.0, 67.0, 26.0, 12.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-573.6349487304688, -562.0990600585938, -550.5631713867188, -539.02734375, -527.491455078125, -515.95556640625, -504.419677734375, -492.8837890625, -481.347900390625, -469.81201171875, -458.2761535644531, -446.7402648925781, -435.2043762207031, -423.66851806640625, -412.13262939453125, -400.59674072265625, -389.0608825683594, -377.5249938964844, -365.9891357421875, -354.4532470703125, -342.9173583984375, -331.3814697265625, -319.8456115722656, -308.3097229003906, -296.77386474609375, -285.23797607421875, -273.7021179199219, -262.1662292480469, -250.63034057617188, -239.09446716308594, -227.55859375, -216.022705078125, -204.48684692382812, -192.9509735107422, -181.4150848388672, -169.87921142578125, -158.34332275390625, -146.8074493408203, -135.27157592773438, -123.7356948852539, -112.19981384277344, -100.66393280029297, -89.1280517578125, -77.59217834472656, -66.0562973022461, -54.520416259765625, -42.98454284667969, -31.44866180419922, -19.91278076171875, -8.376901626586914, 3.158977508544922, 14.694854736328125, 26.230735778808594, 37.76661682128906, 49.302490234375, 60.83837127685547, 72.37425231933594, 83.9101333618164, 95.44601440429688, 106.98188781738281, 118.51776885986328, 130.05364990234375, 141.5895233154297, 153.12539672851562, 164.66128540039062]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 6.0, 11.0, 2.0, 9.0, 17.0, 14.0, 12.0, 19.0, 17.0, 24.0, 36.0, 31.0, 29.0, 25.0, 34.0, 54.0, 40.0, 51.0, 43.0, 37.0, 43.0, 43.0, 47.0, 37.0, 49.0, 31.0, 39.0, 36.0, 28.0, 25.0, 18.0, 22.0, 15.0, 15.0, 13.0, 7.0, 4.0, 4.0, 9.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0], "bins": [-111.92119598388672, -109.01945495605469, -106.11770629882812, -103.2159652709961, -100.31421661376953, -97.4124755859375, -94.51072692871094, -91.6089859008789, -88.70724487304688, -85.80550384521484, -82.90375518798828, -80.00201416015625, -77.10026550292969, -74.19852447509766, -71.29678344726562, -68.39503479003906, -65.4932861328125, -62.5915412902832, -59.689796447753906, -56.788055419921875, -53.88630676269531, -50.98456573486328, -48.082820892333984, -45.18107604980469, -42.27933120727539, -39.377586364746094, -36.4758415222168, -33.5740966796875, -30.672353744506836, -27.77060890197754, -24.868865966796875, -21.967121124267578, -19.06536865234375, -16.163623809814453, -13.261879920959473, -10.360136032104492, -7.458391189575195, -4.556646347045898, -1.6549034118652344, 1.2468414306640625, 4.148586273193359, 7.050330638885498, 9.952075004577637, 12.853818893432617, 15.755563735961914, 18.65730857849121, 21.559051513671875, 24.460796356201172, 27.36254119873047, 30.264286041259766, 33.16603088378906, 36.067771911621094, 38.969520568847656, 41.87126159667969, 44.773006439208984, 47.67475128173828, 50.57649612426758, 53.478240966796875, 56.37998580932617, 59.28173065185547, 62.1834716796875, 65.08522033691406, 67.9869613647461, 70.88870239257812, 73.79045104980469]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 5.0, 8.0, 8.0, 13.0, 25.0, 25.0, 32.0, 56.0, 78.0, 121.0, 243.0, 388.0, 711.0, 1493.0, 3930.0, 11747.0, 43529.0, 191536.0, 528183.0, 201210.0, 45533.0, 12292.0, 4079.0, 1618.0, 706.0, 372.0, 209.0, 137.0, 63.0, 47.0, 44.0, 36.0, 16.0, 17.0, 21.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-125.0, -121.48046875, -117.9609375, -114.44140625, -110.921875, -107.40234375, -103.8828125, -100.36328125, -96.84375, -93.32421875, -89.8046875, -86.28515625, -82.765625, -79.24609375, -75.7265625, -72.20703125, -68.6875, -65.16796875, -61.6484375, -58.12890625, -54.609375, -51.08984375, -47.5703125, -44.05078125, -40.53125, -37.01171875, -33.4921875, -29.97265625, -26.453125, -22.93359375, -19.4140625, -15.89453125, -12.375, -8.85546875, -5.3359375, -1.81640625, 1.703125, 5.22265625, 8.7421875, 12.26171875, 15.78125, 19.30078125, 22.8203125, 26.33984375, 29.859375, 33.37890625, 36.8984375, 40.41796875, 43.9375, 47.45703125, 50.9765625, 54.49609375, 58.015625, 61.53515625, 65.0546875, 68.57421875, 72.09375, 75.61328125, 79.1328125, 82.65234375, 86.171875, 89.69140625, 93.2109375, 96.73046875, 100.25]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 10.0, 12.0, 22.0, 25.0, 27.0, 34.0, 41.0, 71.0, 53.0, 65.0, 82.0, 76.0, 75.0, 61.0, 66.0, 54.0, 50.0, 42.0, 49.0, 23.0, 19.0, 16.0, 8.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5546875, -8.1405029296875, -7.726318359375, -7.3121337890625, -6.89794921875, -6.4837646484375, -6.069580078125, -5.6553955078125, -5.2412109375, -4.8270263671875, -4.412841796875, -3.9986572265625, -3.58447265625, -3.1702880859375, -2.756103515625, -2.3419189453125, -1.927734375, -1.5135498046875, -1.099365234375, -0.6851806640625, -0.27099609375, 0.1431884765625, 0.557373046875, 0.9715576171875, 1.3857421875, 1.7999267578125, 2.214111328125, 2.6282958984375, 3.04248046875, 3.4566650390625, 3.870849609375, 4.2850341796875, 4.69921875, 5.1134033203125, 5.527587890625, 5.9417724609375, 6.35595703125, 6.7701416015625, 7.184326171875, 7.5985107421875, 8.0126953125, 8.4268798828125, 8.841064453125, 9.2552490234375, 9.66943359375, 10.0836181640625, 10.497802734375, 10.9119873046875, 11.326171875, 11.7403564453125, 12.154541015625, 12.5687255859375, 12.98291015625, 13.3970947265625, 13.811279296875, 14.2254638671875, 14.6396484375, 15.0538330078125, 15.468017578125, 15.8822021484375, 16.29638671875, 16.7105712890625, 17.124755859375, 17.5389404296875, 17.953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 10.0, 18.0, 28.0, 26.0, 44.0, 53.0, 84.0, 129.0, 157.0, 255.0, 367.0, 595.0, 944.0, 1727.0, 3651.0, 9080.0, 24768.0, 73988.0, 219080.0, 400606.0, 204186.0, 69262.0, 23192.0, 8549.0, 3462.0, 1695.0, 901.0, 529.0, 387.0, 205.0, 188.0, 117.0, 75.0, 65.0, 32.0, 29.0, 19.0, 20.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-58.375, -56.458984375, -54.54296875, -52.626953125, -50.7109375, -48.794921875, -46.87890625, -44.962890625, -43.046875, -41.130859375, -39.21484375, -37.298828125, -35.3828125, -33.466796875, -31.55078125, -29.634765625, -27.71875, -25.802734375, -23.88671875, -21.970703125, -20.0546875, -18.138671875, -16.22265625, -14.306640625, -12.390625, -10.474609375, -8.55859375, -6.642578125, -4.7265625, -2.810546875, -0.89453125, 1.021484375, 2.9375, 4.853515625, 6.76953125, 8.685546875, 10.6015625, 12.517578125, 14.43359375, 16.349609375, 18.265625, 20.181640625, 22.09765625, 24.013671875, 25.9296875, 27.845703125, 29.76171875, 31.677734375, 33.59375, 35.509765625, 37.42578125, 39.341796875, 41.2578125, 43.173828125, 45.08984375, 47.005859375, 48.921875, 50.837890625, 52.75390625, 54.669921875, 56.5859375, 58.501953125, 60.41796875, 62.333984375, 64.25]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 6.0, 10.0, 9.0, 6.0, 11.0, 16.0, 14.0, 28.0, 36.0, 28.0, 28.0, 33.0, 49.0, 39.0, 36.0, 47.0, 44.0, 33.0, 46.0, 42.0, 50.0, 39.0, 45.0, 35.0, 41.0, 33.0, 29.0, 23.0, 22.0, 24.0, 13.0, 13.0, 14.0, 11.0, 15.0, 10.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-44.0, -42.75439453125, -41.5087890625, -40.26318359375, -39.017578125, -37.77197265625, -36.5263671875, -35.28076171875, -34.03515625, -32.78955078125, -31.5439453125, -30.29833984375, -29.052734375, -27.80712890625, -26.5615234375, -25.31591796875, -24.0703125, -22.82470703125, -21.5791015625, -20.33349609375, -19.087890625, -17.84228515625, -16.5966796875, -15.35107421875, -14.10546875, -12.85986328125, -11.6142578125, -10.36865234375, -9.123046875, -7.87744140625, -6.6318359375, -5.38623046875, -4.140625, -2.89501953125, -1.6494140625, -0.40380859375, 0.841796875, 2.08740234375, 3.3330078125, 4.57861328125, 5.82421875, 7.06982421875, 8.3154296875, 9.56103515625, 10.806640625, 12.05224609375, 13.2978515625, 14.54345703125, 15.7890625, 17.03466796875, 18.2802734375, 19.52587890625, 20.771484375, 22.01708984375, 23.2626953125, 24.50830078125, 25.75390625, 26.99951171875, 28.2451171875, 29.49072265625, 30.736328125, 31.98193359375, 33.2275390625, 34.47314453125, 35.71875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 17.0, 23.0, 37.0, 84.0, 108.0, 232.0, 562.0, 1761.0, 8786.0, 132084.0, 847427.0, 50199.0, 5081.0, 1297.0, 420.0, 195.0, 98.0, 46.0, 26.0, 20.0, 13.0, 9.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.4375, -99.271484375, -96.10546875, -92.939453125, -89.7734375, -86.607421875, -83.44140625, -80.275390625, -77.109375, -73.943359375, -70.77734375, -67.611328125, -64.4453125, -61.279296875, -58.11328125, -54.947265625, -51.78125, -48.615234375, -45.44921875, -42.283203125, -39.1171875, -35.951171875, -32.78515625, -29.619140625, -26.453125, -23.287109375, -20.12109375, -16.955078125, -13.7890625, -10.623046875, -7.45703125, -4.291015625, -1.125, 2.041015625, 5.20703125, 8.373046875, 11.5390625, 14.705078125, 17.87109375, 21.037109375, 24.203125, 27.369140625, 30.53515625, 33.701171875, 36.8671875, 40.033203125, 43.19921875, 46.365234375, 49.53125, 52.697265625, 55.86328125, 59.029296875, 62.1953125, 65.361328125, 68.52734375, 71.693359375, 74.859375, 78.025390625, 81.19140625, 84.357421875, 87.5234375, 90.689453125, 93.85546875, 97.021484375, 100.1875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 9.0, 15.0, 35.0, 106.0, 234.0, 323.0, 169.0, 67.0, 24.0, 11.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01175689697265625, -0.0111464262008667, -0.010535955429077148, -0.009925484657287598, -0.009315013885498047, -0.008704543113708496, -0.008094072341918945, -0.0074836015701293945, -0.006873130798339844, -0.006262660026550293, -0.005652189254760742, -0.005041718482971191, -0.004431247711181641, -0.00382077693939209, -0.003210306167602539, -0.0025998353958129883, -0.0019893646240234375, -0.0013788938522338867, -0.0007684230804443359, -0.00015795230865478516, 0.0004525184631347656, 0.0010629892349243164, 0.0016734600067138672, 0.002283930778503418, 0.0028944015502929688, 0.0035048723220825195, 0.00411534309387207, 0.004725813865661621, 0.005336284637451172, 0.005946755409240723, 0.0065572261810302734, 0.007167696952819824, 0.007778167724609375, 0.008388638496398926, 0.008999109268188477, 0.009609580039978027, 0.010220050811767578, 0.010830521583557129, 0.01144099235534668, 0.01205146312713623, 0.012661933898925781, 0.013272404670715332, 0.013882875442504883, 0.014493346214294434, 0.015103816986083984, 0.015714287757873535, 0.016324758529663086, 0.016935229301452637, 0.017545700073242188, 0.01815617084503174, 0.01876664161682129, 0.01937711238861084, 0.01998758316040039, 0.02059805393218994, 0.021208524703979492, 0.021818995475769043, 0.022429466247558594, 0.023039937019348145, 0.023650407791137695, 0.024260878562927246, 0.024871349334716797, 0.025481820106506348, 0.0260922908782959, 0.02670276165008545, 0.027313232421875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 10.0, 11.0, 13.0, 21.0, 39.0, 61.0, 75.0, 162.0, 248.0, 547.0, 1479.0, 5694.0, 63727.0, 919690.0, 49141.0, 5167.0, 1346.0, 469.0, 265.0, 138.0, 80.0, 50.0, 45.0, 24.0, 15.0, 10.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-119.1875, -115.3994140625, -111.611328125, -107.8232421875, -104.03515625, -100.2470703125, -96.458984375, -92.6708984375, -88.8828125, -85.0947265625, -81.306640625, -77.5185546875, -73.73046875, -69.9423828125, -66.154296875, -62.3662109375, -58.578125, -54.7900390625, -51.001953125, -47.2138671875, -43.42578125, -39.6376953125, -35.849609375, -32.0615234375, -28.2734375, -24.4853515625, -20.697265625, -16.9091796875, -13.12109375, -9.3330078125, -5.544921875, -1.7568359375, 2.03125, 5.8193359375, 9.607421875, 13.3955078125, 17.18359375, 20.9716796875, 24.759765625, 28.5478515625, 32.3359375, 36.1240234375, 39.912109375, 43.7001953125, 47.48828125, 51.2763671875, 55.064453125, 58.8525390625, 62.640625, 66.4287109375, 70.216796875, 74.0048828125, 77.79296875, 81.5810546875, 85.369140625, 89.1572265625, 92.9453125, 96.7333984375, 100.521484375, 104.3095703125, 108.09765625, 111.8857421875, 115.673828125, 119.4619140625, 123.25]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 6.0, 14.0, 27.0, 51.0, 82.0, 200.0, 242.0, 179.0, 98.0, 52.0, 19.0, 10.0, 5.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.0625, -63.7373046875, -61.412109375, -59.0869140625, -56.76171875, -54.4365234375, -52.111328125, -49.7861328125, -47.4609375, -45.1357421875, -42.810546875, -40.4853515625, -38.16015625, -35.8349609375, -33.509765625, -31.1845703125, -28.859375, -26.5341796875, -24.208984375, -21.8837890625, -19.55859375, -17.2333984375, -14.908203125, -12.5830078125, -10.2578125, -7.9326171875, -5.607421875, -3.2822265625, -0.95703125, 1.3681640625, 3.693359375, 6.0185546875, 8.34375, 10.6689453125, 12.994140625, 15.3193359375, 17.64453125, 19.9697265625, 22.294921875, 24.6201171875, 26.9453125, 29.2705078125, 31.595703125, 33.9208984375, 36.24609375, 38.5712890625, 40.896484375, 43.2216796875, 45.546875, 47.8720703125, 50.197265625, 52.5224609375, 54.84765625, 57.1728515625, 59.498046875, 61.8232421875, 64.1484375, 66.4736328125, 68.798828125, 71.1240234375, 73.44921875, 75.7744140625, 78.099609375, 80.4248046875, 82.75]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 9.0, 17.0, 15.0, 28.0, 34.0, 50.0, 79.0, 86.0, 76.0, 102.0, 96.0, 89.0, 78.0, 53.0, 44.0, 39.0, 25.0, 22.0, 8.0, 14.0, 10.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-291.9845275878906, -280.6142272949219, -269.24395751953125, -257.8736572265625, -246.5033721923828, -235.13308715820312, -223.76278686523438, -212.3925018310547, -201.022216796875, -189.6519317626953, -178.28164672851562, -166.91134643554688, -155.5410614013672, -144.1707763671875, -132.80047607421875, -121.43019104003906, -110.05990600585938, -98.68962097167969, -87.31932830810547, -75.94903564453125, -64.57875061035156, -53.20846176147461, -41.838172912597656, -30.467880249023438, -19.09759521484375, -7.727306365966797, 3.6429824829101562, 15.01327133178711, 26.383560180664062, 37.753849029541016, 49.12413787841797, 60.49443054199219, 71.86471557617188, 83.23500061035156, 94.60529327392578, 105.9755859375, 117.34587097167969, 128.71615600585938, 140.08645629882812, 151.4567413330078, 162.8270263671875, 174.1973114013672, 185.56759643554688, 196.93789672851562, 208.3081817626953, 219.678466796875, 231.04876708984375, 242.41905212402344, 253.78933715820312, 265.1596374511719, 276.5299072265625, 287.90020751953125, 299.2705078125, 310.6407775878906, 322.0110778808594, 333.38134765625, 344.75164794921875, 356.1219482421875, 367.4922180175781, 378.8625183105469, 390.2327880859375, 401.60308837890625, 412.973388671875, 424.34368896484375, 435.7139587402344]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 12.0, 10.0, 14.0, 16.0, 14.0, 30.0, 23.0, 19.0, 31.0, 31.0, 28.0, 46.0, 34.0, 34.0, 40.0, 36.0, 42.0, 38.0, 39.0, 43.0, 39.0, 42.0, 38.0, 31.0, 37.0, 31.0, 21.0, 19.0, 17.0, 17.0, 25.0, 14.0, 16.0, 10.0, 8.0, 7.0, 12.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-239.72491455078125, -232.7813262939453, -225.83773803710938, -218.89414978027344, -211.9505615234375, -205.00697326660156, -198.06338500976562, -191.11978149414062, -184.17620849609375, -177.2326202392578, -170.28903198242188, -163.34544372558594, -156.40185546875, -149.45826721191406, -142.51467895507812, -135.57107543945312, -128.6274871826172, -121.68389892578125, -114.74031066894531, -107.79672241210938, -100.85313415527344, -93.9095458984375, -86.96595001220703, -80.0223617553711, -73.07877349853516, -66.13518524169922, -59.19159698486328, -52.24800491333008, -45.30441665649414, -38.3608283996582, -31.417236328125, -24.473648071289062, -17.530044555664062, -10.586455345153809, -3.6428661346435547, 3.3007240295410156, 10.244312286376953, 17.18790054321289, 24.131492614746094, 31.07508087158203, 38.01866912841797, 44.962257385253906, 51.905845642089844, 58.84943771362305, 65.79302978515625, 72.73661804199219, 79.68020629882812, 86.62379455566406, 93.5673828125, 100.51097106933594, 107.45455932617188, 114.39814758300781, 121.34173583984375, 128.2853240966797, 135.22891235351562, 142.17251586914062, 149.1160888671875, 156.05967712402344, 163.00326538085938, 169.9468536376953, 176.89044189453125, 183.8340301513672, 190.77761840820312, 197.72122192382812, 204.66481018066406]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 1.0, 11.0, 11.0, 15.0, 14.0, 40.0, 42.0, 57.0, 109.0, 168.0, 344.0, 602.0, 1319.0, 2962.0, 7618.0, 24315.0, 107657.0, 3398732.0, 563621.0, 61078.0, 15813.0, 5377.0, 2177.0, 974.0, 506.0, 265.0, 170.0, 77.0, 55.0, 50.0, 25.0, 18.0, 14.0, 6.0, 6.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-99.5625, -96.4345703125, -93.306640625, -90.1787109375, -87.05078125, -83.9228515625, -80.794921875, -77.6669921875, -74.5390625, -71.4111328125, -68.283203125, -65.1552734375, -62.02734375, -58.8994140625, -55.771484375, -52.6435546875, -49.515625, -46.3876953125, -43.259765625, -40.1318359375, -37.00390625, -33.8759765625, -30.748046875, -27.6201171875, -24.4921875, -21.3642578125, -18.236328125, -15.1083984375, -11.98046875, -8.8525390625, -5.724609375, -2.5966796875, 0.53125, 3.6591796875, 6.787109375, 9.9150390625, 13.04296875, 16.1708984375, 19.298828125, 22.4267578125, 25.5546875, 28.6826171875, 31.810546875, 34.9384765625, 38.06640625, 41.1943359375, 44.322265625, 47.4501953125, 50.578125, 53.7060546875, 56.833984375, 59.9619140625, 63.08984375, 66.2177734375, 69.345703125, 72.4736328125, 75.6015625, 78.7294921875, 81.857421875, 84.9853515625, 88.11328125, 91.2412109375, 94.369140625, 97.4970703125, 100.625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 12.0, 7.0, 11.0, 23.0, 24.0, 26.0, 37.0, 49.0, 52.0, 55.0, 71.0, 75.0, 71.0, 67.0, 58.0, 68.0, 44.0, 53.0, 48.0, 34.0, 36.0, 24.0, 19.0, 10.0, 7.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.40838623046875, -7.0159912109375, -6.62359619140625, -6.231201171875, -5.83880615234375, -5.4464111328125, -5.05401611328125, -4.66162109375, -4.26922607421875, -3.8768310546875, -3.48443603515625, -3.092041015625, -2.69964599609375, -2.3072509765625, -1.91485595703125, -1.5224609375, -1.13006591796875, -0.7376708984375, -0.34527587890625, 0.047119140625, 0.43951416015625, 0.8319091796875, 1.22430419921875, 1.61669921875, 2.00909423828125, 2.4014892578125, 2.79388427734375, 3.186279296875, 3.57867431640625, 3.9710693359375, 4.36346435546875, 4.755859375, 5.14825439453125, 5.5406494140625, 5.93304443359375, 6.325439453125, 6.71783447265625, 7.1102294921875, 7.50262451171875, 7.89501953125, 8.28741455078125, 8.6798095703125, 9.07220458984375, 9.464599609375, 9.85699462890625, 10.2493896484375, 10.64178466796875, 11.0341796875, 11.42657470703125, 11.8189697265625, 12.21136474609375, 12.603759765625, 12.99615478515625, 13.3885498046875, 13.78094482421875, 14.17333984375, 14.56573486328125, 14.9581298828125, 15.35052490234375, 15.742919921875, 16.13531494140625, 16.5277099609375, 16.92010498046875, 17.3125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 7.0, 6.0, 6.0, 15.0, 38.0, 54.0, 69.0, 114.0, 192.0, 286.0, 520.0, 903.0, 1766.0, 3362.0, 7600.0, 19516.0, 60099.0, 275154.0, 3272210.0, 431880.0, 78349.0, 24500.0, 9286.0, 4050.0, 1845.0, 1015.0, 555.0, 342.0, 194.0, 120.0, 79.0, 48.0, 28.0, 27.0, 18.0, 7.0, 5.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-69.125, -67.0048828125, -64.884765625, -62.7646484375, -60.64453125, -58.5244140625, -56.404296875, -54.2841796875, -52.1640625, -50.0439453125, -47.923828125, -45.8037109375, -43.68359375, -41.5634765625, -39.443359375, -37.3232421875, -35.203125, -33.0830078125, -30.962890625, -28.8427734375, -26.72265625, -24.6025390625, -22.482421875, -20.3623046875, -18.2421875, -16.1220703125, -14.001953125, -11.8818359375, -9.76171875, -7.6416015625, -5.521484375, -3.4013671875, -1.28125, 0.8388671875, 2.958984375, 5.0791015625, 7.19921875, 9.3193359375, 11.439453125, 13.5595703125, 15.6796875, 17.7998046875, 19.919921875, 22.0400390625, 24.16015625, 26.2802734375, 28.400390625, 30.5205078125, 32.640625, 34.7607421875, 36.880859375, 39.0009765625, 41.12109375, 43.2412109375, 45.361328125, 47.4814453125, 49.6015625, 51.7216796875, 53.841796875, 55.9619140625, 58.08203125, 60.2021484375, 62.322265625, 64.4423828125, 66.5625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 7.0, 9.0, 10.0, 16.0, 15.0, 22.0, 38.0, 60.0, 97.0, 131.0, 199.0, 438.0, 1505.0, 727.0, 285.0, 153.0, 98.0, 74.0, 41.0, 36.0, 22.0, 24.0, 13.0, 10.0, 9.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.8125, -30.869873046875, -29.92724609375, -28.984619140625, -28.0419921875, -27.099365234375, -26.15673828125, -25.214111328125, -24.271484375, -23.328857421875, -22.38623046875, -21.443603515625, -20.5009765625, -19.558349609375, -18.61572265625, -17.673095703125, -16.73046875, -15.787841796875, -14.84521484375, -13.902587890625, -12.9599609375, -12.017333984375, -11.07470703125, -10.132080078125, -9.189453125, -8.246826171875, -7.30419921875, -6.361572265625, -5.4189453125, -4.476318359375, -3.53369140625, -2.591064453125, -1.6484375, -0.705810546875, 0.23681640625, 1.179443359375, 2.1220703125, 3.064697265625, 4.00732421875, 4.949951171875, 5.892578125, 6.835205078125, 7.77783203125, 8.720458984375, 9.6630859375, 10.605712890625, 11.54833984375, 12.490966796875, 13.43359375, 14.376220703125, 15.31884765625, 16.261474609375, 17.2041015625, 18.146728515625, 19.08935546875, 20.031982421875, 20.974609375, 21.917236328125, 22.85986328125, 23.802490234375, 24.7451171875, 25.687744140625, 26.63037109375, 27.572998046875, 28.515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 20.0, 78.0, 135.0, 229.0, 226.0, 174.0, 74.0, 36.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-684.462890625, -671.3668823242188, -658.2708740234375, -645.1748046875, -632.0787963867188, -618.9827880859375, -605.8867797851562, -592.790771484375, -579.6947021484375, -566.5986938476562, -553.502685546875, -540.4066162109375, -527.3106079101562, -514.214599609375, -501.11859130859375, -488.0225524902344, -474.9265441894531, -461.8305358886719, -448.7344970703125, -435.63848876953125, -422.5424499511719, -409.4464416503906, -396.35040283203125, -383.25439453125, -370.15838623046875, -357.0623779296875, -343.9663391113281, -330.8703308105469, -317.7742919921875, -304.67828369140625, -291.582275390625, -278.4862365722656, -265.39019775390625, -252.29417419433594, -239.19815063476562, -226.10214233398438, -213.006103515625, -199.91009521484375, -186.81407165527344, -173.71804809570312, -160.62203979492188, -147.52601623535156, -134.42999267578125, -121.33397674560547, -108.23795318603516, -95.14192962646484, -82.04591369628906, -68.94989013671875, -55.85386657714844, -42.757843017578125, -29.661823272705078, -16.56580352783203, -3.4697799682617188, 9.626243591308594, 22.722259521484375, 35.81828308105469, 48.914306640625, 62.01033020019531, 75.10635375976562, 88.2023696899414, 101.29839324951172, 114.39441680908203, 127.49043273925781, 140.58645629882812, 153.68247985839844]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 14.0, 14.0, 8.0, 9.0, 12.0, 15.0, 18.0, 18.0, 27.0, 25.0, 29.0, 31.0, 28.0, 32.0, 33.0, 35.0, 38.0, 47.0, 39.0, 47.0, 52.0, 24.0, 35.0, 33.0, 39.0, 35.0, 35.0, 26.0, 32.0, 22.0, 19.0, 21.0, 12.0, 16.0, 13.0, 11.0, 9.0, 10.0, 6.0, 5.0, 3.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0], "bins": [-96.74041748046875, -93.87686157226562, -91.01329803466797, -88.14974212646484, -85.28617858886719, -82.42262268066406, -79.55906677246094, -76.69550323486328, -73.83193969726562, -70.9683837890625, -68.10482025146484, -65.24126434326172, -62.37770080566406, -59.51414489746094, -56.65058517456055, -53.787025451660156, -50.92346954345703, -48.05990982055664, -45.19635009765625, -42.332794189453125, -39.46923065185547, -36.605674743652344, -33.74211502075195, -30.878555297851562, -28.014995574951172, -25.15143585205078, -22.28787612915039, -19.424318313598633, -16.560758590698242, -13.697198867797852, -10.833641052246094, -7.970081329345703, -5.1065216064453125, -2.24296236038208, 0.6205968856811523, 3.4841556549072266, 6.347715377807617, 9.211275100708008, 12.074832916259766, 14.938392639160156, 17.801952362060547, 20.665512084960938, 23.529071807861328, 26.392629623413086, 29.256189346313477, 32.1197509765625, 34.983306884765625, 37.846866607666016, 40.710426330566406, 43.5739860534668, 46.43754577636719, 49.30110168457031, 52.16466522216797, 55.028221130371094, 57.891780853271484, 60.755340576171875, 63.618900299072266, 66.48246002197266, 69.34601593017578, 72.20957946777344, 75.07313537597656, 77.93669891357422, 80.80025482177734, 83.663818359375, 86.52737426757812]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 10.0, 5.0, 8.0, 5.0, 18.0, 19.0, 17.0, 41.0, 43.0, 72.0, 112.0, 176.0, 308.0, 661.0, 1398.0, 3211.0, 9049.0, 29547.0, 124192.0, 586522.0, 224545.0, 47015.0, 13104.0, 4604.0, 1906.0, 873.0, 421.0, 236.0, 149.0, 97.0, 51.0, 36.0, 30.0, 19.0, 15.0, 10.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-106.125, -102.876953125, -99.62890625, -96.380859375, -93.1328125, -89.884765625, -86.63671875, -83.388671875, -80.140625, -76.892578125, -73.64453125, -70.396484375, -67.1484375, -63.900390625, -60.65234375, -57.404296875, -54.15625, -50.908203125, -47.66015625, -44.412109375, -41.1640625, -37.916015625, -34.66796875, -31.419921875, -28.171875, -24.923828125, -21.67578125, -18.427734375, -15.1796875, -11.931640625, -8.68359375, -5.435546875, -2.1875, 1.060546875, 4.30859375, 7.556640625, 10.8046875, 14.052734375, 17.30078125, 20.548828125, 23.796875, 27.044921875, 30.29296875, 33.541015625, 36.7890625, 40.037109375, 43.28515625, 46.533203125, 49.78125, 53.029296875, 56.27734375, 59.525390625, 62.7734375, 66.021484375, 69.26953125, 72.517578125, 75.765625, 79.013671875, 82.26171875, 85.509765625, 88.7578125, 92.005859375, 95.25390625, 98.501953125, 101.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 12.0, 17.0, 20.0, 23.0, 30.0, 42.0, 52.0, 43.0, 64.0, 65.0, 73.0, 67.0, 60.0, 72.0, 67.0, 53.0, 54.0, 36.0, 37.0, 22.0, 30.0, 16.0, 14.0, 7.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.71875, -9.309326171875, -8.89990234375, -8.490478515625, -8.0810546875, -7.671630859375, -7.26220703125, -6.852783203125, -6.443359375, -6.033935546875, -5.62451171875, -5.215087890625, -4.8056640625, -4.396240234375, -3.98681640625, -3.577392578125, -3.16796875, -2.758544921875, -2.34912109375, -1.939697265625, -1.5302734375, -1.120849609375, -0.71142578125, -0.302001953125, 0.107421875, 0.516845703125, 0.92626953125, 1.335693359375, 1.7451171875, 2.154541015625, 2.56396484375, 2.973388671875, 3.3828125, 3.792236328125, 4.20166015625, 4.611083984375, 5.0205078125, 5.429931640625, 5.83935546875, 6.248779296875, 6.658203125, 7.067626953125, 7.47705078125, 7.886474609375, 8.2958984375, 8.705322265625, 9.11474609375, 9.524169921875, 9.93359375, 10.343017578125, 10.75244140625, 11.161865234375, 11.5712890625, 11.980712890625, 12.39013671875, 12.799560546875, 13.208984375, 13.618408203125, 14.02783203125, 14.437255859375, 14.8466796875, 15.256103515625, 15.66552734375, 16.074951171875, 16.484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 10.0, 18.0, 24.0, 29.0, 53.0, 66.0, 131.0, 170.0, 283.0, 498.0, 900.0, 1691.0, 3623.0, 9070.0, 30584.0, 130599.0, 569055.0, 230399.0, 48232.0, 13315.0, 4867.0, 2139.0, 1143.0, 615.0, 376.0, 223.0, 159.0, 85.0, 53.0, 42.0, 24.0, 23.0, 10.0, 13.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-104.9375, -102.2919921875, -99.646484375, -97.0009765625, -94.35546875, -91.7099609375, -89.064453125, -86.4189453125, -83.7734375, -81.1279296875, -78.482421875, -75.8369140625, -73.19140625, -70.5458984375, -67.900390625, -65.2548828125, -62.609375, -59.9638671875, -57.318359375, -54.6728515625, -52.02734375, -49.3818359375, -46.736328125, -44.0908203125, -41.4453125, -38.7998046875, -36.154296875, -33.5087890625, -30.86328125, -28.2177734375, -25.572265625, -22.9267578125, -20.28125, -17.6357421875, -14.990234375, -12.3447265625, -9.69921875, -7.0537109375, -4.408203125, -1.7626953125, 0.8828125, 3.5283203125, 6.173828125, 8.8193359375, 11.46484375, 14.1103515625, 16.755859375, 19.4013671875, 22.046875, 24.6923828125, 27.337890625, 29.9833984375, 32.62890625, 35.2744140625, 37.919921875, 40.5654296875, 43.2109375, 45.8564453125, 48.501953125, 51.1474609375, 53.79296875, 56.4384765625, 59.083984375, 61.7294921875, 64.375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 7.0, 6.0, 11.0, 16.0, 10.0, 19.0, 18.0, 19.0, 26.0, 32.0, 33.0, 35.0, 33.0, 49.0, 37.0, 44.0, 48.0, 44.0, 39.0, 39.0, 56.0, 31.0, 50.0, 25.0, 21.0, 37.0, 34.0, 22.0, 19.0, 15.0, 27.0, 20.0, 16.0, 12.0, 2.0, 7.0, 12.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.59375, -30.4697265625, -29.345703125, -28.2216796875, -27.09765625, -25.9736328125, -24.849609375, -23.7255859375, -22.6015625, -21.4775390625, -20.353515625, -19.2294921875, -18.10546875, -16.9814453125, -15.857421875, -14.7333984375, -13.609375, -12.4853515625, -11.361328125, -10.2373046875, -9.11328125, -7.9892578125, -6.865234375, -5.7412109375, -4.6171875, -3.4931640625, -2.369140625, -1.2451171875, -0.12109375, 1.0029296875, 2.126953125, 3.2509765625, 4.375, 5.4990234375, 6.623046875, 7.7470703125, 8.87109375, 9.9951171875, 11.119140625, 12.2431640625, 13.3671875, 14.4912109375, 15.615234375, 16.7392578125, 17.86328125, 18.9873046875, 20.111328125, 21.2353515625, 22.359375, 23.4833984375, 24.607421875, 25.7314453125, 26.85546875, 27.9794921875, 29.103515625, 30.2275390625, 31.3515625, 32.4755859375, 33.599609375, 34.7236328125, 35.84765625, 36.9716796875, 38.095703125, 39.2197265625, 40.34375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 2.0, 8.0, 6.0, 10.0, 18.0, 33.0, 38.0, 59.0, 92.0, 159.0, 285.0, 488.0, 1045.0, 2558.0, 8935.0, 97794.0, 874453.0, 51792.0, 6600.0, 2193.0, 947.0, 410.0, 252.0, 99.0, 84.0, 65.0, 34.0, 30.0, 16.0, 10.0, 6.0, 13.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-90.125, -87.6494140625, -85.173828125, -82.6982421875, -80.22265625, -77.7470703125, -75.271484375, -72.7958984375, -70.3203125, -67.8447265625, -65.369140625, -62.8935546875, -60.41796875, -57.9423828125, -55.466796875, -52.9912109375, -50.515625, -48.0400390625, -45.564453125, -43.0888671875, -40.61328125, -38.1376953125, -35.662109375, -33.1865234375, -30.7109375, -28.2353515625, -25.759765625, -23.2841796875, -20.80859375, -18.3330078125, -15.857421875, -13.3818359375, -10.90625, -8.4306640625, -5.955078125, -3.4794921875, -1.00390625, 1.4716796875, 3.947265625, 6.4228515625, 8.8984375, 11.3740234375, 13.849609375, 16.3251953125, 18.80078125, 21.2763671875, 23.751953125, 26.2275390625, 28.703125, 31.1787109375, 33.654296875, 36.1298828125, 38.60546875, 41.0810546875, 43.556640625, 46.0322265625, 48.5078125, 50.9833984375, 53.458984375, 55.9345703125, 58.41015625, 60.8857421875, 63.361328125, 65.8369140625, 68.3125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 9.0, 13.0, 6.0, 12.0, 15.0, 28.0, 37.0, 69.0, 99.0, 172.0, 180.0, 115.0, 74.0, 45.0, 29.0, 20.0, 28.0, 9.0, 8.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005992889404296875, -0.0057623982429504395, -0.005531907081604004, -0.005301415920257568, -0.005070924758911133, -0.004840433597564697, -0.004609942436218262, -0.004379451274871826, -0.004148960113525391, -0.003918468952178955, -0.0036879777908325195, -0.003457486629486084, -0.0032269954681396484, -0.002996504306793213, -0.0027660131454467773, -0.002535521984100342, -0.0023050308227539062, -0.0020745396614074707, -0.0018440485000610352, -0.0016135573387145996, -0.001383066177368164, -0.0011525750160217285, -0.000922083854675293, -0.0006915926933288574, -0.0004611015319824219, -0.00023061037063598633, -1.1920928955078125e-07, 0.00023037195205688477, 0.0004608631134033203, 0.0006913542747497559, 0.0009218454360961914, 0.001152336597442627, 0.0013828277587890625, 0.001613318920135498, 0.0018438100814819336, 0.002074301242828369, 0.0023047924041748047, 0.0025352835655212402, 0.0027657747268676758, 0.0029962658882141113, 0.003226757049560547, 0.0034572482109069824, 0.003687739372253418, 0.0039182305335998535, 0.004148721694946289, 0.004379212856292725, 0.00460970401763916, 0.004840195178985596, 0.005070686340332031, 0.005301177501678467, 0.005531668663024902, 0.005762159824371338, 0.0059926509857177734, 0.006223142147064209, 0.0064536333084106445, 0.00668412446975708, 0.006914615631103516, 0.007145106792449951, 0.007375597953796387, 0.007606089115142822, 0.007836580276489258, 0.008067071437835693, 0.008297562599182129, 0.008528053760528564, 0.008758544921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 8.0, 8.0, 17.0, 27.0, 28.0, 48.0, 68.0, 117.0, 206.0, 428.0, 1066.0, 3109.0, 14466.0, 696757.0, 317386.0, 10527.0, 2510.0, 939.0, 361.0, 177.0, 104.0, 59.0, 47.0, 36.0, 22.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.0, -98.9013671875, -95.802734375, -92.7041015625, -89.60546875, -86.5068359375, -83.408203125, -80.3095703125, -77.2109375, -74.1123046875, -71.013671875, -67.9150390625, -64.81640625, -61.7177734375, -58.619140625, -55.5205078125, -52.421875, -49.3232421875, -46.224609375, -43.1259765625, -40.02734375, -36.9287109375, -33.830078125, -30.7314453125, -27.6328125, -24.5341796875, -21.435546875, -18.3369140625, -15.23828125, -12.1396484375, -9.041015625, -5.9423828125, -2.84375, 0.2548828125, 3.353515625, 6.4521484375, 9.55078125, 12.6494140625, 15.748046875, 18.8466796875, 21.9453125, 25.0439453125, 28.142578125, 31.2412109375, 34.33984375, 37.4384765625, 40.537109375, 43.6357421875, 46.734375, 49.8330078125, 52.931640625, 56.0302734375, 59.12890625, 62.2275390625, 65.326171875, 68.4248046875, 71.5234375, 74.6220703125, 77.720703125, 80.8193359375, 83.91796875, 87.0166015625, 90.115234375, 93.2138671875, 96.3125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 10.0, 3.0, 4.0, 10.0, 11.0, 30.0, 43.0, 82.0, 170.0, 237.0, 183.0, 104.0, 41.0, 26.0, 14.0, 14.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.03125, -46.64599609375, -45.2607421875, -43.87548828125, -42.490234375, -41.10498046875, -39.7197265625, -38.33447265625, -36.94921875, -35.56396484375, -34.1787109375, -32.79345703125, -31.408203125, -30.02294921875, -28.6376953125, -27.25244140625, -25.8671875, -24.48193359375, -23.0966796875, -21.71142578125, -20.326171875, -18.94091796875, -17.5556640625, -16.17041015625, -14.78515625, -13.39990234375, -12.0146484375, -10.62939453125, -9.244140625, -7.85888671875, -6.4736328125, -5.08837890625, -3.703125, -2.31787109375, -0.9326171875, 0.45263671875, 1.837890625, 3.22314453125, 4.6083984375, 5.99365234375, 7.37890625, 8.76416015625, 10.1494140625, 11.53466796875, 12.919921875, 14.30517578125, 15.6904296875, 17.07568359375, 18.4609375, 19.84619140625, 21.2314453125, 22.61669921875, 24.001953125, 25.38720703125, 26.7724609375, 28.15771484375, 29.54296875, 30.92822265625, 32.3134765625, 33.69873046875, 35.083984375, 36.46923828125, 37.8544921875, 39.23974609375, 40.625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 21.0, 27.0, 60.0, 136.0, 206.0, 200.0, 160.0, 96.0, 49.0, 21.0, 9.0, 5.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-867.89501953125, -845.2411499023438, -822.5872802734375, -799.9334716796875, -777.2796020507812, -754.625732421875, -731.9718627929688, -709.3179931640625, -686.6641845703125, -664.0103149414062, -641.3564453125, -618.70263671875, -596.0487670898438, -573.3948974609375, -550.7410278320312, -528.087158203125, -505.43328857421875, -482.7794189453125, -460.1255798339844, -437.4717102050781, -414.81787109375, -392.16400146484375, -369.5101318359375, -346.85626220703125, -324.2024230957031, -301.5485534667969, -278.89471435546875, -256.2408447265625, -233.5869903564453, -210.93313598632812, -188.27926635742188, -165.6254119873047, -142.9715576171875, -120.31770324707031, -97.6638412475586, -75.00997924804688, -52.35612487792969, -29.7022705078125, -7.04840087890625, 15.605453491210938, 38.259307861328125, 60.91316604614258, 83.56702423095703, 106.22088623046875, 128.87474060058594, 151.52859497070312, 174.18246459960938, 196.83631896972656, 219.49017333984375, 242.14402770996094, 264.7978820800781, 287.4517517089844, 310.1055908203125, 332.75946044921875, 355.413330078125, 378.06719970703125, 400.7210388183594, 423.3749084472656, 446.02874755859375, 468.6826171875, 491.33648681640625, 513.9903564453125, 536.6441650390625, 559.2980346679688, 581.951904296875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 6.0, 9.0, 15.0, 9.0, 17.0, 17.0, 25.0, 22.0, 20.0, 25.0, 28.0, 24.0, 50.0, 41.0, 39.0, 38.0, 37.0, 50.0, 37.0, 47.0, 30.0, 36.0, 33.0, 41.0, 30.0, 32.0, 28.0, 32.0, 33.0, 26.0, 21.0, 17.0, 7.0, 7.0, 16.0, 11.0, 6.0, 3.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-168.54010009765625, -162.70712280273438, -156.8741455078125, -151.04115295410156, -145.2081756591797, -139.3751983642578, -133.54222106933594, -127.70923614501953, -121.87625122070312, -116.04327392578125, -110.21028900146484, -104.37731170654297, -98.54432678222656, -92.71134948730469, -86.87837219238281, -81.0453872680664, -75.21240997314453, -69.37943267822266, -63.54644775390625, -57.713470458984375, -51.88048553466797, -46.047508239746094, -40.21452713012695, -34.38154602050781, -28.548564910888672, -22.71558380126953, -16.88260269165039, -11.049623489379883, -5.216642379760742, 0.6163387298583984, 6.449317932128906, 12.282299041748047, 18.115280151367188, 23.948261260986328, 29.78124237060547, 35.614219665527344, 41.44720458984375, 47.280181884765625, 53.113162994384766, 58.946144104003906, 64.77912902832031, 70.61210632324219, 76.4450912475586, 82.27806854248047, 88.11105346679688, 93.94403076171875, 99.77700805664062, 105.60999298095703, 111.4429702758789, 117.27594757080078, 123.10893249511719, 128.94190979003906, 134.77488708496094, 140.60787963867188, 146.44085693359375, 152.27383422851562, 158.1068115234375, 163.93978881835938, 169.77276611328125, 175.6057586669922, 181.43873596191406, 187.27171325683594, 193.1046905517578, 198.93768310546875, 204.77066040039062]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 7.0, 12.0, 10.0, 23.0, 26.0, 60.0, 66.0, 118.0, 219.0, 497.0, 1172.0, 3104.0, 10251.0, 44525.0, 773574.0, 3284950.0, 57107.0, 12372.0, 3639.0, 1325.0, 553.0, 256.0, 163.0, 73.0, 52.0, 34.0, 26.0, 17.0, 21.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.125, -151.796875, -147.46875, -143.140625, -138.8125, -134.484375, -130.15625, -125.828125, -121.5, -117.171875, -112.84375, -108.515625, -104.1875, -99.859375, -95.53125, -91.203125, -86.875, -82.546875, -78.21875, -73.890625, -69.5625, -65.234375, -60.90625, -56.578125, -52.25, -47.921875, -43.59375, -39.265625, -34.9375, -30.609375, -26.28125, -21.953125, -17.625, -13.296875, -8.96875, -4.640625, -0.3125, 4.015625, 8.34375, 12.671875, 17.0, 21.328125, 25.65625, 29.984375, 34.3125, 38.640625, 42.96875, 47.296875, 51.625, 55.953125, 60.28125, 64.609375, 68.9375, 73.265625, 77.59375, 81.921875, 86.25, 90.578125, 94.90625, 99.234375, 103.5625, 107.890625, 112.21875, 116.546875, 120.875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 5.0, 17.0, 18.0, 17.0, 27.0, 37.0, 47.0, 56.0, 48.0, 65.0, 61.0, 66.0, 66.0, 68.0, 68.0, 65.0, 52.0, 48.0, 30.0, 39.0, 26.0, 17.0, 16.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.0013427734375, -9.588623046875, -9.1759033203125, -8.76318359375, -8.3504638671875, -7.937744140625, -7.5250244140625, -7.1123046875, -6.6995849609375, -6.286865234375, -5.8741455078125, -5.46142578125, -5.0487060546875, -4.635986328125, -4.2232666015625, -3.810546875, -3.3978271484375, -2.985107421875, -2.5723876953125, -2.15966796875, -1.7469482421875, -1.334228515625, -0.9215087890625, -0.5087890625, -0.0960693359375, 0.316650390625, 0.7293701171875, 1.14208984375, 1.5548095703125, 1.967529296875, 2.3802490234375, 2.79296875, 3.2056884765625, 3.618408203125, 4.0311279296875, 4.44384765625, 4.8565673828125, 5.269287109375, 5.6820068359375, 6.0947265625, 6.5074462890625, 6.920166015625, 7.3328857421875, 7.74560546875, 8.1583251953125, 8.571044921875, 8.9837646484375, 9.396484375, 9.8092041015625, 10.221923828125, 10.6346435546875, 11.04736328125, 11.4600830078125, 11.872802734375, 12.2855224609375, 12.6982421875, 13.1109619140625, 13.523681640625, 13.9364013671875, 14.34912109375, 14.7618408203125, 15.174560546875, 15.5872802734375, 16.0]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 16.0, 26.0, 29.0, 55.0, 83.0, 133.0, 231.0, 424.0, 863.0, 1662.0, 3544.0, 7902.0, 19614.0, 56999.0, 245600.0, 3393386.0, 352906.0, 69997.0, 23511.0, 9367.0, 4066.0, 1812.0, 890.0, 476.0, 268.0, 170.0, 96.0, 51.0, 32.0, 27.0, 16.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -44.73291015625, -42.5595703125, -40.38623046875, -38.212890625, -36.03955078125, -33.8662109375, -31.69287109375, -29.51953125, -27.34619140625, -25.1728515625, -22.99951171875, -20.826171875, -18.65283203125, -16.4794921875, -14.30615234375, -12.1328125, -9.95947265625, -7.7861328125, -5.61279296875, -3.439453125, -1.26611328125, 0.9072265625, 3.08056640625, 5.25390625, 7.42724609375, 9.6005859375, 11.77392578125, 13.947265625, 16.12060546875, 18.2939453125, 20.46728515625, 22.640625, 24.81396484375, 26.9873046875, 29.16064453125, 31.333984375, 33.50732421875, 35.6806640625, 37.85400390625, 40.02734375, 42.20068359375, 44.3740234375, 46.54736328125, 48.720703125, 50.89404296875, 53.0673828125, 55.24072265625, 57.4140625, 59.58740234375, 61.7607421875, 63.93408203125, 66.107421875, 68.28076171875, 70.4541015625, 72.62744140625, 74.80078125, 76.97412109375, 79.1474609375, 81.32080078125, 83.494140625, 85.66748046875, 87.8408203125, 90.01416015625, 92.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 3.0, 6.0, 15.0, 23.0, 41.0, 61.0, 46.0, 79.0, 121.0, 271.0, 853.0, 1613.0, 383.0, 183.0, 83.0, 75.0, 57.0, 40.0, 25.0, 14.0, 14.0, 14.0, 10.0, 9.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.171875, -20.295654296875, -19.41943359375, -18.543212890625, -17.6669921875, -16.790771484375, -15.91455078125, -15.038330078125, -14.162109375, -13.285888671875, -12.40966796875, -11.533447265625, -10.6572265625, -9.781005859375, -8.90478515625, -8.028564453125, -7.15234375, -6.276123046875, -5.39990234375, -4.523681640625, -3.6474609375, -2.771240234375, -1.89501953125, -1.018798828125, -0.142578125, 0.733642578125, 1.60986328125, 2.486083984375, 3.3623046875, 4.238525390625, 5.11474609375, 5.990966796875, 6.8671875, 7.743408203125, 8.61962890625, 9.495849609375, 10.3720703125, 11.248291015625, 12.12451171875, 13.000732421875, 13.876953125, 14.753173828125, 15.62939453125, 16.505615234375, 17.3818359375, 18.258056640625, 19.13427734375, 20.010498046875, 20.88671875, 21.762939453125, 22.63916015625, 23.515380859375, 24.3916015625, 25.267822265625, 26.14404296875, 27.020263671875, 27.896484375, 28.772705078125, 29.64892578125, 30.525146484375, 31.4013671875, 32.277587890625, 33.15380859375, 34.030029296875, 34.90625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 22.0, 62.0, 166.0, 250.0, 234.0, 142.0, 73.0, 26.0, 13.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-558.0977172851562, -545.6300048828125, -533.1622924804688, -520.694580078125, -508.2268981933594, -495.7591857910156, -483.29150390625, -470.82379150390625, -458.3560791015625, -445.88836669921875, -433.4206848144531, -420.9529724121094, -408.4852600097656, -396.0175476074219, -383.54986572265625, -371.0821533203125, -358.61444091796875, -346.146728515625, -333.6790466308594, -321.2113342285156, -308.7436218261719, -296.2759094238281, -283.8082275390625, -271.34051513671875, -258.8728332519531, -246.40513610839844, -233.9374237060547, -221.4697265625, -209.00201416015625, -196.53431701660156, -184.06661987304688, -171.59890747070312, -159.13121032714844, -146.66351318359375, -134.19580078125, -121.72810363769531, -109.26039123535156, -96.79269409179688, -84.32498931884766, -71.85728454589844, -59.38957977294922, -46.921875, -34.45417022705078, -21.986469268798828, -9.51876449584961, 2.9489402770996094, 15.416641235351562, 27.88434600830078, 40.35205078125, 52.81975555419922, 65.28746032714844, 77.75515747070312, 90.22286987304688, 102.69056701660156, 115.15827178955078, 127.6259765625, 140.09368896484375, 152.56138610839844, 165.0290985107422, 177.49679565429688, 189.96450805664062, 202.4322052001953, 214.89990234375, 227.36761474609375, 239.83531188964844]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 10.0, 10.0, 20.0, 14.0, 16.0, 23.0, 29.0, 21.0, 37.0, 46.0, 47.0, 52.0, 43.0, 59.0, 49.0, 45.0, 62.0, 47.0, 51.0, 48.0, 39.0, 42.0, 34.0, 35.0, 25.0, 21.0, 18.0, 12.0, 11.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-131.56179809570312, -128.248046875, -124.93431091308594, -121.62055969238281, -118.30681610107422, -114.99307250976562, -111.6793212890625, -108.3655776977539, -105.05183410644531, -101.73809051513672, -98.42434692382812, -95.110595703125, -91.7968521118164, -88.48310852050781, -85.16935729980469, -81.8556137084961, -78.5418701171875, -75.2281265258789, -71.91438293457031, -68.60063171386719, -65.2868881225586, -61.97314453125, -58.65939712524414, -55.34564971923828, -52.03190612792969, -48.718162536621094, -45.404415130615234, -42.090667724609375, -38.77692413330078, -35.46318054199219, -32.14943313598633, -28.8356876373291, -25.521942138671875, -22.20819664001465, -18.894451141357422, -15.580705642700195, -12.266960144042969, -8.953214645385742, -5.639469146728516, -2.325723648071289, 0.9880218505859375, 4.301767349243164, 7.615512847900391, 10.929258346557617, 14.243003845214844, 17.55674934387207, 20.870494842529297, 24.184240341186523, 27.49798583984375, 30.811731338500977, 34.1254768371582, 37.43922424316406, 40.752967834472656, 44.06671142578125, 47.38045883178711, 50.69420623779297, 54.00794982910156, 57.321693420410156, 60.635440826416016, 63.949188232421875, 67.26293182373047, 70.57667541503906, 73.89042663574219, 77.20417022705078, 80.51791381835938]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 15.0, 14.0, 18.0, 31.0, 41.0, 56.0, 95.0, 130.0, 262.0, 472.0, 994.0, 2770.0, 8621.0, 31629.0, 134480.0, 607042.0, 200624.0, 43797.0, 11262.0, 3490.0, 1349.0, 579.0, 322.0, 165.0, 95.0, 64.0, 44.0, 30.0, 16.0, 12.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.6875, -79.693359375, -76.69921875, -73.705078125, -70.7109375, -67.716796875, -64.72265625, -61.728515625, -58.734375, -55.740234375, -52.74609375, -49.751953125, -46.7578125, -43.763671875, -40.76953125, -37.775390625, -34.78125, -31.787109375, -28.79296875, -25.798828125, -22.8046875, -19.810546875, -16.81640625, -13.822265625, -10.828125, -7.833984375, -4.83984375, -1.845703125, 1.1484375, 4.142578125, 7.13671875, 10.130859375, 13.125, 16.119140625, 19.11328125, 22.107421875, 25.1015625, 28.095703125, 31.08984375, 34.083984375, 37.078125, 40.072265625, 43.06640625, 46.060546875, 49.0546875, 52.048828125, 55.04296875, 58.037109375, 61.03125, 64.025390625, 67.01953125, 70.013671875, 73.0078125, 76.001953125, 78.99609375, 81.990234375, 84.984375, 87.978515625, 90.97265625, 93.966796875, 96.9609375, 99.955078125, 102.94921875, 105.943359375, 108.9375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 5.0, 13.0, 20.0, 22.0, 26.0, 32.0, 49.0, 31.0, 39.0, 44.0, 62.0, 63.0, 73.0, 49.0, 65.0, 67.0, 54.0, 47.0, 49.0, 34.0, 44.0, 26.0, 14.0, 20.0, 15.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9140625, -9.5032958984375, -9.092529296875, -8.6817626953125, -8.27099609375, -7.8602294921875, -7.449462890625, -7.0386962890625, -6.6279296875, -6.2171630859375, -5.806396484375, -5.3956298828125, -4.98486328125, -4.5740966796875, -4.163330078125, -3.7525634765625, -3.341796875, -2.9310302734375, -2.520263671875, -2.1094970703125, -1.69873046875, -1.2879638671875, -0.877197265625, -0.4664306640625, -0.0556640625, 0.3551025390625, 0.765869140625, 1.1766357421875, 1.58740234375, 1.9981689453125, 2.408935546875, 2.8197021484375, 3.23046875, 3.6412353515625, 4.052001953125, 4.4627685546875, 4.87353515625, 5.2843017578125, 5.695068359375, 6.1058349609375, 6.5166015625, 6.9273681640625, 7.338134765625, 7.7489013671875, 8.15966796875, 8.5704345703125, 8.981201171875, 9.3919677734375, 9.802734375, 10.2135009765625, 10.624267578125, 11.0350341796875, 11.44580078125, 11.8565673828125, 12.267333984375, 12.6781005859375, 13.0888671875, 13.4996337890625, 13.910400390625, 14.3211669921875, 14.73193359375, 15.1427001953125, 15.553466796875, 15.9642333984375, 16.375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 9.0, 11.0, 10.0, 18.0, 30.0, 49.0, 67.0, 114.0, 169.0, 314.0, 574.0, 1240.0, 2937.0, 7496.0, 21829.0, 64155.0, 223559.0, 492767.0, 158052.0, 48220.0, 16468.0, 5869.0, 2297.0, 1029.0, 500.0, 258.0, 157.0, 106.0, 61.0, 51.0, 40.0, 21.0, 16.0, 16.0, 9.0, 10.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.25, -46.4873046875, -44.724609375, -42.9619140625, -41.19921875, -39.4365234375, -37.673828125, -35.9111328125, -34.1484375, -32.3857421875, -30.623046875, -28.8603515625, -27.09765625, -25.3349609375, -23.572265625, -21.8095703125, -20.046875, -18.2841796875, -16.521484375, -14.7587890625, -12.99609375, -11.2333984375, -9.470703125, -7.7080078125, -5.9453125, -4.1826171875, -2.419921875, -0.6572265625, 1.10546875, 2.8681640625, 4.630859375, 6.3935546875, 8.15625, 9.9189453125, 11.681640625, 13.4443359375, 15.20703125, 16.9697265625, 18.732421875, 20.4951171875, 22.2578125, 24.0205078125, 25.783203125, 27.5458984375, 29.30859375, 31.0712890625, 32.833984375, 34.5966796875, 36.359375, 38.1220703125, 39.884765625, 41.6474609375, 43.41015625, 45.1728515625, 46.935546875, 48.6982421875, 50.4609375, 52.2236328125, 53.986328125, 55.7490234375, 57.51171875, 59.2744140625, 61.037109375, 62.7998046875, 64.5625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 2.0, 3.0, 2.0, 7.0, 7.0, 8.0, 14.0, 20.0, 18.0, 27.0, 34.0, 35.0, 31.0, 39.0, 54.0, 44.0, 48.0, 45.0, 52.0, 60.0, 60.0, 44.0, 38.0, 44.0, 39.0, 30.0, 27.0, 22.0, 24.0, 25.0, 25.0, 14.0, 14.0, 8.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.875, -37.4736328125, -36.072265625, -34.6708984375, -33.26953125, -31.8681640625, -30.466796875, -29.0654296875, -27.6640625, -26.2626953125, -24.861328125, -23.4599609375, -22.05859375, -20.6572265625, -19.255859375, -17.8544921875, -16.453125, -15.0517578125, -13.650390625, -12.2490234375, -10.84765625, -9.4462890625, -8.044921875, -6.6435546875, -5.2421875, -3.8408203125, -2.439453125, -1.0380859375, 0.36328125, 1.7646484375, 3.166015625, 4.5673828125, 5.96875, 7.3701171875, 8.771484375, 10.1728515625, 11.57421875, 12.9755859375, 14.376953125, 15.7783203125, 17.1796875, 18.5810546875, 19.982421875, 21.3837890625, 22.78515625, 24.1865234375, 25.587890625, 26.9892578125, 28.390625, 29.7919921875, 31.193359375, 32.5947265625, 33.99609375, 35.3974609375, 36.798828125, 38.2001953125, 39.6015625, 41.0029296875, 42.404296875, 43.8056640625, 45.20703125, 46.6083984375, 48.009765625, 49.4111328125, 50.8125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 7.0, 7.0, 16.0, 14.0, 20.0, 23.0, 27.0, 51.0, 66.0, 130.0, 206.0, 346.0, 734.0, 1526.0, 3880.0, 10108.0, 33334.0, 141742.0, 511671.0, 262355.0, 56852.0, 15632.0, 5438.0, 2206.0, 962.0, 465.0, 237.0, 157.0, 88.0, 73.0, 53.0, 34.0, 22.0, 22.0, 11.0, 2.0, 5.0, 5.0, 1.0, 5.0, 0.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.5625, -20.783935546875, -20.00537109375, -19.226806640625, -18.4482421875, -17.669677734375, -16.89111328125, -16.112548828125, -15.333984375, -14.555419921875, -13.77685546875, -12.998291015625, -12.2197265625, -11.441162109375, -10.66259765625, -9.884033203125, -9.10546875, -8.326904296875, -7.54833984375, -6.769775390625, -5.9912109375, -5.212646484375, -4.43408203125, -3.655517578125, -2.876953125, -2.098388671875, -1.31982421875, -0.541259765625, 0.2373046875, 1.015869140625, 1.79443359375, 2.572998046875, 3.3515625, 4.130126953125, 4.90869140625, 5.687255859375, 6.4658203125, 7.244384765625, 8.02294921875, 8.801513671875, 9.580078125, 10.358642578125, 11.13720703125, 11.915771484375, 12.6943359375, 13.472900390625, 14.25146484375, 15.030029296875, 15.80859375, 16.587158203125, 17.36572265625, 18.144287109375, 18.9228515625, 19.701416015625, 20.47998046875, 21.258544921875, 22.037109375, 22.815673828125, 23.59423828125, 24.372802734375, 25.1513671875, 25.929931640625, 26.70849609375, 27.487060546875, 28.265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 11.0, 6.0, 15.0, 23.0, 47.0, 76.0, 143.0, 253.0, 217.0, 95.0, 46.0, 27.0, 17.0, 11.0, 3.0, 4.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0129241943359375, -0.012634813785552979, -0.012345433235168457, -0.012056052684783936, -0.011766672134399414, -0.011477291584014893, -0.011187911033630371, -0.01089853048324585, -0.010609149932861328, -0.010319769382476807, -0.010030388832092285, -0.009741008281707764, -0.009451627731323242, -0.00916224718093872, -0.0088728666305542, -0.008583486080169678, -0.008294105529785156, -0.008004724979400635, -0.007715344429016113, -0.007425963878631592, -0.00713658332824707, -0.006847202777862549, -0.006557822227478027, -0.006268441677093506, -0.005979061126708984, -0.005689680576324463, -0.005400300025939941, -0.00511091947555542, -0.0048215389251708984, -0.004532158374786377, -0.0042427778244018555, -0.003953397274017334, -0.0036640167236328125, -0.003374636173248291, -0.0030852556228637695, -0.002795875072479248, -0.0025064945220947266, -0.002217113971710205, -0.0019277334213256836, -0.0016383528709411621, -0.0013489723205566406, -0.0010595917701721191, -0.0007702112197875977, -0.00048083066940307617, -0.0001914501190185547, 9.79304313659668e-05, 0.0003873109817504883, 0.0006766915321350098, 0.0009660720825195312, 0.0012554526329040527, 0.0015448331832885742, 0.0018342137336730957, 0.002123594284057617, 0.0024129748344421387, 0.00270235538482666, 0.0029917359352111816, 0.003281116485595703, 0.0035704970359802246, 0.003859877586364746, 0.004149258136749268, 0.004438638687133789, 0.0047280192375183105, 0.005017399787902832, 0.0053067803382873535, 0.005596160888671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 12.0, 21.0, 46.0, 82.0, 142.0, 328.0, 805.0, 2656.0, 12512.0, 103031.0, 763007.0, 145146.0, 16057.0, 3119.0, 892.0, 345.0, 173.0, 74.0, 47.0, 29.0, 14.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0625, -43.830078125, -42.59765625, -41.365234375, -40.1328125, -38.900390625, -37.66796875, -36.435546875, -35.203125, -33.970703125, -32.73828125, -31.505859375, -30.2734375, -29.041015625, -27.80859375, -26.576171875, -25.34375, -24.111328125, -22.87890625, -21.646484375, -20.4140625, -19.181640625, -17.94921875, -16.716796875, -15.484375, -14.251953125, -13.01953125, -11.787109375, -10.5546875, -9.322265625, -8.08984375, -6.857421875, -5.625, -4.392578125, -3.16015625, -1.927734375, -0.6953125, 0.537109375, 1.76953125, 3.001953125, 4.234375, 5.466796875, 6.69921875, 7.931640625, 9.1640625, 10.396484375, 11.62890625, 12.861328125, 14.09375, 15.326171875, 16.55859375, 17.791015625, 19.0234375, 20.255859375, 21.48828125, 22.720703125, 23.953125, 25.185546875, 26.41796875, 27.650390625, 28.8828125, 30.115234375, 31.34765625, 32.580078125, 33.8125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 4.0, 3.0, 11.0, 11.0, 14.0, 24.0, 31.0, 32.0, 74.0, 83.0, 97.0, 98.0, 126.0, 82.0, 83.0, 61.0, 53.0, 15.0, 15.0, 14.0, 12.0, 12.0, 4.0, 7.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8125, -20.17822265625, -19.5439453125, -18.90966796875, -18.275390625, -17.64111328125, -17.0068359375, -16.37255859375, -15.73828125, -15.10400390625, -14.4697265625, -13.83544921875, -13.201171875, -12.56689453125, -11.9326171875, -11.29833984375, -10.6640625, -10.02978515625, -9.3955078125, -8.76123046875, -8.126953125, -7.49267578125, -6.8583984375, -6.22412109375, -5.58984375, -4.95556640625, -4.3212890625, -3.68701171875, -3.052734375, -2.41845703125, -1.7841796875, -1.14990234375, -0.515625, 0.11865234375, 0.7529296875, 1.38720703125, 2.021484375, 2.65576171875, 3.2900390625, 3.92431640625, 4.55859375, 5.19287109375, 5.8271484375, 6.46142578125, 7.095703125, 7.72998046875, 8.3642578125, 8.99853515625, 9.6328125, 10.26708984375, 10.9013671875, 11.53564453125, 12.169921875, 12.80419921875, 13.4384765625, 14.07275390625, 14.70703125, 15.34130859375, 15.9755859375, 16.60986328125, 17.244140625, 17.87841796875, 18.5126953125, 19.14697265625, 19.78125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 18.0, 40.0, 115.0, 194.0, 236.0, 201.0, 117.0, 57.0, 16.0, 7.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-896.938720703125, -874.2700805664062, -851.6015014648438, -828.932861328125, -806.2642822265625, -783.5956420898438, -760.927001953125, -738.2584228515625, -715.5897827148438, -692.921142578125, -670.2525634765625, -647.5839233398438, -624.915283203125, -602.2467041015625, -579.5780639648438, -556.909423828125, -534.2408447265625, -511.5722351074219, -488.90362548828125, -466.2349853515625, -443.5663757324219, -420.89776611328125, -398.2291259765625, -375.5605163574219, -352.89190673828125, -330.2232971191406, -307.5546875, -284.88604736328125, -262.2174377441406, -239.548828125, -216.8802032470703, -194.21157836914062, -171.54290771484375, -148.87429809570312, -126.20567321777344, -103.53705596923828, -80.86843872070312, -58.19982147216797, -35.53120422363281, -12.862579345703125, 9.8060302734375, 32.474647521972656, 55.14326477050781, 77.81188201904297, 100.48049926757812, 123.14911651611328, 145.81773376464844, 168.48635864257812, 191.15496826171875, 213.82357788085938, 236.49220275878906, 259.16082763671875, 281.8294372558594, 304.498046875, 327.16668701171875, 349.8352966308594, 372.50390625, 395.1725158691406, 417.84112548828125, 440.509765625, 463.1783752441406, 485.84698486328125, 508.515625, 531.1842041015625, 553.8528442382812]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 3.0, 7.0, 5.0, 7.0, 14.0, 13.0, 17.0, 14.0, 19.0, 24.0, 29.0, 30.0, 29.0, 43.0, 31.0, 35.0, 41.0, 41.0, 36.0, 36.0, 30.0, 40.0, 42.0, 44.0, 35.0, 36.0, 26.0, 27.0, 32.0, 28.0, 30.0, 21.0, 25.0, 13.0, 19.0, 13.0, 12.0, 9.0, 5.0, 5.0, 6.0, 7.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-166.53012084960938, -161.3583221435547, -156.1865234375, -151.01470947265625, -145.84291076660156, -140.67111206054688, -135.4993133544922, -130.3275146484375, -125.15570831298828, -119.9839096069336, -114.81210327148438, -109.64030456542969, -104.468505859375, -99.29669952392578, -94.1249008178711, -88.95309448242188, -83.78129577636719, -78.6094970703125, -73.43769073486328, -68.2658920288086, -63.09408950805664, -57.92228698730469, -52.75048828125, -47.57868576049805, -42.406883239746094, -37.23508071899414, -32.06327819824219, -26.8914794921875, -21.719676971435547, -16.547874450683594, -11.376073837280273, -6.204273223876953, -1.032470703125, 4.139330863952637, 9.311132431030273, 14.48293399810791, 19.654735565185547, 24.8265380859375, 29.99833869934082, 35.17013931274414, 40.341941833496094, 45.51374435424805, 50.685546875, 55.85734558105469, 61.02914810180664, 66.2009506225586, 71.37274932861328, 76.5445556640625, 81.71635437011719, 86.88815307617188, 92.0599594116211, 97.23175811767578, 102.403564453125, 107.57536315917969, 112.74716186523438, 117.91896057128906, 123.09076690673828, 128.2625732421875, 133.4343719482422, 138.60617065429688, 143.77796936035156, 148.94976806640625, 154.12158203125, 159.2933807373047, 164.46517944335938]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 13.0, 8.0, 10.0, 19.0, 33.0, 27.0, 54.0, 99.0, 137.0, 220.0, 429.0, 814.0, 1630.0, 3887.0, 10224.0, 33816.0, 167324.0, 3676555.0, 237146.0, 41520.0, 12041.0, 4305.0, 1865.0, 902.0, 471.0, 257.0, 140.0, 99.0, 69.0, 52.0, 36.0, 24.0, 13.0, 8.0, 8.0, 6.0, 6.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.375, -121.5263671875, -117.677734375, -113.8291015625, -109.98046875, -106.1318359375, -102.283203125, -98.4345703125, -94.5859375, -90.7373046875, -86.888671875, -83.0400390625, -79.19140625, -75.3427734375, -71.494140625, -67.6455078125, -63.796875, -59.9482421875, -56.099609375, -52.2509765625, -48.40234375, -44.5537109375, -40.705078125, -36.8564453125, -33.0078125, -29.1591796875, -25.310546875, -21.4619140625, -17.61328125, -13.7646484375, -9.916015625, -6.0673828125, -2.21875, 1.6298828125, 5.478515625, 9.3271484375, 13.17578125, 17.0244140625, 20.873046875, 24.7216796875, 28.5703125, 32.4189453125, 36.267578125, 40.1162109375, 43.96484375, 47.8134765625, 51.662109375, 55.5107421875, 59.359375, 63.2080078125, 67.056640625, 70.9052734375, 74.75390625, 78.6025390625, 82.451171875, 86.2998046875, 90.1484375, 93.9970703125, 97.845703125, 101.6943359375, 105.54296875, 109.3916015625, 113.240234375, 117.0888671875, 120.9375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 9.0, 10.0, 12.0, 12.0, 14.0, 24.0, 23.0, 21.0, 41.0, 36.0, 54.0, 50.0, 53.0, 71.0, 59.0, 53.0, 59.0, 54.0, 52.0, 50.0, 50.0, 36.0, 35.0, 30.0, 24.0, 13.0, 15.0, 13.0, 10.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.39306640625, -8.9892578125, -8.58544921875, -8.181640625, -7.77783203125, -7.3740234375, -6.97021484375, -6.56640625, -6.16259765625, -5.7587890625, -5.35498046875, -4.951171875, -4.54736328125, -4.1435546875, -3.73974609375, -3.3359375, -2.93212890625, -2.5283203125, -2.12451171875, -1.720703125, -1.31689453125, -0.9130859375, -0.50927734375, -0.10546875, 0.29833984375, 0.7021484375, 1.10595703125, 1.509765625, 1.91357421875, 2.3173828125, 2.72119140625, 3.125, 3.52880859375, 3.9326171875, 4.33642578125, 4.740234375, 5.14404296875, 5.5478515625, 5.95166015625, 6.35546875, 6.75927734375, 7.1630859375, 7.56689453125, 7.970703125, 8.37451171875, 8.7783203125, 9.18212890625, 9.5859375, 9.98974609375, 10.3935546875, 10.79736328125, 11.201171875, 11.60498046875, 12.0087890625, 12.41259765625, 12.81640625, 13.22021484375, 13.6240234375, 14.02783203125, 14.431640625, 14.83544921875, 15.2392578125, 15.64306640625, 16.046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 14.0, 19.0, 32.0, 57.0, 85.0, 121.0, 205.0, 355.0, 649.0, 1143.0, 2085.0, 4112.0, 8601.0, 18427.0, 44306.0, 134230.0, 888950.0, 2804416.0, 186476.0, 57118.0, 22269.0, 10186.0, 4766.0, 2510.0, 1359.0, 727.0, 440.0, 245.0, 141.0, 81.0, 58.0, 44.0, 19.0, 12.0, 10.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.6875, -51.7783203125, -49.869140625, -47.9599609375, -46.05078125, -44.1416015625, -42.232421875, -40.3232421875, -38.4140625, -36.5048828125, -34.595703125, -32.6865234375, -30.77734375, -28.8681640625, -26.958984375, -25.0498046875, -23.140625, -21.2314453125, -19.322265625, -17.4130859375, -15.50390625, -13.5947265625, -11.685546875, -9.7763671875, -7.8671875, -5.9580078125, -4.048828125, -2.1396484375, -0.23046875, 1.6787109375, 3.587890625, 5.4970703125, 7.40625, 9.3154296875, 11.224609375, 13.1337890625, 15.04296875, 16.9521484375, 18.861328125, 20.7705078125, 22.6796875, 24.5888671875, 26.498046875, 28.4072265625, 30.31640625, 32.2255859375, 34.134765625, 36.0439453125, 37.953125, 39.8623046875, 41.771484375, 43.6806640625, 45.58984375, 47.4990234375, 49.408203125, 51.3173828125, 53.2265625, 55.1357421875, 57.044921875, 58.9541015625, 60.86328125, 62.7724609375, 64.681640625, 66.5908203125, 68.5]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 2.0, 11.0, 8.0, 8.0, 10.0, 18.0, 21.0, 25.0, 25.0, 41.0, 61.0, 79.0, 125.0, 216.0, 390.0, 1680.0, 575.0, 272.0, 145.0, 101.0, 50.0, 48.0, 37.0, 23.0, 18.0, 16.0, 19.0, 8.0, 8.0, 9.0, 6.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.75, -22.949951171875, -22.14990234375, -21.349853515625, -20.5498046875, -19.749755859375, -18.94970703125, -18.149658203125, -17.349609375, -16.549560546875, -15.74951171875, -14.949462890625, -14.1494140625, -13.349365234375, -12.54931640625, -11.749267578125, -10.94921875, -10.149169921875, -9.34912109375, -8.549072265625, -7.7490234375, -6.948974609375, -6.14892578125, -5.348876953125, -4.548828125, -3.748779296875, -2.94873046875, -2.148681640625, -1.3486328125, -0.548583984375, 0.25146484375, 1.051513671875, 1.8515625, 2.651611328125, 3.45166015625, 4.251708984375, 5.0517578125, 5.851806640625, 6.65185546875, 7.451904296875, 8.251953125, 9.052001953125, 9.85205078125, 10.652099609375, 11.4521484375, 12.252197265625, 13.05224609375, 13.852294921875, 14.65234375, 15.452392578125, 16.25244140625, 17.052490234375, 17.8525390625, 18.652587890625, 19.45263671875, 20.252685546875, 21.052734375, 21.852783203125, 22.65283203125, 23.452880859375, 24.2529296875, 25.052978515625, 25.85302734375, 26.653076171875, 27.453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 12.0, 11.0, 19.0, 33.0, 70.0, 131.0, 149.0, 163.0, 172.0, 100.0, 69.0, 35.0, 13.0, 14.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-343.56982421875, -336.17041015625, -328.7710266113281, -321.3716125488281, -313.97222900390625, -306.57281494140625, -299.17340087890625, -291.7740173339844, -284.3746032714844, -276.9751892089844, -269.5758056640625, -262.1763916015625, -254.77699279785156, -247.37759399414062, -239.97817993164062, -232.5787811279297, -225.17938232421875, -217.7799835205078, -210.38058471679688, -202.98117065429688, -195.58177185058594, -188.182373046875, -180.782958984375, -173.38356018066406, -165.98416137695312, -158.5847625732422, -151.18536376953125, -143.78594970703125, -136.3865509033203, -128.98715209960938, -121.5877456665039, -114.18833923339844, -106.7889404296875, -99.38954162597656, -91.9901351928711, -84.59072875976562, -77.19132995605469, -69.79193115234375, -62.39252471923828, -54.99312210083008, -47.593719482421875, -40.19431686401367, -32.79491424560547, -25.395511627197266, -17.996109008789062, -10.59670639038086, -3.1973037719726562, 4.202098846435547, 11.60150146484375, 19.000904083251953, 26.400306701660156, 33.79970932006836, 41.19911193847656, 48.598514556884766, 55.99791717529297, 63.39731979370117, 70.79672241210938, 78.19612121582031, 85.59552764892578, 92.99493408203125, 100.39433288574219, 107.79373168945312, 115.1931381225586, 122.59254455566406, 129.991943359375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 17.0, 15.0, 14.0, 18.0, 28.0, 23.0, 24.0, 31.0, 40.0, 27.0, 39.0, 42.0, 44.0, 38.0, 47.0, 51.0, 45.0, 41.0, 35.0, 40.0, 40.0, 37.0, 26.0, 29.0, 29.0, 35.0, 23.0, 23.0, 15.0, 14.0, 13.0, 2.0, 10.0, 7.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-83.47816467285156, -80.70133209228516, -77.92449951171875, -75.14766693115234, -72.37083435058594, -69.59400939941406, -66.81717681884766, -64.04034423828125, -61.263511657714844, -58.48667907714844, -55.70984649658203, -52.93301773071289, -50.156185150146484, -47.37935256958008, -44.60252380371094, -41.82569122314453, -39.048858642578125, -36.27202606201172, -33.49519348144531, -30.718364715576172, -27.941532135009766, -25.16469955444336, -22.387868881225586, -19.611038208007812, -16.834205627441406, -14.057374000549316, -11.280542373657227, -8.503710746765137, -5.726879119873047, -2.950047492980957, -0.1732158660888672, 2.6036148071289062, 5.380455017089844, 8.157286643981934, 10.934118270874023, 13.710949897766113, 16.487781524658203, 19.26461410522461, 22.041444778442383, 24.818275451660156, 27.595108032226562, 30.37194061279297, 33.148773193359375, 35.925601959228516, 38.70243453979492, 41.47926712036133, 44.25609588623047, 47.032928466796875, 49.80976104736328, 52.58659362792969, 55.363426208496094, 58.140254974365234, 60.91708755493164, 63.69392013549805, 66.47074890136719, 69.2475814819336, 72.0244140625, 74.8012466430664, 77.57807922363281, 80.35491180419922, 83.13174438476562, 85.9085693359375, 88.6854019165039, 91.46223449707031, 94.23906707763672]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 7.0, 10.0, 11.0, 16.0, 18.0, 36.0, 71.0, 76.0, 137.0, 202.0, 363.0, 666.0, 1440.0, 3881.0, 12204.0, 46152.0, 187579.0, 533488.0, 194376.0, 47930.0, 12758.0, 3972.0, 1534.0, 694.0, 339.0, 215.0, 103.0, 75.0, 62.0, 45.0, 16.0, 21.0, 15.0, 12.0, 12.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-101.75, -98.7138671875, -95.677734375, -92.6416015625, -89.60546875, -86.5693359375, -83.533203125, -80.4970703125, -77.4609375, -74.4248046875, -71.388671875, -68.3525390625, -65.31640625, -62.2802734375, -59.244140625, -56.2080078125, -53.171875, -50.1357421875, -47.099609375, -44.0634765625, -41.02734375, -37.9912109375, -34.955078125, -31.9189453125, -28.8828125, -25.8466796875, -22.810546875, -19.7744140625, -16.73828125, -13.7021484375, -10.666015625, -7.6298828125, -4.59375, -1.5576171875, 1.478515625, 4.5146484375, 7.55078125, 10.5869140625, 13.623046875, 16.6591796875, 19.6953125, 22.7314453125, 25.767578125, 28.8037109375, 31.83984375, 34.8759765625, 37.912109375, 40.9482421875, 43.984375, 47.0205078125, 50.056640625, 53.0927734375, 56.12890625, 59.1650390625, 62.201171875, 65.2373046875, 68.2734375, 71.3095703125, 74.345703125, 77.3818359375, 80.41796875, 83.4541015625, 86.490234375, 89.5263671875, 92.5625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 6.0, 9.0, 10.0, 11.0, 11.0, 16.0, 25.0, 33.0, 36.0, 32.0, 40.0, 49.0, 52.0, 65.0, 47.0, 53.0, 61.0, 41.0, 69.0, 49.0, 46.0, 44.0, 36.0, 40.0, 19.0, 28.0, 11.0, 15.0, 12.0, 10.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.765625, -9.355712890625, -8.94580078125, -8.535888671875, -8.1259765625, -7.716064453125, -7.30615234375, -6.896240234375, -6.486328125, -6.076416015625, -5.66650390625, -5.256591796875, -4.8466796875, -4.436767578125, -4.02685546875, -3.616943359375, -3.20703125, -2.797119140625, -2.38720703125, -1.977294921875, -1.5673828125, -1.157470703125, -0.74755859375, -0.337646484375, 0.072265625, 0.482177734375, 0.89208984375, 1.302001953125, 1.7119140625, 2.121826171875, 2.53173828125, 2.941650390625, 3.3515625, 3.761474609375, 4.17138671875, 4.581298828125, 4.9912109375, 5.401123046875, 5.81103515625, 6.220947265625, 6.630859375, 7.040771484375, 7.45068359375, 7.860595703125, 8.2705078125, 8.680419921875, 9.09033203125, 9.500244140625, 9.91015625, 10.320068359375, 10.72998046875, 11.139892578125, 11.5498046875, 11.959716796875, 12.36962890625, 12.779541015625, 13.189453125, 13.599365234375, 14.00927734375, 14.419189453125, 14.8291015625, 15.239013671875, 15.64892578125, 16.058837890625, 16.46875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 12.0, 12.0, 28.0, 37.0, 46.0, 51.0, 100.0, 110.0, 137.0, 174.0, 316.0, 450.0, 700.0, 1269.0, 2858.0, 7523.0, 23610.0, 78446.0, 273456.0, 450735.0, 143987.0, 42637.0, 12734.0, 4573.0, 1857.0, 927.0, 552.0, 331.0, 251.0, 192.0, 95.0, 89.0, 67.0, 59.0, 25.0, 32.0, 17.0, 14.0, 15.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.25, -56.3857421875, -54.521484375, -52.6572265625, -50.79296875, -48.9287109375, -47.064453125, -45.2001953125, -43.3359375, -41.4716796875, -39.607421875, -37.7431640625, -35.87890625, -34.0146484375, -32.150390625, -30.2861328125, -28.421875, -26.5576171875, -24.693359375, -22.8291015625, -20.96484375, -19.1005859375, -17.236328125, -15.3720703125, -13.5078125, -11.6435546875, -9.779296875, -7.9150390625, -6.05078125, -4.1865234375, -2.322265625, -0.4580078125, 1.40625, 3.2705078125, 5.134765625, 6.9990234375, 8.86328125, 10.7275390625, 12.591796875, 14.4560546875, 16.3203125, 18.1845703125, 20.048828125, 21.9130859375, 23.77734375, 25.6416015625, 27.505859375, 29.3701171875, 31.234375, 33.0986328125, 34.962890625, 36.8271484375, 38.69140625, 40.5556640625, 42.419921875, 44.2841796875, 46.1484375, 48.0126953125, 49.876953125, 51.7412109375, 53.60546875, 55.4697265625, 57.333984375, 59.1982421875, 61.0625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 0.0, 6.0, 6.0, 10.0, 10.0, 23.0, 20.0, 14.0, 19.0, 17.0, 28.0, 41.0, 33.0, 38.0, 39.0, 45.0, 43.0, 47.0, 60.0, 51.0, 39.0, 58.0, 43.0, 37.0, 37.0, 31.0, 38.0, 23.0, 28.0, 21.0, 19.0, 18.0, 8.0, 12.0, 14.0, 5.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.0, -44.46484375, -42.9296875, -41.39453125, -39.859375, -38.32421875, -36.7890625, -35.25390625, -33.71875, -32.18359375, -30.6484375, -29.11328125, -27.578125, -26.04296875, -24.5078125, -22.97265625, -21.4375, -19.90234375, -18.3671875, -16.83203125, -15.296875, -13.76171875, -12.2265625, -10.69140625, -9.15625, -7.62109375, -6.0859375, -4.55078125, -3.015625, -1.48046875, 0.0546875, 1.58984375, 3.125, 4.66015625, 6.1953125, 7.73046875, 9.265625, 10.80078125, 12.3359375, 13.87109375, 15.40625, 16.94140625, 18.4765625, 20.01171875, 21.546875, 23.08203125, 24.6171875, 26.15234375, 27.6875, 29.22265625, 30.7578125, 32.29296875, 33.828125, 35.36328125, 36.8984375, 38.43359375, 39.96875, 41.50390625, 43.0390625, 44.57421875, 46.109375, 47.64453125, 49.1796875, 50.71484375, 52.25]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 10.0, 23.0, 16.0, 23.0, 33.0, 73.0, 94.0, 142.0, 233.0, 405.0, 792.0, 1753.0, 4483.0, 14950.0, 71540.0, 506048.0, 376111.0, 52851.0, 11925.0, 3812.0, 1525.0, 716.0, 384.0, 209.0, 121.0, 81.0, 53.0, 36.0, 32.0, 19.0, 14.0, 14.0, 8.0, 5.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.0625, -39.81494140625, -38.5673828125, -37.31982421875, -36.072265625, -34.82470703125, -33.5771484375, -32.32958984375, -31.08203125, -29.83447265625, -28.5869140625, -27.33935546875, -26.091796875, -24.84423828125, -23.5966796875, -22.34912109375, -21.1015625, -19.85400390625, -18.6064453125, -17.35888671875, -16.111328125, -14.86376953125, -13.6162109375, -12.36865234375, -11.12109375, -9.87353515625, -8.6259765625, -7.37841796875, -6.130859375, -4.88330078125, -3.6357421875, -2.38818359375, -1.140625, 0.10693359375, 1.3544921875, 2.60205078125, 3.849609375, 5.09716796875, 6.3447265625, 7.59228515625, 8.83984375, 10.08740234375, 11.3349609375, 12.58251953125, 13.830078125, 15.07763671875, 16.3251953125, 17.57275390625, 18.8203125, 20.06787109375, 21.3154296875, 22.56298828125, 23.810546875, 25.05810546875, 26.3056640625, 27.55322265625, 28.80078125, 30.04833984375, 31.2958984375, 32.54345703125, 33.791015625, 35.03857421875, 36.2861328125, 37.53369140625, 38.78125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 11.0, 16.0, 22.0, 35.0, 50.0, 79.0, 158.0, 200.0, 166.0, 83.0, 61.0, 37.0, 35.0, 9.0, 13.0, 3.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007717132568359375, -0.007426202297210693, -0.007135272026062012, -0.00684434175491333, -0.0065534114837646484, -0.006262481212615967, -0.005971550941467285, -0.0056806206703186035, -0.005389690399169922, -0.00509876012802124, -0.004807829856872559, -0.004516899585723877, -0.004225969314575195, -0.003935039043426514, -0.003644108772277832, -0.0033531785011291504, -0.0030622482299804688, -0.002771317958831787, -0.0024803876876831055, -0.002189457416534424, -0.0018985271453857422, -0.0016075968742370605, -0.001316666603088379, -0.0010257363319396973, -0.0007348060607910156, -0.000443875789642334, -0.00015294551849365234, 0.0001379847526550293, 0.00042891502380371094, 0.0007198452949523926, 0.0010107755661010742, 0.0013017058372497559, 0.0015926361083984375, 0.0018835663795471191, 0.0021744966506958008, 0.0024654269218444824, 0.002756357192993164, 0.0030472874641418457, 0.0033382177352905273, 0.003629148006439209, 0.003920078277587891, 0.004211008548736572, 0.004501938819885254, 0.0047928690910339355, 0.005083799362182617, 0.005374729633331299, 0.0056656599044799805, 0.005956590175628662, 0.006247520446777344, 0.006538450717926025, 0.006829380989074707, 0.007120311260223389, 0.00741124153137207, 0.007702171802520752, 0.007993102073669434, 0.008284032344818115, 0.008574962615966797, 0.008865892887115479, 0.00915682315826416, 0.009447753429412842, 0.009738683700561523, 0.010029613971710205, 0.010320544242858887, 0.010611474514007568, 0.01090240478515625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 15.0, 13.0, 29.0, 57.0, 116.0, 226.0, 443.0, 1085.0, 3105.0, 13801.0, 144948.0, 790031.0, 81012.0, 9619.0, 2397.0, 926.0, 338.0, 178.0, 109.0, 38.0, 29.0, 13.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.125, -70.08740234375, -68.0498046875, -66.01220703125, -63.974609375, -61.93701171875, -59.8994140625, -57.86181640625, -55.82421875, -53.78662109375, -51.7490234375, -49.71142578125, -47.673828125, -45.63623046875, -43.5986328125, -41.56103515625, -39.5234375, -37.48583984375, -35.4482421875, -33.41064453125, -31.373046875, -29.33544921875, -27.2978515625, -25.26025390625, -23.22265625, -21.18505859375, -19.1474609375, -17.10986328125, -15.072265625, -13.03466796875, -10.9970703125, -8.95947265625, -6.921875, -4.88427734375, -2.8466796875, -0.80908203125, 1.228515625, 3.26611328125, 5.3037109375, 7.34130859375, 9.37890625, 11.41650390625, 13.4541015625, 15.49169921875, 17.529296875, 19.56689453125, 21.6044921875, 23.64208984375, 25.6796875, 27.71728515625, 29.7548828125, 31.79248046875, 33.830078125, 35.86767578125, 37.9052734375, 39.94287109375, 41.98046875, 44.01806640625, 46.0556640625, 48.09326171875, 50.130859375, 52.16845703125, 54.2060546875, 56.24365234375, 58.28125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 6.0, 13.0, 20.0, 31.0, 48.0, 85.0, 112.0, 147.0, 159.0, 126.0, 76.0, 64.0, 33.0, 27.0, 17.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-68.0, -66.584716796875, -65.16943359375, -63.754150390625, -62.3388671875, -60.923583984375, -59.50830078125, -58.093017578125, -56.677734375, -55.262451171875, -53.84716796875, -52.431884765625, -51.0166015625, -49.601318359375, -48.18603515625, -46.770751953125, -45.35546875, -43.940185546875, -42.52490234375, -41.109619140625, -39.6943359375, -38.279052734375, -36.86376953125, -35.448486328125, -34.033203125, -32.617919921875, -31.20263671875, -29.787353515625, -28.3720703125, -26.956787109375, -25.54150390625, -24.126220703125, -22.7109375, -21.295654296875, -19.88037109375, -18.465087890625, -17.0498046875, -15.634521484375, -14.21923828125, -12.803955078125, -11.388671875, -9.973388671875, -8.55810546875, -7.142822265625, -5.7275390625, -4.312255859375, -2.89697265625, -1.481689453125, -0.06640625, 1.348876953125, 2.76416015625, 4.179443359375, 5.5947265625, 7.010009765625, 8.42529296875, 9.840576171875, 11.255859375, 12.671142578125, 14.08642578125, 15.501708984375, 16.9169921875, 18.332275390625, 19.74755859375, 21.162841796875, 22.578125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 9.0, 4.0, 10.0, 32.0, 56.0, 78.0, 120.0, 142.0, 139.0, 119.0, 109.0, 67.0, 53.0, 23.0, 23.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-708.301025390625, -691.5404663085938, -674.7799682617188, -658.0194091796875, -641.2589111328125, -624.4983520507812, -607.73779296875, -590.977294921875, -574.2167358398438, -557.4561767578125, -540.6956787109375, -523.9351196289062, -507.1745910644531, -490.4140625, -473.6535339355469, -456.89300537109375, -440.1324768066406, -423.3719482421875, -406.6114196777344, -389.85089111328125, -373.09033203125, -356.3298034667969, -339.56927490234375, -322.8087463378906, -306.0482177734375, -289.2876892089844, -272.52716064453125, -255.76661682128906, -239.00607299804688, -222.24554443359375, -205.48501586914062, -188.7244873046875, -171.96389770507812, -155.203369140625, -138.4428253173828, -121.68229675292969, -104.92176055908203, -88.16122436523438, -71.40069580078125, -54.640159606933594, -37.87962341308594, -21.119089126586914, -4.358554840087891, 12.4019775390625, 29.162513732910156, 45.92304992675781, 62.68357849121094, 79.4441146850586, 96.20465087890625, 112.9651870727539, 129.72572326660156, 146.4862518310547, 163.24679565429688, 180.00732421875, 196.76785278320312, 213.52838134765625, 230.28892517089844, 247.04945373535156, 263.80999755859375, 280.5705261230469, 297.3310546875, 314.09161376953125, 330.85211181640625, 347.6126708984375, 364.3731994628906]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 7.0, 6.0, 5.0, 6.0, 8.0, 12.0, 7.0, 13.0, 27.0, 25.0, 23.0, 21.0, 17.0, 37.0, 38.0, 31.0, 29.0, 41.0, 43.0, 37.0, 43.0, 50.0, 41.0, 46.0, 32.0, 40.0, 51.0, 34.0, 43.0, 24.0, 29.0, 30.0, 14.0, 15.0, 16.0, 8.0, 10.0, 12.0, 8.0, 3.0, 7.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.30807495117188, -228.4667510986328, -220.62542724609375, -212.78408813476562, -204.94276428222656, -197.1014404296875, -189.26011657714844, -181.41879272460938, -173.57745361328125, -165.7361297607422, -157.89480590820312, -150.053466796875, -142.21214294433594, -134.37081909179688, -126.52949523925781, -118.68817138671875, -110.84684753417969, -103.00552368164062, -95.16419219970703, -87.32286834716797, -79.48153686523438, -71.64021301269531, -63.79888916015625, -55.95756149291992, -48.116233825683594, -40.274906158447266, -32.43357849121094, -24.592254638671875, -16.750926971435547, -8.909599304199219, -1.0682754516601562, 6.773052215576172, 14.6143798828125, 22.455707550048828, 30.297033309936523, 38.13835906982422, 45.97968673706055, 53.821014404296875, 61.66233825683594, 69.503662109375, 77.3449935913086, 85.18631744384766, 93.02764892578125, 100.86897277832031, 108.71029663085938, 116.55162811279297, 124.39295196533203, 132.23428344726562, 140.0756072998047, 147.91693115234375, 155.7582550048828, 163.59957885742188, 171.44091796875, 179.28224182128906, 187.12356567382812, 194.9648895263672, 202.80621337890625, 210.6475372314453, 218.48886108398438, 226.3302001953125, 234.17152404785156, 242.01284790039062, 249.8541717529297, 257.69549560546875, 265.5368347167969]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 8.0, 3.0, 6.0, 8.0, 13.0, 13.0, 31.0, 30.0, 45.0, 102.0, 152.0, 212.0, 388.0, 757.0, 1526.0, 3788.0, 10600.0, 36987.0, 186378.0, 3402576.0, 459325.0, 64516.0, 16661.0, 5505.0, 2258.0, 1020.0, 565.0, 297.0, 175.0, 110.0, 61.0, 37.0, 45.0, 24.0, 22.0, 15.0, 6.0, 2.0, 4.0, 6.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-109.3125, -106.068359375, -102.82421875, -99.580078125, -96.3359375, -93.091796875, -89.84765625, -86.603515625, -83.359375, -80.115234375, -76.87109375, -73.626953125, -70.3828125, -67.138671875, -63.89453125, -60.650390625, -57.40625, -54.162109375, -50.91796875, -47.673828125, -44.4296875, -41.185546875, -37.94140625, -34.697265625, -31.453125, -28.208984375, -24.96484375, -21.720703125, -18.4765625, -15.232421875, -11.98828125, -8.744140625, -5.5, -2.255859375, 0.98828125, 4.232421875, 7.4765625, 10.720703125, 13.96484375, 17.208984375, 20.453125, 23.697265625, 26.94140625, 30.185546875, 33.4296875, 36.673828125, 39.91796875, 43.162109375, 46.40625, 49.650390625, 52.89453125, 56.138671875, 59.3828125, 62.626953125, 65.87109375, 69.115234375, 72.359375, 75.603515625, 78.84765625, 82.091796875, 85.3359375, 88.580078125, 91.82421875, 95.068359375, 98.3125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 12.0, 19.0, 13.0, 16.0, 23.0, 25.0, 29.0, 38.0, 52.0, 52.0, 38.0, 56.0, 52.0, 48.0, 46.0, 74.0, 56.0, 56.0, 52.0, 35.0, 27.0, 39.0, 38.0, 17.0, 13.0, 13.0, 6.0, 8.0, 11.0, 5.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1015625, -10.685791015625, -10.27001953125, -9.854248046875, -9.4384765625, -9.022705078125, -8.60693359375, -8.191162109375, -7.775390625, -7.359619140625, -6.94384765625, -6.528076171875, -6.1123046875, -5.696533203125, -5.28076171875, -4.864990234375, -4.44921875, -4.033447265625, -3.61767578125, -3.201904296875, -2.7861328125, -2.370361328125, -1.95458984375, -1.538818359375, -1.123046875, -0.707275390625, -0.29150390625, 0.124267578125, 0.5400390625, 0.955810546875, 1.37158203125, 1.787353515625, 2.203125, 2.618896484375, 3.03466796875, 3.450439453125, 3.8662109375, 4.281982421875, 4.69775390625, 5.113525390625, 5.529296875, 5.945068359375, 6.36083984375, 6.776611328125, 7.1923828125, 7.608154296875, 8.02392578125, 8.439697265625, 8.85546875, 9.271240234375, 9.68701171875, 10.102783203125, 10.5185546875, 10.934326171875, 11.35009765625, 11.765869140625, 12.181640625, 12.597412109375, 13.01318359375, 13.428955078125, 13.8447265625, 14.260498046875, 14.67626953125, 15.092041015625, 15.5078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 13.0, 15.0, 20.0, 30.0, 50.0, 79.0, 90.0, 153.0, 213.0, 353.0, 584.0, 980.0, 1835.0, 3696.0, 8148.0, 20534.0, 61071.0, 235467.0, 2550557.0, 1075088.0, 160238.0, 45567.0, 15967.0, 6683.0, 3019.0, 1527.0, 912.0, 469.0, 309.0, 188.0, 136.0, 79.0, 72.0, 41.0, 33.0, 19.0, 10.0, 6.0, 5.0, 7.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.0625, -51.224609375, -49.38671875, -47.548828125, -45.7109375, -43.873046875, -42.03515625, -40.197265625, -38.359375, -36.521484375, -34.68359375, -32.845703125, -31.0078125, -29.169921875, -27.33203125, -25.494140625, -23.65625, -21.818359375, -19.98046875, -18.142578125, -16.3046875, -14.466796875, -12.62890625, -10.791015625, -8.953125, -7.115234375, -5.27734375, -3.439453125, -1.6015625, 0.236328125, 2.07421875, 3.912109375, 5.75, 7.587890625, 9.42578125, 11.263671875, 13.1015625, 14.939453125, 16.77734375, 18.615234375, 20.453125, 22.291015625, 24.12890625, 25.966796875, 27.8046875, 29.642578125, 31.48046875, 33.318359375, 35.15625, 36.994140625, 38.83203125, 40.669921875, 42.5078125, 44.345703125, 46.18359375, 48.021484375, 49.859375, 51.697265625, 53.53515625, 55.373046875, 57.2109375, 59.048828125, 60.88671875, 62.724609375, 64.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 5.0, 7.0, 12.0, 21.0, 34.0, 42.0, 60.0, 74.0, 107.0, 192.0, 308.0, 697.0, 1321.0, 462.0, 255.0, 158.0, 87.0, 60.0, 48.0, 34.0, 19.0, 15.0, 16.0, 11.0, 8.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-47.34375, -46.250244140625, -45.15673828125, -44.063232421875, -42.9697265625, -41.876220703125, -40.78271484375, -39.689208984375, -38.595703125, -37.502197265625, -36.40869140625, -35.315185546875, -34.2216796875, -33.128173828125, -32.03466796875, -30.941162109375, -29.84765625, -28.754150390625, -27.66064453125, -26.567138671875, -25.4736328125, -24.380126953125, -23.28662109375, -22.193115234375, -21.099609375, -20.006103515625, -18.91259765625, -17.819091796875, -16.7255859375, -15.632080078125, -14.53857421875, -13.445068359375, -12.3515625, -11.258056640625, -10.16455078125, -9.071044921875, -7.9775390625, -6.884033203125, -5.79052734375, -4.697021484375, -3.603515625, -2.510009765625, -1.41650390625, -0.322998046875, 0.7705078125, 1.864013671875, 2.95751953125, 4.051025390625, 5.14453125, 6.238037109375, 7.33154296875, 8.425048828125, 9.5185546875, 10.612060546875, 11.70556640625, 12.799072265625, 13.892578125, 14.986083984375, 16.07958984375, 17.173095703125, 18.2666015625, 19.360107421875, 20.45361328125, 21.547119140625, 22.640625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 12.0, 12.0, 37.0, 41.0, 84.0, 109.0, 167.0, 159.0, 126.0, 95.0, 53.0, 38.0, 27.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-399.27655029296875, -389.57904052734375, -379.88153076171875, -370.1840515136719, -360.4865417480469, -350.7890319824219, -341.0915222167969, -331.39404296875, -321.696533203125, -311.9990234375, -302.301513671875, -292.6040344238281, -282.9065246582031, -273.2090148925781, -263.5115051269531, -253.8140106201172, -244.1165008544922, -234.4189910888672, -224.72149658203125, -215.02398681640625, -205.3264923095703, -195.6289825439453, -185.93148803710938, -176.23397827148438, -166.53646850585938, -156.83895874023438, -147.14146423339844, -137.44395446777344, -127.7464599609375, -118.0489501953125, -108.35144805908203, -98.65394592285156, -88.95643615722656, -79.2589340209961, -69.56143188476562, -59.86392593383789, -50.16642379760742, -40.46892166137695, -30.77141571044922, -21.07391357421875, -11.376411437988281, -1.678908348083496, 8.018594741821289, 17.71609878540039, 27.41360092163086, 37.11110305786133, 46.80860900878906, 56.50611114501953, 66.20361328125, 75.90111541748047, 85.59861755371094, 95.29612731933594, 104.99362182617188, 114.69113159179688, 124.38863372802734, 134.0861358642578, 143.78363037109375, 153.48114013671875, 163.1786346435547, 172.8761444091797, 182.57363891601562, 192.27114868164062, 201.96865844726562, 211.66615295410156, 221.36366271972656]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 11.0, 7.0, 11.0, 11.0, 21.0, 27.0, 20.0, 32.0, 44.0, 36.0, 39.0, 38.0, 42.0, 45.0, 41.0, 41.0, 55.0, 41.0, 53.0, 62.0, 51.0, 35.0, 36.0, 24.0, 33.0, 18.0, 19.0, 24.0, 10.0, 18.0, 5.0, 12.0, 3.0, 2.0, 4.0, 9.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-130.43902587890625, -126.33580780029297, -122.23258209228516, -118.12936401367188, -114.02613830566406, -109.92292022705078, -105.8197021484375, -101.71647644042969, -97.61325073242188, -93.5100326538086, -89.40680694580078, -85.3035888671875, -81.20036315917969, -77.0971450805664, -72.99392700195312, -68.89070129394531, -64.78748321533203, -60.684261322021484, -56.58103942871094, -52.477821350097656, -48.374595642089844, -44.27137756347656, -40.168155670166016, -36.06493377685547, -31.961711883544922, -27.858489990234375, -23.755268096923828, -19.652048110961914, -15.548826217651367, -11.44560432434082, -7.342384338378906, -3.2391624450683594, 0.8640594482421875, 4.967280864715576, 9.070502281188965, 13.173723220825195, 17.276945114135742, 21.38016700744629, 25.483386993408203, 29.58660888671875, 33.6898307800293, 37.793052673339844, 41.89627456665039, 45.99949645996094, 50.10271453857422, 54.20594024658203, 58.30915832519531, 62.41238021850586, 66.5156021118164, 70.61882019042969, 74.7220458984375, 78.82526397705078, 82.9284896850586, 87.03170776367188, 91.13493347167969, 95.23815155029297, 99.34136962890625, 103.44458770751953, 107.54781341552734, 111.65103149414062, 115.75425720214844, 119.85747528076172, 123.960693359375, 128.0639190673828, 132.16714477539062]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 11.0, 14.0, 16.0, 27.0, 21.0, 66.0, 94.0, 124.0, 236.0, 320.0, 577.0, 1102.0, 2573.0, 6488.0, 18211.0, 59781.0, 200771.0, 407529.0, 241080.0, 73454.0, 22336.0, 7711.0, 2985.0, 1331.0, 700.0, 338.0, 209.0, 134.0, 84.0, 62.0, 46.0, 28.0, 17.0, 20.0, 11.0, 5.0, 8.0, 9.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-80.9375, -78.6630859375, -76.388671875, -74.1142578125, -71.83984375, -69.5654296875, -67.291015625, -65.0166015625, -62.7421875, -60.4677734375, -58.193359375, -55.9189453125, -53.64453125, -51.3701171875, -49.095703125, -46.8212890625, -44.546875, -42.2724609375, -39.998046875, -37.7236328125, -35.44921875, -33.1748046875, -30.900390625, -28.6259765625, -26.3515625, -24.0771484375, -21.802734375, -19.5283203125, -17.25390625, -14.9794921875, -12.705078125, -10.4306640625, -8.15625, -5.8818359375, -3.607421875, -1.3330078125, 0.94140625, 3.2158203125, 5.490234375, 7.7646484375, 10.0390625, 12.3134765625, 14.587890625, 16.8623046875, 19.13671875, 21.4111328125, 23.685546875, 25.9599609375, 28.234375, 30.5087890625, 32.783203125, 35.0576171875, 37.33203125, 39.6064453125, 41.880859375, 44.1552734375, 46.4296875, 48.7041015625, 50.978515625, 53.2529296875, 55.52734375, 57.8017578125, 60.076171875, 62.3505859375, 64.625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 8.0, 11.0, 15.0, 21.0, 20.0, 37.0, 27.0, 36.0, 46.0, 43.0, 50.0, 62.0, 49.0, 50.0, 59.0, 51.0, 57.0, 58.0, 33.0, 47.0, 44.0, 25.0, 31.0, 19.0, 17.0, 15.0, 9.0, 8.0, 8.0, 5.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.0146484375, -9.576171875, -9.1376953125, -8.69921875, -8.2607421875, -7.822265625, -7.3837890625, -6.9453125, -6.5068359375, -6.068359375, -5.6298828125, -5.19140625, -4.7529296875, -4.314453125, -3.8759765625, -3.4375, -2.9990234375, -2.560546875, -2.1220703125, -1.68359375, -1.2451171875, -0.806640625, -0.3681640625, 0.0703125, 0.5087890625, 0.947265625, 1.3857421875, 1.82421875, 2.2626953125, 2.701171875, 3.1396484375, 3.578125, 4.0166015625, 4.455078125, 4.8935546875, 5.33203125, 5.7705078125, 6.208984375, 6.6474609375, 7.0859375, 7.5244140625, 7.962890625, 8.4013671875, 8.83984375, 9.2783203125, 9.716796875, 10.1552734375, 10.59375, 11.0322265625, 11.470703125, 11.9091796875, 12.34765625, 12.7861328125, 13.224609375, 13.6630859375, 14.1015625, 14.5400390625, 14.978515625, 15.4169921875, 15.85546875, 16.2939453125, 16.732421875, 17.1708984375, 17.609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 6.0, 7.0, 8.0, 11.0, 21.0, 19.0, 25.0, 43.0, 40.0, 81.0, 105.0, 130.0, 246.0, 311.0, 491.0, 739.0, 1424.0, 2911.0, 7377.0, 23383.0, 82152.0, 290311.0, 425137.0, 151113.0, 40832.0, 12404.0, 4449.0, 1906.0, 1034.0, 602.0, 355.0, 245.0, 163.0, 117.0, 80.0, 89.0, 50.0, 32.0, 31.0, 24.0, 12.0, 14.0, 4.0, 4.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-65.1875, -63.1650390625, -61.142578125, -59.1201171875, -57.09765625, -55.0751953125, -53.052734375, -51.0302734375, -49.0078125, -46.9853515625, -44.962890625, -42.9404296875, -40.91796875, -38.8955078125, -36.873046875, -34.8505859375, -32.828125, -30.8056640625, -28.783203125, -26.7607421875, -24.73828125, -22.7158203125, -20.693359375, -18.6708984375, -16.6484375, -14.6259765625, -12.603515625, -10.5810546875, -8.55859375, -6.5361328125, -4.513671875, -2.4912109375, -0.46875, 1.5537109375, 3.576171875, 5.5986328125, 7.62109375, 9.6435546875, 11.666015625, 13.6884765625, 15.7109375, 17.7333984375, 19.755859375, 21.7783203125, 23.80078125, 25.8232421875, 27.845703125, 29.8681640625, 31.890625, 33.9130859375, 35.935546875, 37.9580078125, 39.98046875, 42.0029296875, 44.025390625, 46.0478515625, 48.0703125, 50.0927734375, 52.115234375, 54.1376953125, 56.16015625, 58.1826171875, 60.205078125, 62.2275390625, 64.25]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 3.0, 6.0, 6.0, 12.0, 8.0, 11.0, 20.0, 13.0, 22.0, 25.0, 23.0, 32.0, 30.0, 37.0, 26.0, 41.0, 38.0, 34.0, 39.0, 37.0, 43.0, 40.0, 45.0, 43.0, 39.0, 28.0, 36.0, 29.0, 28.0, 27.0, 27.0, 18.0, 17.0, 12.0, 23.0, 13.0, 13.0, 13.0, 9.0, 6.0, 7.0, 0.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-51.9375, -50.376953125, -48.81640625, -47.255859375, -45.6953125, -44.134765625, -42.57421875, -41.013671875, -39.453125, -37.892578125, -36.33203125, -34.771484375, -33.2109375, -31.650390625, -30.08984375, -28.529296875, -26.96875, -25.408203125, -23.84765625, -22.287109375, -20.7265625, -19.166015625, -17.60546875, -16.044921875, -14.484375, -12.923828125, -11.36328125, -9.802734375, -8.2421875, -6.681640625, -5.12109375, -3.560546875, -2.0, -0.439453125, 1.12109375, 2.681640625, 4.2421875, 5.802734375, 7.36328125, 8.923828125, 10.484375, 12.044921875, 13.60546875, 15.166015625, 16.7265625, 18.287109375, 19.84765625, 21.408203125, 22.96875, 24.529296875, 26.08984375, 27.650390625, 29.2109375, 30.771484375, 32.33203125, 33.892578125, 35.453125, 37.013671875, 38.57421875, 40.134765625, 41.6953125, 43.255859375, 44.81640625, 46.376953125, 47.9375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 13.0, 14.0, 21.0, 27.0, 47.0, 103.0, 134.0, 248.0, 421.0, 777.0, 1410.0, 3036.0, 7161.0, 20018.0, 64567.0, 217923.0, 420413.0, 214842.0, 64269.0, 19735.0, 7078.0, 3089.0, 1413.0, 744.0, 426.0, 236.0, 133.0, 80.0, 46.0, 34.0, 25.0, 14.0, 8.0, 12.0, 7.0, 6.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.984375, -27.173095703125, -26.36181640625, -25.550537109375, -24.7392578125, -23.927978515625, -23.11669921875, -22.305419921875, -21.494140625, -20.682861328125, -19.87158203125, -19.060302734375, -18.2490234375, -17.437744140625, -16.62646484375, -15.815185546875, -15.00390625, -14.192626953125, -13.38134765625, -12.570068359375, -11.7587890625, -10.947509765625, -10.13623046875, -9.324951171875, -8.513671875, -7.702392578125, -6.89111328125, -6.079833984375, -5.2685546875, -4.457275390625, -3.64599609375, -2.834716796875, -2.0234375, -1.212158203125, -0.40087890625, 0.410400390625, 1.2216796875, 2.032958984375, 2.84423828125, 3.655517578125, 4.466796875, 5.278076171875, 6.08935546875, 6.900634765625, 7.7119140625, 8.523193359375, 9.33447265625, 10.145751953125, 10.95703125, 11.768310546875, 12.57958984375, 13.390869140625, 14.2021484375, 15.013427734375, 15.82470703125, 16.635986328125, 17.447265625, 18.258544921875, 19.06982421875, 19.881103515625, 20.6923828125, 21.503662109375, 22.31494140625, 23.126220703125, 23.9375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 9.0, 11.0, 18.0, 16.0, 17.0, 31.0, 42.0, 41.0, 40.0, 50.0, 53.0, 62.0, 49.0, 53.0, 62.0, 58.0, 58.0, 52.0, 44.0, 34.0, 32.0, 31.0, 23.0, 13.0, 26.0, 11.0, 9.0, 6.0, 7.0, 7.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002956390380859375, -0.002844691276550293, -0.002732992172241211, -0.002621293067932129, -0.002509593963623047, -0.002397894859313965, -0.002286195755004883, -0.0021744966506958008, -0.0020627975463867188, -0.0019510984420776367, -0.0018393993377685547, -0.0017277002334594727, -0.0016160011291503906, -0.0015043020248413086, -0.0013926029205322266, -0.0012809038162231445, -0.0011692047119140625, -0.0010575056076049805, -0.0009458065032958984, -0.0008341073989868164, -0.0007224082946777344, -0.0006107091903686523, -0.0004990100860595703, -0.0003873109817504883, -0.00027561187744140625, -0.00016391277313232422, -5.221366882324219e-05, 5.9485435485839844e-05, 0.00017118453979492188, 0.0002828836441040039, 0.00039458274841308594, 0.000506281852722168, 0.00061798095703125, 0.000729680061340332, 0.0008413791656494141, 0.0009530782699584961, 0.0010647773742675781, 0.0011764764785766602, 0.0012881755828857422, 0.0013998746871948242, 0.0015115737915039062, 0.0016232728958129883, 0.0017349720001220703, 0.0018466711044311523, 0.0019583702087402344, 0.0020700693130493164, 0.0021817684173583984, 0.0022934675216674805, 0.0024051666259765625, 0.0025168657302856445, 0.0026285648345947266, 0.0027402639389038086, 0.0028519630432128906, 0.0029636621475219727, 0.0030753612518310547, 0.0031870603561401367, 0.0032987594604492188, 0.0034104585647583008, 0.003522157669067383, 0.003633856773376465, 0.003745555877685547, 0.003857254981994629, 0.003968954086303711, 0.004080653190612793, 0.004192352294921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 8.0, 10.0, 21.0, 34.0, 35.0, 55.0, 76.0, 100.0, 134.0, 235.0, 375.0, 617.0, 1181.0, 2451.0, 6214.0, 17586.0, 63160.0, 242701.0, 456752.0, 185504.0, 47549.0, 14027.0, 5056.0, 2066.0, 1011.0, 559.0, 336.0, 200.0, 148.0, 110.0, 57.0, 43.0, 35.0, 36.0, 14.0, 10.0, 7.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.484375, -29.571533203125, -28.65869140625, -27.745849609375, -26.8330078125, -25.920166015625, -25.00732421875, -24.094482421875, -23.181640625, -22.268798828125, -21.35595703125, -20.443115234375, -19.5302734375, -18.617431640625, -17.70458984375, -16.791748046875, -15.87890625, -14.966064453125, -14.05322265625, -13.140380859375, -12.2275390625, -11.314697265625, -10.40185546875, -9.489013671875, -8.576171875, -7.663330078125, -6.75048828125, -5.837646484375, -4.9248046875, -4.011962890625, -3.09912109375, -2.186279296875, -1.2734375, -0.360595703125, 0.55224609375, 1.465087890625, 2.3779296875, 3.290771484375, 4.20361328125, 5.116455078125, 6.029296875, 6.942138671875, 7.85498046875, 8.767822265625, 9.6806640625, 10.593505859375, 11.50634765625, 12.419189453125, 13.33203125, 14.244873046875, 15.15771484375, 16.070556640625, 16.9833984375, 17.896240234375, 18.80908203125, 19.721923828125, 20.634765625, 21.547607421875, 22.46044921875, 23.373291015625, 24.2861328125, 25.198974609375, 26.11181640625, 27.024658203125, 27.9375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 6.0, 6.0, 9.0, 15.0, 16.0, 19.0, 22.0, 23.0, 28.0, 32.0, 42.0, 42.0, 49.0, 62.0, 48.0, 68.0, 66.0, 62.0, 39.0, 42.0, 47.0, 38.0, 37.0, 19.0, 23.0, 26.0, 22.0, 12.0, 16.0, 11.0, 9.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.53125, -19.85107421875, -19.1708984375, -18.49072265625, -17.810546875, -17.13037109375, -16.4501953125, -15.77001953125, -15.08984375, -14.40966796875, -13.7294921875, -13.04931640625, -12.369140625, -11.68896484375, -11.0087890625, -10.32861328125, -9.6484375, -8.96826171875, -8.2880859375, -7.60791015625, -6.927734375, -6.24755859375, -5.5673828125, -4.88720703125, -4.20703125, -3.52685546875, -2.8466796875, -2.16650390625, -1.486328125, -0.80615234375, -0.1259765625, 0.55419921875, 1.234375, 1.91455078125, 2.5947265625, 3.27490234375, 3.955078125, 4.63525390625, 5.3154296875, 5.99560546875, 6.67578125, 7.35595703125, 8.0361328125, 8.71630859375, 9.396484375, 10.07666015625, 10.7568359375, 11.43701171875, 12.1171875, 12.79736328125, 13.4775390625, 14.15771484375, 14.837890625, 15.51806640625, 16.1982421875, 16.87841796875, 17.55859375, 18.23876953125, 18.9189453125, 19.59912109375, 20.279296875, 20.95947265625, 21.6396484375, 22.31982421875, 23.0]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 11.0, 17.0, 48.0, 53.0, 83.0, 154.0, 148.0, 172.0, 133.0, 62.0, 46.0, 36.0, 16.0, 13.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-614.4017944335938, -594.3441772460938, -574.28662109375, -554.22900390625, -534.17138671875, -514.1138305664062, -494.05621337890625, -473.9986267089844, -453.9410400390625, -433.8834533691406, -413.8258361816406, -393.76824951171875, -373.7106628417969, -353.653076171875, -333.595458984375, -313.5378723144531, -293.4802551269531, -273.42266845703125, -253.3650665283203, -233.30746459960938, -213.2498779296875, -193.19227600097656, -173.13467407226562, -153.07708740234375, -133.0194854736328, -112.9618911743164, -92.904296875, -72.84669494628906, -52.789100646972656, -32.73150634765625, -12.673904418945312, 7.3836822509765625, 27.4412841796875, 47.498878479003906, 67.55647277832031, 87.61407470703125, 107.67166900634766, 127.72926330566406, 147.786865234375, 167.84445190429688, 187.9020538330078, 207.95965576171875, 228.01724243164062, 248.07484436035156, 268.1324462890625, 288.1900329589844, 308.24761962890625, 328.30523681640625, 348.3628234863281, 368.42041015625, 388.47802734375, 408.5356140136719, 428.59320068359375, 448.65081787109375, 468.7084045410156, 488.7659912109375, 508.8236083984375, 528.8812255859375, 548.9387817382812, 568.9963989257812, 589.0540161132812, 609.111572265625, 629.169189453125, 649.226806640625, 669.2843627929688]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 12.0, 14.0, 8.0, 19.0, 17.0, 12.0, 39.0, 31.0, 34.0, 41.0, 38.0, 33.0, 40.0, 37.0, 45.0, 30.0, 36.0, 48.0, 46.0, 50.0, 37.0, 47.0, 43.0, 30.0, 32.0, 28.0, 26.0, 17.0, 8.0, 15.0, 12.0, 12.0, 11.0, 11.0, 6.0, 5.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-294.7973937988281, -286.0057678222656, -277.2141418457031, -268.4225158691406, -259.6308898925781, -250.83926391601562, -242.0476531982422, -233.2560272216797, -224.4644012451172, -215.6727752685547, -206.8811492919922, -198.0895233154297, -189.29791259765625, -180.50628662109375, -171.71466064453125, -162.92303466796875, -154.13140869140625, -145.33978271484375, -136.54815673828125, -127.75653839111328, -118.96491241455078, -110.17328643798828, -101.38166809082031, -92.59004211425781, -83.79841613769531, -75.00679016113281, -66.21516418457031, -57.423545837402344, -48.631919860839844, -39.840293884277344, -31.04867172241211, -22.257049560546875, -13.46539306640625, -4.673768997192383, 4.117855072021484, 12.909479141235352, 21.70110321044922, 30.49272918701172, 39.28435134887695, 48.07597351074219, 56.86759948730469, 65.65922546386719, 74.45085144042969, 83.24246978759766, 92.03409576416016, 100.82572174072266, 109.61734008789062, 118.40896606445312, 127.20059204101562, 135.99221801757812, 144.78384399414062, 153.57546997070312, 162.36709594726562, 171.15872192382812, 179.95033264160156, 188.74195861816406, 197.53358459472656, 206.32521057128906, 215.11683654785156, 223.90846252441406, 232.7000732421875, 241.49169921875, 250.2833251953125, 259.074951171875, 267.8665771484375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 7.0, 12.0, 17.0, 30.0, 48.0, 98.0, 156.0, 296.0, 568.0, 1147.0, 3307.0, 18149.0, 4086182.0, 74239.0, 6545.0, 1804.0, 809.0, 385.0, 163.0, 102.0, 58.0, 55.0, 31.0, 14.0, 9.0, 10.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.625, -195.57421875, -188.5234375, -181.47265625, -174.421875, -167.37109375, -160.3203125, -153.26953125, -146.21875, -139.16796875, -132.1171875, -125.06640625, -118.015625, -110.96484375, -103.9140625, -96.86328125, -89.8125, -82.76171875, -75.7109375, -68.66015625, -61.609375, -54.55859375, -47.5078125, -40.45703125, -33.40625, -26.35546875, -19.3046875, -12.25390625, -5.203125, 1.84765625, 8.8984375, 15.94921875, 23.0, 30.05078125, 37.1015625, 44.15234375, 51.203125, 58.25390625, 65.3046875, 72.35546875, 79.40625, 86.45703125, 93.5078125, 100.55859375, 107.609375, 114.66015625, 121.7109375, 128.76171875, 135.8125, 142.86328125, 149.9140625, 156.96484375, 164.015625, 171.06640625, 178.1171875, 185.16796875, 192.21875, 199.26953125, 206.3203125, 213.37109375, 220.421875, 227.47265625, 234.5234375, 241.57421875, 248.625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 7.0, 6.0, 9.0, 14.0, 12.0, 21.0, 16.0, 27.0, 41.0, 38.0, 37.0, 41.0, 42.0, 44.0, 48.0, 50.0, 61.0, 60.0, 63.0, 57.0, 40.0, 41.0, 47.0, 37.0, 25.0, 19.0, 12.0, 22.0, 14.0, 15.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.546875, -12.085205078125, -11.62353515625, -11.161865234375, -10.7001953125, -10.238525390625, -9.77685546875, -9.315185546875, -8.853515625, -8.391845703125, -7.93017578125, -7.468505859375, -7.0068359375, -6.545166015625, -6.08349609375, -5.621826171875, -5.16015625, -4.698486328125, -4.23681640625, -3.775146484375, -3.3134765625, -2.851806640625, -2.39013671875, -1.928466796875, -1.466796875, -1.005126953125, -0.54345703125, -0.081787109375, 0.3798828125, 0.841552734375, 1.30322265625, 1.764892578125, 2.2265625, 2.688232421875, 3.14990234375, 3.611572265625, 4.0732421875, 4.534912109375, 4.99658203125, 5.458251953125, 5.919921875, 6.381591796875, 6.84326171875, 7.304931640625, 7.7666015625, 8.228271484375, 8.68994140625, 9.151611328125, 9.61328125, 10.074951171875, 10.53662109375, 10.998291015625, 11.4599609375, 11.921630859375, 12.38330078125, 12.844970703125, 13.306640625, 13.768310546875, 14.22998046875, 14.691650390625, 15.1533203125, 15.614990234375, 16.07666015625, 16.538330078125, 17.0]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 16.0, 13.0, 23.0, 21.0, 37.0, 48.0, 59.0, 102.0, 157.0, 230.0, 392.0, 712.0, 1092.0, 2220.0, 5357.0, 17117.0, 131744.0, 3966147.0, 50199.0, 10499.0, 3873.0, 1727.0, 978.0, 580.0, 317.0, 185.0, 136.0, 99.0, 62.0, 39.0, 32.0, 11.0, 17.0, 7.0, 8.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-112.8125, -109.6181640625, -106.423828125, -103.2294921875, -100.03515625, -96.8408203125, -93.646484375, -90.4521484375, -87.2578125, -84.0634765625, -80.869140625, -77.6748046875, -74.48046875, -71.2861328125, -68.091796875, -64.8974609375, -61.703125, -58.5087890625, -55.314453125, -52.1201171875, -48.92578125, -45.7314453125, -42.537109375, -39.3427734375, -36.1484375, -32.9541015625, -29.759765625, -26.5654296875, -23.37109375, -20.1767578125, -16.982421875, -13.7880859375, -10.59375, -7.3994140625, -4.205078125, -1.0107421875, 2.18359375, 5.3779296875, 8.572265625, 11.7666015625, 14.9609375, 18.1552734375, 21.349609375, 24.5439453125, 27.73828125, 30.9326171875, 34.126953125, 37.3212890625, 40.515625, 43.7099609375, 46.904296875, 50.0986328125, 53.29296875, 56.4873046875, 59.681640625, 62.8759765625, 66.0703125, 69.2646484375, 72.458984375, 75.6533203125, 78.84765625, 82.0419921875, 85.236328125, 88.4306640625, 91.625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 10.0, 21.0, 25.0, 43.0, 100.0, 288.0, 3262.0, 174.0, 63.0, 24.0, 14.0, 15.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.703125, -23.067626953125, -22.43212890625, -21.796630859375, -21.1611328125, -20.525634765625, -19.89013671875, -19.254638671875, -18.619140625, -17.983642578125, -17.34814453125, -16.712646484375, -16.0771484375, -15.441650390625, -14.80615234375, -14.170654296875, -13.53515625, -12.899658203125, -12.26416015625, -11.628662109375, -10.9931640625, -10.357666015625, -9.72216796875, -9.086669921875, -8.451171875, -7.815673828125, -7.18017578125, -6.544677734375, -5.9091796875, -5.273681640625, -4.63818359375, -4.002685546875, -3.3671875, -2.731689453125, -2.09619140625, -1.460693359375, -0.8251953125, -0.189697265625, 0.44580078125, 1.081298828125, 1.716796875, 2.352294921875, 2.98779296875, 3.623291015625, 4.2587890625, 4.894287109375, 5.52978515625, 6.165283203125, 6.80078125, 7.436279296875, 8.07177734375, 8.707275390625, 9.3427734375, 9.978271484375, 10.61376953125, 11.249267578125, 11.884765625, 12.520263671875, 13.15576171875, 13.791259765625, 14.4267578125, 15.062255859375, 15.69775390625, 16.333251953125, 16.96875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 13.0, 14.0, 33.0, 32.0, 57.0, 58.0, 81.0, 105.0, 133.0, 102.0, 93.0, 84.0, 62.0, 43.0, 21.0, 19.0, 16.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.64203643798828, -61.530479431152344, -59.418922424316406, -57.30736541748047, -55.19580841064453, -53.084251403808594, -50.972694396972656, -48.86113739013672, -46.74958038330078, -44.638023376464844, -42.526466369628906, -40.41490936279297, -38.30335235595703, -36.191795349121094, -34.080238342285156, -31.96868133544922, -29.85712432861328, -27.745567321777344, -25.634010314941406, -23.52245330810547, -21.41089630126953, -19.299339294433594, -17.187782287597656, -15.076225280761719, -12.964668273925781, -10.853111267089844, -8.741554260253906, -6.629997253417969, -4.518440246582031, -2.4068832397460938, -0.29532623291015625, 1.8162307739257812, 3.9277801513671875, 6.039337158203125, 8.150894165039062, 10.262451171875, 12.374008178710938, 14.485565185546875, 16.597122192382812, 18.70867919921875, 20.820236206054688, 22.931793212890625, 25.043350219726562, 27.1549072265625, 29.266464233398438, 31.378021240234375, 33.48957824707031, 35.60113525390625, 37.71269226074219, 39.824249267578125, 41.93580627441406, 44.04736328125, 46.15892028808594, 48.270477294921875, 50.38203430175781, 52.49359130859375, 54.60514831542969, 56.716705322265625, 58.82826232910156, 60.9398193359375, 63.05137634277344, 65.16293334960938, 67.27449035644531, 69.38604736328125, 71.49760437011719]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 10.0, 7.0, 9.0, 4.0, 10.0, 19.0, 15.0, 22.0, 24.0, 29.0, 27.0, 29.0, 27.0, 31.0, 51.0, 41.0, 54.0, 59.0, 58.0, 42.0, 41.0, 38.0, 38.0, 36.0, 35.0, 35.0, 29.0, 26.0, 20.0, 22.0, 15.0, 16.0, 20.0, 10.0, 11.0, 8.0, 4.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.5850715637207, -35.49740219116211, -34.40972900390625, -33.322059631347656, -32.23439025878906, -31.146717071533203, -30.05904769897461, -28.971376419067383, -27.883705139160156, -26.79603385925293, -25.708362579345703, -24.62069320678711, -23.533021926879883, -22.445350646972656, -21.357681274414062, -20.270009994506836, -19.18233871459961, -18.094667434692383, -17.006996154785156, -15.919326782226562, -14.831655502319336, -13.74398422241211, -12.6563138961792, -11.568643569946289, -10.480972290039062, -9.393301010131836, -8.305630683898926, -7.217959880828857, -6.130289077758789, -5.042618274688721, -3.9549474716186523, -2.867276668548584, -1.77960205078125, -0.6919312477111816, 0.3957395553588867, 1.483410358428955, 2.5710811614990234, 3.658751964569092, 4.74642276763916, 5.8340935707092285, 6.921764373779297, 8.009435653686523, 9.097105979919434, 10.184776306152344, 11.27244758605957, 12.360118865966797, 13.447789192199707, 14.535459518432617, 15.623130798339844, 16.71080207824707, 17.798473358154297, 18.88614273071289, 19.973814010620117, 21.061485290527344, 22.149154663085938, 23.236825942993164, 24.32449722290039, 25.412168502807617, 26.499839782714844, 27.587509155273438, 28.675180435180664, 29.76285171508789, 30.850521087646484, 31.93819236755371, 33.02586364746094]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 10.0, 9.0, 10.0, 17.0, 31.0, 38.0, 67.0, 93.0, 163.0, 228.0, 392.0, 822.0, 1602.0, 3762.0, 9365.0, 25503.0, 71721.0, 190532.0, 348573.0, 243277.0, 95801.0, 34591.0, 12687.0, 4898.0, 2060.0, 997.0, 524.0, 273.0, 180.0, 119.0, 76.0, 43.0, 27.0, 21.0, 11.0, 9.0, 9.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-59.9375, -58.20751953125, -56.4775390625, -54.74755859375, -53.017578125, -51.28759765625, -49.5576171875, -47.82763671875, -46.09765625, -44.36767578125, -42.6376953125, -40.90771484375, -39.177734375, -37.44775390625, -35.7177734375, -33.98779296875, -32.2578125, -30.52783203125, -28.7978515625, -27.06787109375, -25.337890625, -23.60791015625, -21.8779296875, -20.14794921875, -18.41796875, -16.68798828125, -14.9580078125, -13.22802734375, -11.498046875, -9.76806640625, -8.0380859375, -6.30810546875, -4.578125, -2.84814453125, -1.1181640625, 0.61181640625, 2.341796875, 4.07177734375, 5.8017578125, 7.53173828125, 9.26171875, 10.99169921875, 12.7216796875, 14.45166015625, 16.181640625, 17.91162109375, 19.6416015625, 21.37158203125, 23.1015625, 24.83154296875, 26.5615234375, 28.29150390625, 30.021484375, 31.75146484375, 33.4814453125, 35.21142578125, 36.94140625, 38.67138671875, 40.4013671875, 42.13134765625, 43.861328125, 45.59130859375, 47.3212890625, 49.05126953125, 50.78125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 3.0, 9.0, 5.0, 7.0, 13.0, 20.0, 24.0, 14.0, 22.0, 27.0, 33.0, 33.0, 41.0, 32.0, 40.0, 49.0, 55.0, 51.0, 60.0, 55.0, 48.0, 36.0, 54.0, 50.0, 34.0, 35.0, 31.0, 24.0, 16.0, 14.0, 9.0, 14.0, 8.0, 5.0, 7.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.4676513671875, -11.989990234375, -11.5123291015625, -11.03466796875, -10.5570068359375, -10.079345703125, -9.6016845703125, -9.1240234375, -8.6463623046875, -8.168701171875, -7.6910400390625, -7.21337890625, -6.7357177734375, -6.258056640625, -5.7803955078125, -5.302734375, -4.8250732421875, -4.347412109375, -3.8697509765625, -3.39208984375, -2.9144287109375, -2.436767578125, -1.9591064453125, -1.4814453125, -1.0037841796875, -0.526123046875, -0.0484619140625, 0.42919921875, 0.9068603515625, 1.384521484375, 1.8621826171875, 2.33984375, 2.8175048828125, 3.295166015625, 3.7728271484375, 4.25048828125, 4.7281494140625, 5.205810546875, 5.6834716796875, 6.1611328125, 6.6387939453125, 7.116455078125, 7.5941162109375, 8.07177734375, 8.5494384765625, 9.027099609375, 9.5047607421875, 9.982421875, 10.4600830078125, 10.937744140625, 11.4154052734375, 11.89306640625, 12.3707275390625, 12.848388671875, 13.3260498046875, 13.8037109375, 14.2813720703125, 14.759033203125, 15.2366943359375, 15.71435546875, 16.1920166015625, 16.669677734375, 17.1473388671875, 17.625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 10.0, 11.0, 13.0, 21.0, 21.0, 28.0, 35.0, 46.0, 67.0, 95.0, 117.0, 177.0, 219.0, 281.0, 368.0, 594.0, 963.0, 1612.0, 3123.0, 6941.0, 19039.0, 53093.0, 153035.0, 374738.0, 275705.0, 99917.0, 34515.0, 12408.0, 5114.0, 2329.0, 1246.0, 739.0, 507.0, 327.0, 255.0, 235.0, 136.0, 127.0, 91.0, 71.0, 54.0, 36.0, 21.0, 24.0, 19.0, 5.0, 6.0, 8.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0], "bins": [-49.34375, -47.8837890625, -46.423828125, -44.9638671875, -43.50390625, -42.0439453125, -40.583984375, -39.1240234375, -37.6640625, -36.2041015625, -34.744140625, -33.2841796875, -31.82421875, -30.3642578125, -28.904296875, -27.4443359375, -25.984375, -24.5244140625, -23.064453125, -21.6044921875, -20.14453125, -18.6845703125, -17.224609375, -15.7646484375, -14.3046875, -12.8447265625, -11.384765625, -9.9248046875, -8.46484375, -7.0048828125, -5.544921875, -4.0849609375, -2.625, -1.1650390625, 0.294921875, 1.7548828125, 3.21484375, 4.6748046875, 6.134765625, 7.5947265625, 9.0546875, 10.5146484375, 11.974609375, 13.4345703125, 14.89453125, 16.3544921875, 17.814453125, 19.2744140625, 20.734375, 22.1943359375, 23.654296875, 25.1142578125, 26.57421875, 28.0341796875, 29.494140625, 30.9541015625, 32.4140625, 33.8740234375, 35.333984375, 36.7939453125, 38.25390625, 39.7138671875, 41.173828125, 42.6337890625, 44.09375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 8.0, 13.0, 10.0, 13.0, 13.0, 9.0, 20.0, 21.0, 30.0, 26.0, 34.0, 30.0, 40.0, 35.0, 25.0, 32.0, 29.0, 37.0, 41.0, 44.0, 36.0, 37.0, 34.0, 35.0, 28.0, 20.0, 31.0, 31.0, 23.0, 21.0, 24.0, 22.0, 17.0, 23.0, 16.0, 15.0, 10.0, 5.0, 8.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-52.03125, -50.40380859375, -48.7763671875, -47.14892578125, -45.521484375, -43.89404296875, -42.2666015625, -40.63916015625, -39.01171875, -37.38427734375, -35.7568359375, -34.12939453125, -32.501953125, -30.87451171875, -29.2470703125, -27.61962890625, -25.9921875, -24.36474609375, -22.7373046875, -21.10986328125, -19.482421875, -17.85498046875, -16.2275390625, -14.60009765625, -12.97265625, -11.34521484375, -9.7177734375, -8.09033203125, -6.462890625, -4.83544921875, -3.2080078125, -1.58056640625, 0.046875, 1.67431640625, 3.3017578125, 4.92919921875, 6.556640625, 8.18408203125, 9.8115234375, 11.43896484375, 13.06640625, 14.69384765625, 16.3212890625, 17.94873046875, 19.576171875, 21.20361328125, 22.8310546875, 24.45849609375, 26.0859375, 27.71337890625, 29.3408203125, 30.96826171875, 32.595703125, 34.22314453125, 35.8505859375, 37.47802734375, 39.10546875, 40.73291015625, 42.3603515625, 43.98779296875, 45.615234375, 47.24267578125, 48.8701171875, 50.49755859375, 52.125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 3.0, 2.0, 10.0, 10.0, 13.0, 27.0, 38.0, 47.0, 57.0, 107.0, 149.0, 238.0, 419.0, 715.0, 1321.0, 2767.0, 6402.0, 17974.0, 63972.0, 265515.0, 484956.0, 147132.0, 36528.0, 11342.0, 4240.0, 2043.0, 1018.0, 569.0, 296.0, 210.0, 141.0, 86.0, 53.0, 34.0, 37.0, 26.0, 17.0, 11.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.765625, -25.936767578125, -25.10791015625, -24.279052734375, -23.4501953125, -22.621337890625, -21.79248046875, -20.963623046875, -20.134765625, -19.305908203125, -18.47705078125, -17.648193359375, -16.8193359375, -15.990478515625, -15.16162109375, -14.332763671875, -13.50390625, -12.675048828125, -11.84619140625, -11.017333984375, -10.1884765625, -9.359619140625, -8.53076171875, -7.701904296875, -6.873046875, -6.044189453125, -5.21533203125, -4.386474609375, -3.5576171875, -2.728759765625, -1.89990234375, -1.071044921875, -0.2421875, 0.586669921875, 1.41552734375, 2.244384765625, 3.0732421875, 3.902099609375, 4.73095703125, 5.559814453125, 6.388671875, 7.217529296875, 8.04638671875, 8.875244140625, 9.7041015625, 10.532958984375, 11.36181640625, 12.190673828125, 13.01953125, 13.848388671875, 14.67724609375, 15.506103515625, 16.3349609375, 17.163818359375, 17.99267578125, 18.821533203125, 19.650390625, 20.479248046875, 21.30810546875, 22.136962890625, 22.9658203125, 23.794677734375, 24.62353515625, 25.452392578125, 26.28125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 13.0, 19.0, 38.0, 52.0, 83.0, 120.0, 163.0, 148.0, 121.0, 80.0, 61.0, 34.0, 24.0, 12.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00685882568359375, -0.0066378116607666016, -0.006416797637939453, -0.006195783615112305, -0.005974769592285156, -0.005753755569458008, -0.005532741546630859, -0.005311727523803711, -0.0050907135009765625, -0.004869699478149414, -0.004648685455322266, -0.004427671432495117, -0.004206657409667969, -0.00398564338684082, -0.003764629364013672, -0.0035436153411865234, -0.003322601318359375, -0.0031015872955322266, -0.002880573272705078, -0.0026595592498779297, -0.0024385452270507812, -0.002217531204223633, -0.0019965171813964844, -0.001775503158569336, -0.0015544891357421875, -0.001333475112915039, -0.0011124610900878906, -0.0008914470672607422, -0.0006704330444335938, -0.0004494190216064453, -0.00022840499877929688, -7.3909759521484375e-06, 0.000213623046875, 0.00043463706970214844, 0.0006556510925292969, 0.0008766651153564453, 0.0010976791381835938, 0.0013186931610107422, 0.0015397071838378906, 0.001760721206665039, 0.0019817352294921875, 0.002202749252319336, 0.0024237632751464844, 0.002644777297973633, 0.0028657913208007812, 0.0030868053436279297, 0.003307819366455078, 0.0035288333892822266, 0.003749847412109375, 0.0039708614349365234, 0.004191875457763672, 0.00441288948059082, 0.004633903503417969, 0.004854917526245117, 0.005075931549072266, 0.005296945571899414, 0.0055179595947265625, 0.005738973617553711, 0.005959987640380859, 0.006181001663208008, 0.006402015686035156, 0.006623029708862305, 0.006844043731689453, 0.0070650577545166016, 0.00728607177734375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 4.0, 12.0, 12.0, 32.0, 47.0, 65.0, 133.0, 191.0, 364.0, 799.0, 1785.0, 5458.0, 25847.0, 249870.0, 668868.0, 77915.0, 11681.0, 3074.0, 1164.0, 557.0, 265.0, 150.0, 105.0, 58.0, 34.0, 18.0, 14.0, 13.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.34375, -47.8603515625, -46.376953125, -44.8935546875, -43.41015625, -41.9267578125, -40.443359375, -38.9599609375, -37.4765625, -35.9931640625, -34.509765625, -33.0263671875, -31.54296875, -30.0595703125, -28.576171875, -27.0927734375, -25.609375, -24.1259765625, -22.642578125, -21.1591796875, -19.67578125, -18.1923828125, -16.708984375, -15.2255859375, -13.7421875, -12.2587890625, -10.775390625, -9.2919921875, -7.80859375, -6.3251953125, -4.841796875, -3.3583984375, -1.875, -0.3916015625, 1.091796875, 2.5751953125, 4.05859375, 5.5419921875, 7.025390625, 8.5087890625, 9.9921875, 11.4755859375, 12.958984375, 14.4423828125, 15.92578125, 17.4091796875, 18.892578125, 20.3759765625, 21.859375, 23.3427734375, 24.826171875, 26.3095703125, 27.79296875, 29.2763671875, 30.759765625, 32.2431640625, 33.7265625, 35.2099609375, 36.693359375, 38.1767578125, 39.66015625, 41.1435546875, 42.626953125, 44.1103515625, 45.59375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 5.0, 10.0, 8.0, 13.0, 21.0, 23.0, 23.0, 46.0, 59.0, 47.0, 80.0, 75.0, 85.0, 85.0, 87.0, 65.0, 58.0, 41.0, 34.0, 23.0, 23.0, 14.0, 12.0, 11.0, 5.0, 5.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.5625, -30.628662109375, -29.69482421875, -28.760986328125, -27.8271484375, -26.893310546875, -25.95947265625, -25.025634765625, -24.091796875, -23.157958984375, -22.22412109375, -21.290283203125, -20.3564453125, -19.422607421875, -18.48876953125, -17.554931640625, -16.62109375, -15.687255859375, -14.75341796875, -13.819580078125, -12.8857421875, -11.951904296875, -11.01806640625, -10.084228515625, -9.150390625, -8.216552734375, -7.28271484375, -6.348876953125, -5.4150390625, -4.481201171875, -3.54736328125, -2.613525390625, -1.6796875, -0.745849609375, 0.18798828125, 1.121826171875, 2.0556640625, 2.989501953125, 3.92333984375, 4.857177734375, 5.791015625, 6.724853515625, 7.65869140625, 8.592529296875, 9.5263671875, 10.460205078125, 11.39404296875, 12.327880859375, 13.26171875, 14.195556640625, 15.12939453125, 16.063232421875, 16.9970703125, 17.930908203125, 18.86474609375, 19.798583984375, 20.732421875, 21.666259765625, 22.60009765625, 23.533935546875, 24.4677734375, 25.401611328125, 26.33544921875, 27.269287109375, 28.203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 11.0, 18.0, 40.0, 124.0, 225.0, 253.0, 184.0, 93.0, 40.0, 11.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-927.5210571289062, -892.4483642578125, -857.3756103515625, -822.3028564453125, -787.2301635742188, -752.157470703125, -717.084716796875, -682.011962890625, -646.9392700195312, -611.8665771484375, -576.7938232421875, -541.7210693359375, -506.64837646484375, -471.5756530761719, -436.5029296875, -401.4302062988281, -366.35748291015625, -331.2847595214844, -296.2120361328125, -261.1393127441406, -226.06658935546875, -190.99386596679688, -155.921142578125, -120.84841918945312, -85.77569580078125, -50.702972412109375, -15.6302490234375, 19.442474365234375, 54.51519775390625, 89.58792114257812, 124.66064453125, 159.73336791992188, 194.8060302734375, 229.87875366210938, 264.95147705078125, 300.0242004394531, 335.096923828125, 370.1696472167969, 405.24237060546875, 440.3150939941406, 475.3878173828125, 510.4605407714844, 545.5332641601562, 580.60595703125, 615.6787109375, 650.75146484375, 685.8241577148438, 720.8968505859375, 755.9696044921875, 791.0423583984375, 826.1150512695312, 861.187744140625, 896.260498046875, 931.333251953125, 966.4059448242188, 1001.4786376953125, 1036.5513916015625, 1071.6241455078125, 1106.69677734375, 1141.76953125, 1176.84228515625, 1211.9150390625, 1246.98779296875, 1282.0604248046875, 1317.1331787109375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 0.0, 7.0, 6.0, 14.0, 14.0, 17.0, 18.0, 17.0, 14.0, 22.0, 27.0, 29.0, 31.0, 35.0, 38.0, 36.0, 31.0, 44.0, 58.0, 63.0, 45.0, 42.0, 35.0, 59.0, 51.0, 44.0, 26.0, 27.0, 25.0, 17.0, 20.0, 19.0, 13.0, 11.0, 8.0, 11.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-339.6788330078125, -329.2286376953125, -318.7784423828125, -308.3282165527344, -297.8780212402344, -287.4278259277344, -276.9776306152344, -266.5274353027344, -256.07720947265625, -245.62701416015625, -235.1768035888672, -224.7266082763672, -214.27639770507812, -203.82620239257812, -193.37600708007812, -182.92581176757812, -172.47561645507812, -162.02542114257812, -151.57521057128906, -141.12501525878906, -130.6748046875, -120.224609375, -109.7744140625, -99.32421112060547, -88.87400817871094, -78.4238052368164, -67.97360229492188, -57.523406982421875, -47.073204040527344, -36.62300109863281, -26.172801971435547, -15.722602844238281, -5.27239990234375, 5.177801132202148, 15.628002166748047, 26.078203201293945, 36.528404235839844, 46.978607177734375, 57.42880630493164, 67.8790054321289, 78.32920837402344, 88.77941131591797, 99.2296142578125, 109.6798095703125, 120.13001251220703, 130.58021545410156, 141.03041076660156, 151.48062133789062, 161.93081665039062, 172.38101196289062, 182.8312225341797, 193.2814178466797, 203.73162841796875, 214.18182373046875, 224.63201904296875, 235.08221435546875, 245.5324249267578, 255.9826202392578, 266.4328308105469, 276.8830261230469, 287.3332214355469, 297.783447265625, 308.233642578125, 318.683837890625, 329.134033203125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 12.0, 25.0, 30.0, 58.0, 106.0, 188.0, 492.0, 1811.0, 9583.0, 230764.0, 3935103.0, 12721.0, 2278.0, 613.0, 224.0, 114.0, 63.0, 37.0, 19.0, 8.0, 6.0, 3.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.875, -161.134765625, -155.39453125, -149.654296875, -143.9140625, -138.173828125, -132.43359375, -126.693359375, -120.953125, -115.212890625, -109.47265625, -103.732421875, -97.9921875, -92.251953125, -86.51171875, -80.771484375, -75.03125, -69.291015625, -63.55078125, -57.810546875, -52.0703125, -46.330078125, -40.58984375, -34.849609375, -29.109375, -23.369140625, -17.62890625, -11.888671875, -6.1484375, -0.408203125, 5.33203125, 11.072265625, 16.8125, 22.552734375, 28.29296875, 34.033203125, 39.7734375, 45.513671875, 51.25390625, 56.994140625, 62.734375, 68.474609375, 74.21484375, 79.955078125, 85.6953125, 91.435546875, 97.17578125, 102.916015625, 108.65625, 114.396484375, 120.13671875, 125.876953125, 131.6171875, 137.357421875, 143.09765625, 148.837890625, 154.578125, 160.318359375, 166.05859375, 171.798828125, 177.5390625, 183.279296875, 189.01953125, 194.759765625, 200.5]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 3.0, 7.0, 9.0, 14.0, 12.0, 16.0, 20.0, 22.0, 27.0, 28.0, 43.0, 35.0, 45.0, 48.0, 53.0, 60.0, 42.0, 54.0, 50.0, 48.0, 48.0, 47.0, 45.0, 39.0, 33.0, 22.0, 25.0, 27.0, 17.0, 12.0, 6.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7578125, -14.2510986328125, -13.744384765625, -13.2376708984375, -12.73095703125, -12.2242431640625, -11.717529296875, -11.2108154296875, -10.7041015625, -10.1973876953125, -9.690673828125, -9.1839599609375, -8.67724609375, -8.1705322265625, -7.663818359375, -7.1571044921875, -6.650390625, -6.1436767578125, -5.636962890625, -5.1302490234375, -4.62353515625, -4.1168212890625, -3.610107421875, -3.1033935546875, -2.5966796875, -2.0899658203125, -1.583251953125, -1.0765380859375, -0.56982421875, -0.0631103515625, 0.443603515625, 0.9503173828125, 1.45703125, 1.9637451171875, 2.470458984375, 2.9771728515625, 3.48388671875, 3.9906005859375, 4.497314453125, 5.0040283203125, 5.5107421875, 6.0174560546875, 6.524169921875, 7.0308837890625, 7.53759765625, 8.0443115234375, 8.551025390625, 9.0577392578125, 9.564453125, 10.0711669921875, 10.577880859375, 11.0845947265625, 11.59130859375, 12.0980224609375, 12.604736328125, 13.1114501953125, 13.6181640625, 14.1248779296875, 14.631591796875, 15.1383056640625, 15.64501953125, 16.1517333984375, 16.658447265625, 17.1651611328125, 17.671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 6.0, 17.0, 16.0, 19.0, 30.0, 43.0, 57.0, 66.0, 98.0, 156.0, 174.0, 281.0, 373.0, 503.0, 791.0, 1202.0, 1784.0, 2762.0, 4507.0, 7988.0, 15524.0, 37854.0, 146286.0, 3755257.0, 144818.0, 37586.0, 15455.0, 7846.0, 4339.0, 2707.0, 1814.0, 1227.0, 813.0, 523.0, 374.0, 241.0, 215.0, 139.0, 84.0, 73.0, 54.0, 36.0, 41.0, 18.0, 25.0, 24.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-42.1875, -40.80419921875, -39.4208984375, -38.03759765625, -36.654296875, -35.27099609375, -33.8876953125, -32.50439453125, -31.12109375, -29.73779296875, -28.3544921875, -26.97119140625, -25.587890625, -24.20458984375, -22.8212890625, -21.43798828125, -20.0546875, -18.67138671875, -17.2880859375, -15.90478515625, -14.521484375, -13.13818359375, -11.7548828125, -10.37158203125, -8.98828125, -7.60498046875, -6.2216796875, -4.83837890625, -3.455078125, -2.07177734375, -0.6884765625, 0.69482421875, 2.078125, 3.46142578125, 4.8447265625, 6.22802734375, 7.611328125, 8.99462890625, 10.3779296875, 11.76123046875, 13.14453125, 14.52783203125, 15.9111328125, 17.29443359375, 18.677734375, 20.06103515625, 21.4443359375, 22.82763671875, 24.2109375, 25.59423828125, 26.9775390625, 28.36083984375, 29.744140625, 31.12744140625, 32.5107421875, 33.89404296875, 35.27734375, 36.66064453125, 38.0439453125, 39.42724609375, 40.810546875, 42.19384765625, 43.5771484375, 44.96044921875, 46.34375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 5.0, 8.0, 7.0, 8.0, 24.0, 32.0, 42.0, 58.0, 166.0, 2757.0, 580.0, 135.0, 74.0, 33.0, 33.0, 21.0, 12.0, 8.0, 12.0, 14.0, 4.0, 6.0, 5.0, 6.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8515625, -13.417724609375, -12.98388671875, -12.550048828125, -12.1162109375, -11.682373046875, -11.24853515625, -10.814697265625, -10.380859375, -9.947021484375, -9.51318359375, -9.079345703125, -8.6455078125, -8.211669921875, -7.77783203125, -7.343994140625, -6.91015625, -6.476318359375, -6.04248046875, -5.608642578125, -5.1748046875, -4.740966796875, -4.30712890625, -3.873291015625, -3.439453125, -3.005615234375, -2.57177734375, -2.137939453125, -1.7041015625, -1.270263671875, -0.83642578125, -0.402587890625, 0.03125, 0.465087890625, 0.89892578125, 1.332763671875, 1.7666015625, 2.200439453125, 2.63427734375, 3.068115234375, 3.501953125, 3.935791015625, 4.36962890625, 4.803466796875, 5.2373046875, 5.671142578125, 6.10498046875, 6.538818359375, 6.97265625, 7.406494140625, 7.84033203125, 8.274169921875, 8.7080078125, 9.141845703125, 9.57568359375, 10.009521484375, 10.443359375, 10.877197265625, 11.31103515625, 11.744873046875, 12.1787109375, 12.612548828125, 13.04638671875, 13.480224609375, 13.9140625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 3.0, 13.0, 11.0, 24.0, 33.0, 65.0, 72.0, 93.0, 99.0, 128.0, 113.0, 74.0, 78.0, 59.0, 39.0, 33.0, 19.0, 11.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.242706298828125, -53.68707275390625, -51.13143539428711, -48.575801849365234, -46.020164489746094, -43.46453094482422, -40.908897399902344, -38.35326385498047, -35.79762649536133, -33.24199295043945, -30.686355590820312, -28.130722045898438, -25.57508659362793, -23.019451141357422, -20.463817596435547, -17.90818214416504, -15.352546691894531, -12.796911239624023, -10.241276741027832, -7.685641765594482, -5.130006790161133, -2.574371337890625, -0.018736839294433594, 2.536897659301758, 5.092533111572266, 7.648168087005615, 10.203803062438965, 12.759437561035156, 15.315073013305664, 17.870708465576172, 20.426342010498047, 22.981977462768555, 25.537612915039062, 28.09324836730957, 30.648883819580078, 33.20451736450195, 35.760154724121094, 38.31578826904297, 40.871421813964844, 43.42705535888672, 45.98269271850586, 48.538326263427734, 51.093963623046875, 53.64959716796875, 56.205230712890625, 58.760868072509766, 61.31650161743164, 63.87213897705078, 66.42777252197266, 68.98340606689453, 71.5390396118164, 74.09468078613281, 76.65031433105469, 79.20594787597656, 81.76158142089844, 84.31721496582031, 86.87284851074219, 89.42848205566406, 91.98411560058594, 94.53975677490234, 97.09539031982422, 99.6510238647461, 102.20665740966797, 104.76229095458984, 107.31793212890625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 4.0, 10.0, 10.0, 14.0, 15.0, 19.0, 24.0, 21.0, 23.0, 40.0, 36.0, 34.0, 31.0, 36.0, 38.0, 28.0, 30.0, 41.0, 37.0, 38.0, 41.0, 36.0, 38.0, 39.0, 36.0, 28.0, 36.0, 32.0, 27.0, 21.0, 21.0, 17.0, 15.0, 18.0, 12.0, 10.0, 5.0, 3.0, 8.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.32070541381836, -37.068180084228516, -35.81565475463867, -34.56312561035156, -33.31060028076172, -32.058074951171875, -30.80554962158203, -29.553022384643555, -28.300495147705078, -27.047969818115234, -25.795442581176758, -24.542917251586914, -23.290390014648438, -22.037864685058594, -20.78533935546875, -19.532812118530273, -18.28028678894043, -17.027761459350586, -15.77523422241211, -14.522708892822266, -13.270181655883789, -12.017656326293945, -10.765130043029785, -9.512603759765625, -8.260077476501465, -7.007551193237305, -5.7550249099731445, -4.502499103546143, -3.2499728202819824, -1.9974465370178223, -0.7449207305908203, 0.5076055526733398, 1.7601318359375, 3.01265811920166, 4.26518440246582, 5.517710208892822, 6.770236492156982, 8.022762298583984, 9.275288581848145, 10.527814865112305, 11.780341148376465, 13.032867431640625, 14.285393714904785, 15.537919998168945, 16.79044532775879, 18.042972564697266, 19.29549789428711, 20.548023223876953, 21.80055046081543, 23.053075790405273, 24.30560302734375, 25.558128356933594, 26.81065559387207, 28.063180923461914, 29.31570816040039, 30.568233489990234, 31.820758819580078, 33.07328414916992, 34.325809478759766, 35.578338623046875, 36.83086395263672, 38.08338928222656, 39.335914611816406, 40.58843994140625, 41.84096908569336]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 6.0, 2.0, 9.0, 10.0, 25.0, 32.0, 42.0, 59.0, 101.0, 166.0, 285.0, 497.0, 924.0, 1927.0, 4163.0, 9613.0, 25535.0, 69676.0, 190384.0, 338799.0, 248888.0, 98783.0, 35308.0, 12871.0, 5384.0, 2445.0, 1216.0, 567.0, 334.0, 165.0, 114.0, 59.0, 47.0, 39.0, 31.0, 14.0, 12.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.65625, -42.1845703125, -40.712890625, -39.2412109375, -37.76953125, -36.2978515625, -34.826171875, -33.3544921875, -31.8828125, -30.4111328125, -28.939453125, -27.4677734375, -25.99609375, -24.5244140625, -23.052734375, -21.5810546875, -20.109375, -18.6376953125, -17.166015625, -15.6943359375, -14.22265625, -12.7509765625, -11.279296875, -9.8076171875, -8.3359375, -6.8642578125, -5.392578125, -3.9208984375, -2.44921875, -0.9775390625, 0.494140625, 1.9658203125, 3.4375, 4.9091796875, 6.380859375, 7.8525390625, 9.32421875, 10.7958984375, 12.267578125, 13.7392578125, 15.2109375, 16.6826171875, 18.154296875, 19.6259765625, 21.09765625, 22.5693359375, 24.041015625, 25.5126953125, 26.984375, 28.4560546875, 29.927734375, 31.3994140625, 32.87109375, 34.3427734375, 35.814453125, 37.2861328125, 38.7578125, 40.2294921875, 41.701171875, 43.1728515625, 44.64453125, 46.1162109375, 47.587890625, 49.0595703125, 50.53125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 5.0, 6.0, 8.0, 11.0, 9.0, 12.0, 23.0, 22.0, 26.0, 32.0, 32.0, 40.0, 45.0, 44.0, 50.0, 48.0, 49.0, 56.0, 56.0, 35.0, 41.0, 40.0, 55.0, 42.0, 34.0, 30.0, 25.0, 28.0, 13.0, 9.0, 10.0, 9.0, 11.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.3046875, -14.7872314453125, -14.269775390625, -13.7523193359375, -13.23486328125, -12.7174072265625, -12.199951171875, -11.6824951171875, -11.1650390625, -10.6475830078125, -10.130126953125, -9.6126708984375, -9.09521484375, -8.5777587890625, -8.060302734375, -7.5428466796875, -7.025390625, -6.5079345703125, -5.990478515625, -5.4730224609375, -4.95556640625, -4.4381103515625, -3.920654296875, -3.4031982421875, -2.8857421875, -2.3682861328125, -1.850830078125, -1.3333740234375, -0.81591796875, -0.2984619140625, 0.218994140625, 0.7364501953125, 1.25390625, 1.7713623046875, 2.288818359375, 2.8062744140625, 3.32373046875, 3.8411865234375, 4.358642578125, 4.8760986328125, 5.3935546875, 5.9110107421875, 6.428466796875, 6.9459228515625, 7.46337890625, 7.9808349609375, 8.498291015625, 9.0157470703125, 9.533203125, 10.0506591796875, 10.568115234375, 11.0855712890625, 11.60302734375, 12.1204833984375, 12.637939453125, 13.1553955078125, 13.6728515625, 14.1903076171875, 14.707763671875, 15.2252197265625, 15.74267578125, 16.2601318359375, 16.777587890625, 17.2950439453125, 17.8125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 9.0, 11.0, 18.0, 19.0, 23.0, 32.0, 47.0, 68.0, 112.0, 116.0, 155.0, 222.0, 292.0, 444.0, 646.0, 937.0, 1565.0, 2975.0, 7065.0, 21924.0, 84508.0, 336573.0, 425987.0, 117560.0, 29469.0, 8975.0, 3619.0, 1781.0, 980.0, 687.0, 458.0, 324.0, 263.0, 173.0, 130.0, 84.0, 68.0, 56.0, 46.0, 29.0, 26.0, 21.0, 18.0, 5.0, 7.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-57.71875, -56.02685546875, -54.3349609375, -52.64306640625, -50.951171875, -49.25927734375, -47.5673828125, -45.87548828125, -44.18359375, -42.49169921875, -40.7998046875, -39.10791015625, -37.416015625, -35.72412109375, -34.0322265625, -32.34033203125, -30.6484375, -28.95654296875, -27.2646484375, -25.57275390625, -23.880859375, -22.18896484375, -20.4970703125, -18.80517578125, -17.11328125, -15.42138671875, -13.7294921875, -12.03759765625, -10.345703125, -8.65380859375, -6.9619140625, -5.27001953125, -3.578125, -1.88623046875, -0.1943359375, 1.49755859375, 3.189453125, 4.88134765625, 6.5732421875, 8.26513671875, 9.95703125, 11.64892578125, 13.3408203125, 15.03271484375, 16.724609375, 18.41650390625, 20.1083984375, 21.80029296875, 23.4921875, 25.18408203125, 26.8759765625, 28.56787109375, 30.259765625, 31.95166015625, 33.6435546875, 35.33544921875, 37.02734375, 38.71923828125, 40.4111328125, 42.10302734375, 43.794921875, 45.48681640625, 47.1787109375, 48.87060546875, 50.5625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 8.0, 15.0, 13.0, 17.0, 26.0, 27.0, 29.0, 22.0, 34.0, 46.0, 35.0, 53.0, 49.0, 41.0, 54.0, 49.0, 28.0, 42.0, 60.0, 47.0, 51.0, 25.0, 33.0, 25.0, 26.0, 24.0, 19.0, 13.0, 23.0, 10.0, 12.0, 7.0, 2.0, 10.0, 3.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.1875, -71.953125, -69.71875, -67.484375, -65.25, -63.015625, -60.78125, -58.546875, -56.3125, -54.078125, -51.84375, -49.609375, -47.375, -45.140625, -42.90625, -40.671875, -38.4375, -36.203125, -33.96875, -31.734375, -29.5, -27.265625, -25.03125, -22.796875, -20.5625, -18.328125, -16.09375, -13.859375, -11.625, -9.390625, -7.15625, -4.921875, -2.6875, -0.453125, 1.78125, 4.015625, 6.25, 8.484375, 10.71875, 12.953125, 15.1875, 17.421875, 19.65625, 21.890625, 24.125, 26.359375, 28.59375, 30.828125, 33.0625, 35.296875, 37.53125, 39.765625, 42.0, 44.234375, 46.46875, 48.703125, 50.9375, 53.171875, 55.40625, 57.640625, 59.875, 62.109375, 64.34375, 66.578125, 68.8125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 7.0, 11.0, 11.0, 22.0, 21.0, 56.0, 60.0, 86.0, 145.0, 222.0, 368.0, 575.0, 1029.0, 2002.0, 4395.0, 12061.0, 46392.0, 244882.0, 557161.0, 135381.0, 28356.0, 8300.0, 3312.0, 1487.0, 863.0, 493.0, 278.0, 181.0, 117.0, 81.0, 49.0, 32.0, 33.0, 17.0, 13.0, 11.0, 7.0, 6.0, 7.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.921875, -25.094482421875, -24.26708984375, -23.439697265625, -22.6123046875, -21.784912109375, -20.95751953125, -20.130126953125, -19.302734375, -18.475341796875, -17.64794921875, -16.820556640625, -15.9931640625, -15.165771484375, -14.33837890625, -13.510986328125, -12.68359375, -11.856201171875, -11.02880859375, -10.201416015625, -9.3740234375, -8.546630859375, -7.71923828125, -6.891845703125, -6.064453125, -5.237060546875, -4.40966796875, -3.582275390625, -2.7548828125, -1.927490234375, -1.10009765625, -0.272705078125, 0.5546875, 1.382080078125, 2.20947265625, 3.036865234375, 3.8642578125, 4.691650390625, 5.51904296875, 6.346435546875, 7.173828125, 8.001220703125, 8.82861328125, 9.656005859375, 10.4833984375, 11.310791015625, 12.13818359375, 12.965576171875, 13.79296875, 14.620361328125, 15.44775390625, 16.275146484375, 17.1025390625, 17.929931640625, 18.75732421875, 19.584716796875, 20.412109375, 21.239501953125, 22.06689453125, 22.894287109375, 23.7216796875, 24.549072265625, 25.37646484375, 26.203857421875, 27.03125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 4.0, 5.0, 9.0, 10.0, 13.0, 18.0, 21.0, 29.0, 29.0, 37.0, 49.0, 54.0, 56.0, 71.0, 94.0, 85.0, 67.0, 60.0, 51.0, 42.0, 33.0, 27.0, 28.0, 17.0, 19.0, 11.0, 6.0, 8.0, 3.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.003204345703125, -0.003092348575592041, -0.002980351448059082, -0.002868354320526123, -0.002756357192993164, -0.002644360065460205, -0.002532362937927246, -0.002420365810394287, -0.002308368682861328, -0.002196371555328369, -0.00208437442779541, -0.001972377300262451, -0.0018603801727294922, -0.0017483830451965332, -0.0016363859176635742, -0.0015243887901306152, -0.0014123916625976562, -0.0013003945350646973, -0.0011883974075317383, -0.0010764002799987793, -0.0009644031524658203, -0.0008524060249328613, -0.0007404088973999023, -0.0006284117698669434, -0.0005164146423339844, -0.0004044175148010254, -0.0002924203872680664, -0.00018042325973510742, -6.842613220214844e-05, 4.357099533081055e-05, 0.00015556812286376953, 0.0002675652503967285, 0.0003795623779296875, 0.0004915595054626465, 0.0006035566329956055, 0.0007155537605285645, 0.0008275508880615234, 0.0009395480155944824, 0.0010515451431274414, 0.0011635422706604004, 0.0012755393981933594, 0.0013875365257263184, 0.0014995336532592773, 0.0016115307807922363, 0.0017235279083251953, 0.0018355250358581543, 0.0019475221633911133, 0.0020595192909240723, 0.0021715164184570312, 0.0022835135459899902, 0.0023955106735229492, 0.002507507801055908, 0.002619504928588867, 0.002731502056121826, 0.002843499183654785, 0.002955496311187744, 0.003067493438720703, 0.003179490566253662, 0.003291487693786621, 0.00340348482131958, 0.003515481948852539, 0.003627479076385498, 0.003739476203918457, 0.003851473331451416, 0.003963470458984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 9.0, 17.0, 24.0, 42.0, 58.0, 102.0, 195.0, 361.0, 781.0, 1999.0, 6420.0, 41046.0, 576527.0, 384960.0, 27773.0, 5079.0, 1664.0, 741.0, 335.0, 155.0, 105.0, 49.0, 29.0, 19.0, 15.0, 7.0, 8.0, 3.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-47.75, -46.38232421875, -45.0146484375, -43.64697265625, -42.279296875, -40.91162109375, -39.5439453125, -38.17626953125, -36.80859375, -35.44091796875, -34.0732421875, -32.70556640625, -31.337890625, -29.97021484375, -28.6025390625, -27.23486328125, -25.8671875, -24.49951171875, -23.1318359375, -21.76416015625, -20.396484375, -19.02880859375, -17.6611328125, -16.29345703125, -14.92578125, -13.55810546875, -12.1904296875, -10.82275390625, -9.455078125, -8.08740234375, -6.7197265625, -5.35205078125, -3.984375, -2.61669921875, -1.2490234375, 0.11865234375, 1.486328125, 2.85400390625, 4.2216796875, 5.58935546875, 6.95703125, 8.32470703125, 9.6923828125, 11.06005859375, 12.427734375, 13.79541015625, 15.1630859375, 16.53076171875, 17.8984375, 19.26611328125, 20.6337890625, 22.00146484375, 23.369140625, 24.73681640625, 26.1044921875, 27.47216796875, 28.83984375, 30.20751953125, 31.5751953125, 32.94287109375, 34.310546875, 35.67822265625, 37.0458984375, 38.41357421875, 39.78125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 11.0, 5.0, 7.0, 4.0, 18.0, 17.0, 26.0, 39.0, 62.0, 66.0, 93.0, 88.0, 115.0, 97.0, 84.0, 68.0, 54.0, 38.0, 27.0, 17.0, 23.0, 15.0, 10.0, 12.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.976318359375, -29.96826171875, -28.960205078125, -27.9521484375, -26.944091796875, -25.93603515625, -24.927978515625, -23.919921875, -22.911865234375, -21.90380859375, -20.895751953125, -19.8876953125, -18.879638671875, -17.87158203125, -16.863525390625, -15.85546875, -14.847412109375, -13.83935546875, -12.831298828125, -11.8232421875, -10.815185546875, -9.80712890625, -8.799072265625, -7.791015625, -6.782958984375, -5.77490234375, -4.766845703125, -3.7587890625, -2.750732421875, -1.74267578125, -0.734619140625, 0.2734375, 1.281494140625, 2.28955078125, 3.297607421875, 4.3056640625, 5.313720703125, 6.32177734375, 7.329833984375, 8.337890625, 9.345947265625, 10.35400390625, 11.362060546875, 12.3701171875, 13.378173828125, 14.38623046875, 15.394287109375, 16.40234375, 17.410400390625, 18.41845703125, 19.426513671875, 20.4345703125, 21.442626953125, 22.45068359375, 23.458740234375, 24.466796875, 25.474853515625, 26.48291015625, 27.490966796875, 28.4990234375, 29.507080078125, 30.51513671875, 31.523193359375, 32.53125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 8.0, 8.0, 35.0, 83.0, 114.0, 208.0, 207.0, 152.0, 101.0, 38.0, 32.0, 4.0, 10.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-259.57855224609375, -233.72531127929688, -207.87208557128906, -182.01885986328125, -156.16561889648438, -130.3123779296875, -104.45915222167969, -78.60592651367188, -52.752685546875, -26.899452209472656, -1.0462188720703125, 24.80701446533203, 50.660247802734375, 76.51348876953125, 102.36671447753906, 128.21994018554688, 154.07318115234375, 179.92642211914062, 205.77964782714844, 231.63287353515625, 257.4861145019531, 283.33935546875, 309.19256591796875, 335.0458068847656, 360.8990478515625, 386.7522888183594, 412.60552978515625, 438.458740234375, 464.3119812011719, 490.16522216796875, 516.0184326171875, 541.8717041015625, 567.724853515625, 593.5780639648438, 619.4313354492188, 645.2845458984375, 671.1378173828125, 696.9910278320312, 722.84423828125, 748.697509765625, 774.5507202148438, 800.4039306640625, 826.2572021484375, 852.1104125976562, 877.963623046875, 903.81689453125, 929.6701049804688, 955.5233154296875, 981.3765869140625, 1007.2297973632812, 1033.0830078125, 1058.936279296875, 1084.78955078125, 1110.642822265625, 1136.4959716796875, 1162.3492431640625, 1188.202392578125, 1214.0556640625, 1239.9088134765625, 1265.7620849609375, 1291.6153564453125, 1317.468505859375, 1343.32177734375, 1369.175048828125, 1395.0283203125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 2.0, 7.0, 7.0, 7.0, 11.0, 15.0, 16.0, 13.0, 17.0, 16.0, 12.0, 29.0, 22.0, 26.0, 43.0, 28.0, 35.0, 48.0, 42.0, 34.0, 40.0, 42.0, 50.0, 44.0, 23.0, 43.0, 38.0, 37.0, 30.0, 35.0, 21.0, 26.0, 23.0, 19.0, 20.0, 8.0, 9.0, 10.0, 8.0, 5.0, 8.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-272.5573425292969, -263.57769775390625, -254.59808349609375, -245.6184539794922, -236.63882446289062, -227.65919494628906, -218.6795654296875, -209.69993591308594, -200.72030639648438, -191.7406768798828, -182.76104736328125, -173.7814178466797, -164.80178833007812, -155.82215881347656, -146.842529296875, -137.86289978027344, -128.88327026367188, -119.90364074707031, -110.92401123046875, -101.94438171386719, -92.96475219726562, -83.98512268066406, -75.0054931640625, -66.02586364746094, -57.046234130859375, -48.06660461425781, -39.08697509765625, -30.107345581054688, -21.127716064453125, -12.148086547851562, -3.16845703125, 5.8111724853515625, 14.790802001953125, 23.770431518554688, 32.75006103515625, 41.72969055175781, 50.709320068359375, 59.68894958496094, 68.6685791015625, 77.64820861816406, 86.62783813476562, 95.60746765136719, 104.58709716796875, 113.56672668457031, 122.54635620117188, 131.52598571777344, 140.505615234375, 149.48524475097656, 158.46487426757812, 167.4445037841797, 176.42413330078125, 185.4037628173828, 194.38339233398438, 203.36302185058594, 212.3426513671875, 221.32228088378906, 230.30191040039062, 239.2815399169922, 248.26116943359375, 257.24078369140625, 266.2204284667969, 275.2000732421875, 284.1796875, 293.1593017578125, 302.1389465332031]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 8.0, 8.0, 5.0, 9.0, 14.0, 22.0, 42.0, 57.0, 79.0, 126.0, 192.0, 308.0, 551.0, 1148.0, 2889.0, 7971.0, 36371.0, 4096517.0, 34724.0, 7878.0, 2758.0, 1205.0, 553.0, 313.0, 169.0, 111.0, 78.0, 58.0, 42.0, 20.0, 16.0, 13.0, 9.0, 10.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-124.3125, -120.2353515625, -116.158203125, -112.0810546875, -108.00390625, -103.9267578125, -99.849609375, -95.7724609375, -91.6953125, -87.6181640625, -83.541015625, -79.4638671875, -75.38671875, -71.3095703125, -67.232421875, -63.1552734375, -59.078125, -55.0009765625, -50.923828125, -46.8466796875, -42.76953125, -38.6923828125, -34.615234375, -30.5380859375, -26.4609375, -22.3837890625, -18.306640625, -14.2294921875, -10.15234375, -6.0751953125, -1.998046875, 2.0791015625, 6.15625, 10.2333984375, 14.310546875, 18.3876953125, 22.46484375, 26.5419921875, 30.619140625, 34.6962890625, 38.7734375, 42.8505859375, 46.927734375, 51.0048828125, 55.08203125, 59.1591796875, 63.236328125, 67.3134765625, 71.390625, 75.4677734375, 79.544921875, 83.6220703125, 87.69921875, 91.7763671875, 95.853515625, 99.9306640625, 104.0078125, 108.0849609375, 112.162109375, 116.2392578125, 120.31640625, 124.3935546875, 128.470703125, 132.5478515625, 136.625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 6.0, 8.0, 5.0, 7.0, 14.0, 12.0, 16.0, 27.0, 32.0, 35.0, 43.0, 49.0, 42.0, 39.0, 60.0, 52.0, 64.0, 59.0, 52.0, 47.0, 72.0, 30.0, 34.0, 23.0, 31.0, 26.0, 21.0, 18.0, 10.0, 15.0, 11.0, 9.0, 4.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.09375, -19.4970703125, -18.900390625, -18.3037109375, -17.70703125, -17.1103515625, -16.513671875, -15.9169921875, -15.3203125, -14.7236328125, -14.126953125, -13.5302734375, -12.93359375, -12.3369140625, -11.740234375, -11.1435546875, -10.546875, -9.9501953125, -9.353515625, -8.7568359375, -8.16015625, -7.5634765625, -6.966796875, -6.3701171875, -5.7734375, -5.1767578125, -4.580078125, -3.9833984375, -3.38671875, -2.7900390625, -2.193359375, -1.5966796875, -1.0, -0.4033203125, 0.193359375, 0.7900390625, 1.38671875, 1.9833984375, 2.580078125, 3.1767578125, 3.7734375, 4.3701171875, 4.966796875, 5.5634765625, 6.16015625, 6.7568359375, 7.353515625, 7.9501953125, 8.546875, 9.1435546875, 9.740234375, 10.3369140625, 10.93359375, 11.5302734375, 12.126953125, 12.7236328125, 13.3203125, 13.9169921875, 14.513671875, 15.1103515625, 15.70703125, 16.3037109375, 16.900390625, 17.4970703125, 18.09375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 13.0, 20.0, 15.0, 28.0, 18.0, 29.0, 31.0, 45.0, 48.0, 67.0, 107.0, 180.0, 346.0, 803.0, 2255.0, 7594.0, 48189.0, 4098783.0, 26967.0, 5455.0, 1765.0, 658.0, 277.0, 164.0, 105.0, 48.0, 40.0, 43.0, 43.0, 28.0, 22.0, 17.0, 19.0, 11.0, 10.0, 8.0, 11.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-142.625, -138.080078125, -133.53515625, -128.990234375, -124.4453125, -119.900390625, -115.35546875, -110.810546875, -106.265625, -101.720703125, -97.17578125, -92.630859375, -88.0859375, -83.541015625, -78.99609375, -74.451171875, -69.90625, -65.361328125, -60.81640625, -56.271484375, -51.7265625, -47.181640625, -42.63671875, -38.091796875, -33.546875, -29.001953125, -24.45703125, -19.912109375, -15.3671875, -10.822265625, -6.27734375, -1.732421875, 2.8125, 7.357421875, 11.90234375, 16.447265625, 20.9921875, 25.537109375, 30.08203125, 34.626953125, 39.171875, 43.716796875, 48.26171875, 52.806640625, 57.3515625, 61.896484375, 66.44140625, 70.986328125, 75.53125, 80.076171875, 84.62109375, 89.166015625, 93.7109375, 98.255859375, 102.80078125, 107.345703125, 111.890625, 116.435546875, 120.98046875, 125.525390625, 130.0703125, 134.615234375, 139.16015625, 143.705078125, 148.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 7.0, 8.0, 13.0, 28.0, 68.0, 3608.0, 259.0, 37.0, 14.0, 9.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.9375, -35.8134765625, -34.689453125, -33.5654296875, -32.44140625, -31.3173828125, -30.193359375, -29.0693359375, -27.9453125, -26.8212890625, -25.697265625, -24.5732421875, -23.44921875, -22.3251953125, -21.201171875, -20.0771484375, -18.953125, -17.8291015625, -16.705078125, -15.5810546875, -14.45703125, -13.3330078125, -12.208984375, -11.0849609375, -9.9609375, -8.8369140625, -7.712890625, -6.5888671875, -5.46484375, -4.3408203125, -3.216796875, -2.0927734375, -0.96875, 0.1552734375, 1.279296875, 2.4033203125, 3.52734375, 4.6513671875, 5.775390625, 6.8994140625, 8.0234375, 9.1474609375, 10.271484375, 11.3955078125, 12.51953125, 13.6435546875, 14.767578125, 15.8916015625, 17.015625, 18.1396484375, 19.263671875, 20.3876953125, 21.51171875, 22.6357421875, 23.759765625, 24.8837890625, 26.0078125, 27.1318359375, 28.255859375, 29.3798828125, 30.50390625, 31.6279296875, 32.751953125, 33.8759765625, 35.0]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 12.0, 44.0, 72.0, 178.0, 274.0, 228.0, 102.0, 51.0, 26.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.46912384033203, -113.3116683959961, -108.15421295166016, -102.99675750732422, -97.83930206298828, -92.68184661865234, -87.52439880371094, -82.366943359375, -77.20948791503906, -72.05203247070312, -66.89457702636719, -61.73712158203125, -56.57966613769531, -51.422210693359375, -46.2647590637207, -41.107303619384766, -35.94984436035156, -30.792388916015625, -25.634933471679688, -20.477479934692383, -15.320024490356445, -10.162569046020508, -5.005115509033203, 0.15233993530273438, 5.309795379638672, 10.46725082397461, 15.62470531463623, 20.78215980529785, 25.93961524963379, 31.097070693969727, 36.25452423095703, 41.41197967529297, 46.569427490234375, 51.72688293457031, 56.88433837890625, 62.04179382324219, 67.19924926757812, 72.35670471191406, 77.51416015625, 82.67161560058594, 87.82907104492188, 92.98652648925781, 98.14398193359375, 103.30143737792969, 108.45889282226562, 113.61634826660156, 118.7738037109375, 123.93125915527344, 129.08871459960938, 134.2461700439453, 139.40362548828125, 144.5610809326172, 149.71853637695312, 154.87599182128906, 160.033447265625, 165.19090270996094, 170.3483428955078, 175.50579833984375, 180.6632537841797, 185.82070922851562, 190.97816467285156, 196.1356201171875, 201.29307556152344, 206.45053100585938, 211.6079864501953]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 10.0, 8.0, 13.0, 12.0, 15.0, 18.0, 20.0, 32.0, 31.0, 33.0, 33.0, 36.0, 34.0, 30.0, 34.0, 46.0, 34.0, 41.0, 46.0, 30.0, 35.0, 36.0, 45.0, 39.0, 26.0, 32.0, 26.0, 24.0, 26.0, 29.0, 13.0, 17.0, 16.0, 15.0, 13.0, 4.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.481239318847656, -39.245887756347656, -38.01053237915039, -36.77518081665039, -35.539825439453125, -34.304473876953125, -33.06911849975586, -31.83376693725586, -30.598411560058594, -29.36305809020996, -28.127704620361328, -26.892351150512695, -25.656997680664062, -24.42164421081543, -23.186290740966797, -21.950939178466797, -20.715585708618164, -19.48023223876953, -18.2448787689209, -17.009525299072266, -15.774171829223633, -14.538818359375, -13.303465843200684, -12.06811237335205, -10.832758903503418, -9.597405433654785, -8.362051963806152, -7.126698970794678, -5.891345500946045, -4.655992031097412, -3.4206390380859375, -2.1852855682373047, -0.9499320983886719, 0.2854212522506714, 1.5207746028900146, 2.7561278343200684, 3.991481304168701, 5.226834774017334, 6.462187767028809, 7.697541236877441, 8.932894706726074, 10.168248176574707, 11.40360164642334, 12.638954162597656, 13.874307632446289, 15.109661102294922, 16.345014572143555, 17.580368041992188, 18.81572151184082, 20.051074981689453, 21.286428451538086, 22.52178192138672, 23.75713539123535, 24.992488861083984, 26.227840423583984, 27.46319580078125, 28.69854736328125, 29.933900833129883, 31.169254302978516, 32.404605865478516, 33.63996124267578, 34.87531280517578, 36.11066818237305, 37.34601974487305, 38.58137512207031]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 5.0, 4.0, 12.0, 9.0, 15.0, 18.0, 27.0, 36.0, 48.0, 85.0, 110.0, 156.0, 234.0, 391.0, 648.0, 1121.0, 2286.0, 4813.0, 10972.0, 27369.0, 69740.0, 173911.0, 319887.0, 251223.0, 111116.0, 43261.0, 17017.0, 7080.0, 3108.0, 1583.0, 809.0, 486.0, 344.0, 187.0, 133.0, 90.0, 50.0, 44.0, 29.0, 29.0, 18.0, 12.0, 7.0, 10.0, 5.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-42.75, -41.4033203125, -40.056640625, -38.7099609375, -37.36328125, -36.0166015625, -34.669921875, -33.3232421875, -31.9765625, -30.6298828125, -29.283203125, -27.9365234375, -26.58984375, -25.2431640625, -23.896484375, -22.5498046875, -21.203125, -19.8564453125, -18.509765625, -17.1630859375, -15.81640625, -14.4697265625, -13.123046875, -11.7763671875, -10.4296875, -9.0830078125, -7.736328125, -6.3896484375, -5.04296875, -3.6962890625, -2.349609375, -1.0029296875, 0.34375, 1.6904296875, 3.037109375, 4.3837890625, 5.73046875, 7.0771484375, 8.423828125, 9.7705078125, 11.1171875, 12.4638671875, 13.810546875, 15.1572265625, 16.50390625, 17.8505859375, 19.197265625, 20.5439453125, 21.890625, 23.2373046875, 24.583984375, 25.9306640625, 27.27734375, 28.6240234375, 29.970703125, 31.3173828125, 32.6640625, 34.0107421875, 35.357421875, 36.7041015625, 38.05078125, 39.3974609375, 40.744140625, 42.0908203125, 43.4375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 7.0, 3.0, 5.0, 9.0, 4.0, 14.0, 15.0, 18.0, 14.0, 30.0, 36.0, 35.0, 34.0, 43.0, 34.0, 36.0, 47.0, 45.0, 67.0, 50.0, 73.0, 52.0, 44.0, 29.0, 39.0, 25.0, 33.0, 29.0, 22.0, 16.0, 13.0, 13.0, 17.0, 10.0, 6.0, 9.0, 6.0, 3.0, 4.0, 0.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.53125, -18.93896484375, -18.3466796875, -17.75439453125, -17.162109375, -16.56982421875, -15.9775390625, -15.38525390625, -14.79296875, -14.20068359375, -13.6083984375, -13.01611328125, -12.423828125, -11.83154296875, -11.2392578125, -10.64697265625, -10.0546875, -9.46240234375, -8.8701171875, -8.27783203125, -7.685546875, -7.09326171875, -6.5009765625, -5.90869140625, -5.31640625, -4.72412109375, -4.1318359375, -3.53955078125, -2.947265625, -2.35498046875, -1.7626953125, -1.17041015625, -0.578125, 0.01416015625, 0.6064453125, 1.19873046875, 1.791015625, 2.38330078125, 2.9755859375, 3.56787109375, 4.16015625, 4.75244140625, 5.3447265625, 5.93701171875, 6.529296875, 7.12158203125, 7.7138671875, 8.30615234375, 8.8984375, 9.49072265625, 10.0830078125, 10.67529296875, 11.267578125, 11.85986328125, 12.4521484375, 13.04443359375, 13.63671875, 14.22900390625, 14.8212890625, 15.41357421875, 16.005859375, 16.59814453125, 17.1904296875, 17.78271484375, 18.375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 9.0, 8.0, 14.0, 17.0, 23.0, 33.0, 54.0, 61.0, 96.0, 118.0, 173.0, 250.0, 405.0, 549.0, 949.0, 1542.0, 3724.0, 13276.0, 77720.0, 522283.0, 359805.0, 51097.0, 9656.0, 2943.0, 1369.0, 773.0, 504.0, 334.0, 212.0, 165.0, 99.0, 76.0, 56.0, 46.0, 28.0, 23.0, 15.0, 15.0, 7.0, 11.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-72.125, -69.7900390625, -67.455078125, -65.1201171875, -62.78515625, -60.4501953125, -58.115234375, -55.7802734375, -53.4453125, -51.1103515625, -48.775390625, -46.4404296875, -44.10546875, -41.7705078125, -39.435546875, -37.1005859375, -34.765625, -32.4306640625, -30.095703125, -27.7607421875, -25.42578125, -23.0908203125, -20.755859375, -18.4208984375, -16.0859375, -13.7509765625, -11.416015625, -9.0810546875, -6.74609375, -4.4111328125, -2.076171875, 0.2587890625, 2.59375, 4.9287109375, 7.263671875, 9.5986328125, 11.93359375, 14.2685546875, 16.603515625, 18.9384765625, 21.2734375, 23.6083984375, 25.943359375, 28.2783203125, 30.61328125, 32.9482421875, 35.283203125, 37.6181640625, 39.953125, 42.2880859375, 44.623046875, 46.9580078125, 49.29296875, 51.6279296875, 53.962890625, 56.2978515625, 58.6328125, 60.9677734375, 63.302734375, 65.6376953125, 67.97265625, 70.3076171875, 72.642578125, 74.9775390625, 77.3125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 13.0, 8.0, 10.0, 8.0, 15.0, 17.0, 13.0, 20.0, 32.0, 31.0, 26.0, 42.0, 41.0, 26.0, 31.0, 41.0, 52.0, 56.0, 49.0, 39.0, 49.0, 51.0, 47.0, 41.0, 36.0, 29.0, 26.0, 18.0, 17.0, 23.0, 18.0, 23.0, 13.0, 9.0, 11.0, 5.0, 3.0, 0.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-86.0625, -83.4873046875, -80.912109375, -78.3369140625, -75.76171875, -73.1865234375, -70.611328125, -68.0361328125, -65.4609375, -62.8857421875, -60.310546875, -57.7353515625, -55.16015625, -52.5849609375, -50.009765625, -47.4345703125, -44.859375, -42.2841796875, -39.708984375, -37.1337890625, -34.55859375, -31.9833984375, -29.408203125, -26.8330078125, -24.2578125, -21.6826171875, -19.107421875, -16.5322265625, -13.95703125, -11.3818359375, -8.806640625, -6.2314453125, -3.65625, -1.0810546875, 1.494140625, 4.0693359375, 6.64453125, 9.2197265625, 11.794921875, 14.3701171875, 16.9453125, 19.5205078125, 22.095703125, 24.6708984375, 27.24609375, 29.8212890625, 32.396484375, 34.9716796875, 37.546875, 40.1220703125, 42.697265625, 45.2724609375, 47.84765625, 50.4228515625, 52.998046875, 55.5732421875, 58.1484375, 60.7236328125, 63.298828125, 65.8740234375, 68.44921875, 71.0244140625, 73.599609375, 76.1748046875, 78.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 7.0, 6.0, 5.0, 11.0, 18.0, 15.0, 16.0, 26.0, 17.0, 35.0, 36.0, 85.0, 86.0, 149.0, 204.0, 408.0, 917.0, 2940.0, 15225.0, 265928.0, 725751.0, 29529.0, 4531.0, 1296.0, 483.0, 265.0, 148.0, 106.0, 62.0, 58.0, 39.0, 32.0, 22.0, 17.0, 17.0, 13.0, 16.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-74.8125, -72.6220703125, -70.431640625, -68.2412109375, -66.05078125, -63.8603515625, -61.669921875, -59.4794921875, -57.2890625, -55.0986328125, -52.908203125, -50.7177734375, -48.52734375, -46.3369140625, -44.146484375, -41.9560546875, -39.765625, -37.5751953125, -35.384765625, -33.1943359375, -31.00390625, -28.8134765625, -26.623046875, -24.4326171875, -22.2421875, -20.0517578125, -17.861328125, -15.6708984375, -13.48046875, -11.2900390625, -9.099609375, -6.9091796875, -4.71875, -2.5283203125, -0.337890625, 1.8525390625, 4.04296875, 6.2333984375, 8.423828125, 10.6142578125, 12.8046875, 14.9951171875, 17.185546875, 19.3759765625, 21.56640625, 23.7568359375, 25.947265625, 28.1376953125, 30.328125, 32.5185546875, 34.708984375, 36.8994140625, 39.08984375, 41.2802734375, 43.470703125, 45.6611328125, 47.8515625, 50.0419921875, 52.232421875, 54.4228515625, 56.61328125, 58.8037109375, 60.994140625, 63.1845703125, 65.375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 4.0, 9.0, 13.0, 15.0, 34.0, 35.0, 69.0, 123.0, 159.0, 156.0, 132.0, 80.0, 59.0, 35.0, 19.0, 19.0, 12.0, 3.0, 6.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00930023193359375, -0.009020805358886719, -0.008741378784179688, -0.008461952209472656, -0.008182525634765625, -0.007903099060058594, -0.0076236724853515625, -0.007344245910644531, -0.0070648193359375, -0.006785392761230469, -0.0065059661865234375, -0.006226539611816406, -0.005947113037109375, -0.005667686462402344, -0.0053882598876953125, -0.005108833312988281, -0.00482940673828125, -0.004549980163574219, -0.0042705535888671875, -0.003991127014160156, -0.003711700439453125, -0.0034322738647460938, -0.0031528472900390625, -0.0028734207153320312, -0.002593994140625, -0.0023145675659179688, -0.0020351409912109375, -0.0017557144165039062, -0.001476287841796875, -0.0011968612670898438, -0.0009174346923828125, -0.0006380081176757812, -0.00035858154296875, -7.915496826171875e-05, 0.0002002716064453125, 0.00047969818115234375, 0.000759124755859375, 0.0010385513305664062, 0.0013179779052734375, 0.0015974044799804688, 0.0018768310546875, 0.0021562576293945312, 0.0024356842041015625, 0.0027151107788085938, 0.002994537353515625, 0.0032739639282226562, 0.0035533905029296875, 0.0038328170776367188, 0.00411224365234375, 0.004391670227050781, 0.0046710968017578125, 0.004950523376464844, 0.005229949951171875, 0.005509376525878906, 0.0057888031005859375, 0.006068229675292969, 0.00634765625, 0.006627082824707031, 0.0069065093994140625, 0.007185935974121094, 0.007465362548828125, 0.007744789123535156, 0.008024215698242188, 0.008303642272949219, 0.00858306884765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 8.0, 9.0, 18.0, 26.0, 39.0, 38.0, 55.0, 64.0, 136.0, 239.0, 463.0, 1039.0, 2624.0, 9700.0, 71910.0, 842647.0, 102289.0, 11890.0, 3077.0, 1102.0, 500.0, 251.0, 149.0, 84.0, 54.0, 45.0, 22.0, 19.0, 11.0, 9.0, 9.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.75, -68.5771484375, -66.404296875, -64.2314453125, -62.05859375, -59.8857421875, -57.712890625, -55.5400390625, -53.3671875, -51.1943359375, -49.021484375, -46.8486328125, -44.67578125, -42.5029296875, -40.330078125, -38.1572265625, -35.984375, -33.8115234375, -31.638671875, -29.4658203125, -27.29296875, -25.1201171875, -22.947265625, -20.7744140625, -18.6015625, -16.4287109375, -14.255859375, -12.0830078125, -9.91015625, -7.7373046875, -5.564453125, -3.3916015625, -1.21875, 0.9541015625, 3.126953125, 5.2998046875, 7.47265625, 9.6455078125, 11.818359375, 13.9912109375, 16.1640625, 18.3369140625, 20.509765625, 22.6826171875, 24.85546875, 27.0283203125, 29.201171875, 31.3740234375, 33.546875, 35.7197265625, 37.892578125, 40.0654296875, 42.23828125, 44.4111328125, 46.583984375, 48.7568359375, 50.9296875, 53.1025390625, 55.275390625, 57.4482421875, 59.62109375, 61.7939453125, 63.966796875, 66.1396484375, 68.3125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 8.0, 9.0, 12.0, 7.0, 20.0, 23.0, 29.0, 45.0, 52.0, 73.0, 76.0, 129.0, 120.0, 99.0, 75.0, 59.0, 50.0, 34.0, 24.0, 5.0, 14.0, 7.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.19873046875, -32.6474609375, -31.09619140625, -29.544921875, -27.99365234375, -26.4423828125, -24.89111328125, -23.33984375, -21.78857421875, -20.2373046875, -18.68603515625, -17.134765625, -15.58349609375, -14.0322265625, -12.48095703125, -10.9296875, -9.37841796875, -7.8271484375, -6.27587890625, -4.724609375, -3.17333984375, -1.6220703125, -0.07080078125, 1.48046875, 3.03173828125, 4.5830078125, 6.13427734375, 7.685546875, 9.23681640625, 10.7880859375, 12.33935546875, 13.890625, 15.44189453125, 16.9931640625, 18.54443359375, 20.095703125, 21.64697265625, 23.1982421875, 24.74951171875, 26.30078125, 27.85205078125, 29.4033203125, 30.95458984375, 32.505859375, 34.05712890625, 35.6083984375, 37.15966796875, 38.7109375, 40.26220703125, 41.8134765625, 43.36474609375, 44.916015625, 46.46728515625, 48.0185546875, 49.56982421875, 51.12109375, 52.67236328125, 54.2236328125, 55.77490234375, 57.326171875, 58.87744140625, 60.4287109375, 61.97998046875, 63.53125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 27.0, 91.0, 199.0, 315.0, 216.0, 92.0, 37.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-855.9484252929688, -816.4798583984375, -777.01123046875, -737.5426635742188, -698.0740966796875, -658.60546875, -619.1369018554688, -579.6683349609375, -540.19970703125, -500.7311096191406, -461.26251220703125, -421.7939453125, -382.3253479003906, -342.85675048828125, -303.38818359375, -263.9195861816406, -224.45098876953125, -184.98239135742188, -145.51380920410156, -106.04521942138672, -66.57662963867188, -27.1080322265625, 12.360549926757812, 51.829132080078125, 91.2977294921875, 130.76632690429688, 170.2349090576172, 209.7034912109375, 249.17208862304688, 288.64068603515625, 328.1092529296875, 367.5778503417969, 407.0465087890625, 446.5151062011719, 485.98370361328125, 525.4522705078125, 564.9208984375, 604.3894653320312, 643.8580322265625, 683.32666015625, 722.7952270507812, 762.2637939453125, 801.732421875, 841.2009887695312, 880.6695556640625, 920.13818359375, 959.6067504882812, 999.0753173828125, 1038.5439453125, 1078.0125732421875, 1117.4810791015625, 1156.94970703125, 1196.4183349609375, 1235.886962890625, 1275.35546875, 1314.8240966796875, 1354.292724609375, 1393.7613525390625, 1433.2298583984375, 1472.698486328125, 1512.1671142578125, 1551.6357421875, 1591.104248046875, 1630.5728759765625, 1670.0413818359375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 8.0, 7.0, 6.0, 14.0, 11.0, 14.0, 16.0, 23.0, 25.0, 22.0, 34.0, 36.0, 28.0, 39.0, 37.0, 39.0, 48.0, 38.0, 41.0, 40.0, 65.0, 37.0, 46.0, 40.0, 41.0, 30.0, 33.0, 33.0, 19.0, 25.0, 12.0, 13.0, 12.0, 9.0, 13.0, 5.0, 5.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-381.6477355957031, -369.9373779296875, -358.2270202636719, -346.51666259765625, -334.80633544921875, -323.0959777832031, -311.3856201171875, -299.6752624511719, -287.96490478515625, -276.2545471191406, -264.544189453125, -252.83384704589844, -241.12350463867188, -229.41314697265625, -217.70278930664062, -205.992431640625, -194.2821044921875, -182.57174682617188, -170.8614044189453, -159.1510467529297, -147.44070434570312, -135.7303466796875, -124.01998901367188, -112.30963897705078, -100.59928894042969, -88.8889389038086, -77.1785888671875, -65.46823120117188, -53.75788116455078, -42.04753112792969, -30.337173461914062, -18.62682342529297, -6.91650390625, 4.793848037719727, 16.504199981689453, 28.214553833007812, 39.924903869628906, 51.63525390625, 63.345611572265625, 75.05596160888672, 86.76631164550781, 98.4766616821289, 110.18701171875, 121.89736938476562, 133.60772705078125, 145.3180694580078, 157.02842712402344, 168.73876953125, 180.44912719726562, 192.15948486328125, 203.8698272705078, 215.58018493652344, 227.29052734375, 239.00088500976562, 250.71124267578125, 262.4216003417969, 274.1319580078125, 285.8423156738281, 297.55267333984375, 309.26300048828125, 320.9733581542969, 332.6837158203125, 344.3940734863281, 356.10443115234375, 367.81475830078125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 9.0, 12.0, 22.0, 39.0, 46.0, 86.0, 125.0, 241.0, 365.0, 771.0, 1657.0, 3946.0, 11590.0, 52905.0, 4039562.0, 62431.0, 12598.0, 4269.0, 1754.0, 803.0, 438.0, 221.0, 136.0, 83.0, 57.0, 37.0, 26.0, 13.0, 8.0, 7.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-86.0625, -83.244140625, -80.42578125, -77.607421875, -74.7890625, -71.970703125, -69.15234375, -66.333984375, -63.515625, -60.697265625, -57.87890625, -55.060546875, -52.2421875, -49.423828125, -46.60546875, -43.787109375, -40.96875, -38.150390625, -35.33203125, -32.513671875, -29.6953125, -26.876953125, -24.05859375, -21.240234375, -18.421875, -15.603515625, -12.78515625, -9.966796875, -7.1484375, -4.330078125, -1.51171875, 1.306640625, 4.125, 6.943359375, 9.76171875, 12.580078125, 15.3984375, 18.216796875, 21.03515625, 23.853515625, 26.671875, 29.490234375, 32.30859375, 35.126953125, 37.9453125, 40.763671875, 43.58203125, 46.400390625, 49.21875, 52.037109375, 54.85546875, 57.673828125, 60.4921875, 63.310546875, 66.12890625, 68.947265625, 71.765625, 74.583984375, 77.40234375, 80.220703125, 83.0390625, 85.857421875, 88.67578125, 91.494140625, 94.3125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 8.0, 6.0, 10.0, 17.0, 13.0, 20.0, 25.0, 27.0, 47.0, 59.0, 46.0, 45.0, 56.0, 59.0, 62.0, 66.0, 62.0, 65.0, 55.0, 43.0, 33.0, 33.0, 23.0, 24.0, 21.0, 15.0, 14.0, 8.0, 9.0, 6.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.984375, -17.266845703125, -16.54931640625, -15.831787109375, -15.1142578125, -14.396728515625, -13.67919921875, -12.961669921875, -12.244140625, -11.526611328125, -10.80908203125, -10.091552734375, -9.3740234375, -8.656494140625, -7.93896484375, -7.221435546875, -6.50390625, -5.786376953125, -5.06884765625, -4.351318359375, -3.6337890625, -2.916259765625, -2.19873046875, -1.481201171875, -0.763671875, -0.046142578125, 0.67138671875, 1.388916015625, 2.1064453125, 2.823974609375, 3.54150390625, 4.259033203125, 4.9765625, 5.694091796875, 6.41162109375, 7.129150390625, 7.8466796875, 8.564208984375, 9.28173828125, 9.999267578125, 10.716796875, 11.434326171875, 12.15185546875, 12.869384765625, 13.5869140625, 14.304443359375, 15.02197265625, 15.739501953125, 16.45703125, 17.174560546875, 17.89208984375, 18.609619140625, 19.3271484375, 20.044677734375, 20.76220703125, 21.479736328125, 22.197265625, 22.914794921875, 23.63232421875, 24.349853515625, 25.0673828125, 25.784912109375, 26.50244140625, 27.219970703125, 27.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 12.0, 17.0, 17.0, 22.0, 27.0, 41.0, 67.0, 76.0, 112.0, 170.0, 248.0, 334.0, 494.0, 697.0, 1196.0, 2048.0, 3968.0, 9200.0, 30140.0, 462443.0, 3626826.0, 35440.0, 10302.0, 4297.0, 2241.0, 1309.0, 814.0, 503.0, 350.0, 243.0, 176.0, 123.0, 82.0, 73.0, 50.0, 33.0, 23.0, 19.0, 11.0, 13.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.6875, -69.451171875, -67.21484375, -64.978515625, -62.7421875, -60.505859375, -58.26953125, -56.033203125, -53.796875, -51.560546875, -49.32421875, -47.087890625, -44.8515625, -42.615234375, -40.37890625, -38.142578125, -35.90625, -33.669921875, -31.43359375, -29.197265625, -26.9609375, -24.724609375, -22.48828125, -20.251953125, -18.015625, -15.779296875, -13.54296875, -11.306640625, -9.0703125, -6.833984375, -4.59765625, -2.361328125, -0.125, 2.111328125, 4.34765625, 6.583984375, 8.8203125, 11.056640625, 13.29296875, 15.529296875, 17.765625, 20.001953125, 22.23828125, 24.474609375, 26.7109375, 28.947265625, 31.18359375, 33.419921875, 35.65625, 37.892578125, 40.12890625, 42.365234375, 44.6015625, 46.837890625, 49.07421875, 51.310546875, 53.546875, 55.783203125, 58.01953125, 60.255859375, 62.4921875, 64.728515625, 66.96484375, 69.201171875, 71.4375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 13.0, 12.0, 23.0, 38.0, 62.0, 233.0, 3353.0, 160.0, 76.0, 34.0, 13.0, 12.0, 6.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.90625, -46.69140625, -45.4765625, -44.26171875, -43.046875, -41.83203125, -40.6171875, -39.40234375, -38.1875, -36.97265625, -35.7578125, -34.54296875, -33.328125, -32.11328125, -30.8984375, -29.68359375, -28.46875, -27.25390625, -26.0390625, -24.82421875, -23.609375, -22.39453125, -21.1796875, -19.96484375, -18.75, -17.53515625, -16.3203125, -15.10546875, -13.890625, -12.67578125, -11.4609375, -10.24609375, -9.03125, -7.81640625, -6.6015625, -5.38671875, -4.171875, -2.95703125, -1.7421875, -0.52734375, 0.6875, 1.90234375, 3.1171875, 4.33203125, 5.546875, 6.76171875, 7.9765625, 9.19140625, 10.40625, 11.62109375, 12.8359375, 14.05078125, 15.265625, 16.48046875, 17.6953125, 18.91015625, 20.125, 21.33984375, 22.5546875, 23.76953125, 24.984375, 26.19921875, 27.4140625, 28.62890625, 29.84375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 7.0, 5.0, 15.0, 23.0, 59.0, 75.0, 151.0, 172.0, 161.0, 128.0, 80.0, 57.0, 25.0, 15.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.40093994140625, -212.0947265625, -206.7885284423828, -201.48233032226562, -196.17611694335938, -190.86990356445312, -185.56370544433594, -180.25750732421875, -174.9512939453125, -169.64508056640625, -164.33888244628906, -159.03268432617188, -153.72647094726562, -148.42025756835938, -143.1140594482422, -137.807861328125, -132.50164794921875, -127.19544219970703, -121.88923645019531, -116.5830307006836, -111.27682495117188, -105.97061920166016, -100.66441345214844, -95.35820770263672, -90.052001953125, -84.74579620361328, -79.43959045410156, -74.13338470458984, -68.82717895507812, -63.520973205566406, -58.21476745605469, -52.90856170654297, -47.60234069824219, -42.29613494873047, -36.98992919921875, -31.68372344970703, -26.377517700195312, -21.071311950683594, -15.765106201171875, -10.458900451660156, -5.1526947021484375, 0.15351104736328125, 5.459716796875, 10.765922546386719, 16.072128295898438, 21.378334045410156, 26.684539794921875, 31.990745544433594, 37.29695129394531, 42.60315704345703, 47.90936279296875, 53.21556854248047, 58.52177429199219, 63.827980041503906, 69.13418579101562, 74.44039154052734, 79.74659729003906, 85.05280303955078, 90.3590087890625, 95.66521453857422, 100.97142028808594, 106.27762603759766, 111.58383178710938, 116.8900375366211, 122.19624328613281]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 9.0, 10.0, 12.0, 9.0, 12.0, 21.0, 16.0, 22.0, 29.0, 29.0, 26.0, 37.0, 31.0, 37.0, 34.0, 50.0, 34.0, 38.0, 49.0, 45.0, 49.0, 43.0, 39.0, 40.0, 32.0, 28.0, 30.0, 23.0, 26.0, 16.0, 13.0, 14.0, 16.0, 15.0, 11.0, 7.0, 10.0, 6.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-63.826290130615234, -61.83027648925781, -59.83426284790039, -57.83824920654297, -55.84223556518555, -53.846221923828125, -51.85021209716797, -49.85419845581055, -47.858184814453125, -45.8621711730957, -43.86615753173828, -41.87014389038086, -39.87413024902344, -37.87812042236328, -35.882102966308594, -33.88609313964844, -31.890077590942383, -29.89406394958496, -27.89805030822754, -25.90203857421875, -23.906024932861328, -21.910011291503906, -19.913997650146484, -17.917984008789062, -15.921971321105957, -13.925957679748535, -11.92994499206543, -9.933931350708008, -7.937918186187744, -5.9419050216674805, -3.9458913803100586, -1.9498786926269531, 0.04613494873046875, 2.0421481132507324, 4.038161277770996, 6.034174919128418, 8.030187606811523, 10.026201248168945, 12.022214889526367, 14.018227577209473, 16.014240264892578, 18.01025390625, 20.006267547607422, 22.002281188964844, 23.998292922973633, 25.994306564331055, 27.990320205688477, 29.986331939697266, 31.98234748840332, 33.97835922241211, 35.97437286376953, 37.97038650512695, 39.966400146484375, 41.9624137878418, 43.95842742919922, 45.95444107055664, 47.95045471191406, 49.946468353271484, 51.942481994628906, 53.93849563598633, 55.93450927734375, 57.930519104003906, 59.926536560058594, 61.92254638671875, 63.91856002807617]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 9.0, 11.0, 20.0, 28.0, 35.0, 58.0, 69.0, 121.0, 196.0, 340.0, 607.0, 1179.0, 2495.0, 5885.0, 15655.0, 46812.0, 149228.0, 391602.0, 289958.0, 95393.0, 30287.0, 10575.0, 4164.0, 1752.0, 867.0, 454.0, 249.0, 170.0, 128.0, 75.0, 45.0, 25.0, 18.0, 12.0, 7.0, 3.0, 5.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-70.8125, -68.7177734375, -66.623046875, -64.5283203125, -62.43359375, -60.3388671875, -58.244140625, -56.1494140625, -54.0546875, -51.9599609375, -49.865234375, -47.7705078125, -45.67578125, -43.5810546875, -41.486328125, -39.3916015625, -37.296875, -35.2021484375, -33.107421875, -31.0126953125, -28.91796875, -26.8232421875, -24.728515625, -22.6337890625, -20.5390625, -18.4443359375, -16.349609375, -14.2548828125, -12.16015625, -10.0654296875, -7.970703125, -5.8759765625, -3.78125, -1.6865234375, 0.408203125, 2.5029296875, 4.59765625, 6.6923828125, 8.787109375, 10.8818359375, 12.9765625, 15.0712890625, 17.166015625, 19.2607421875, 21.35546875, 23.4501953125, 25.544921875, 27.6396484375, 29.734375, 31.8291015625, 33.923828125, 36.0185546875, 38.11328125, 40.2080078125, 42.302734375, 44.3974609375, 46.4921875, 48.5869140625, 50.681640625, 52.7763671875, 54.87109375, 56.9658203125, 59.060546875, 61.1552734375, 63.25]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 11.0, 6.0, 16.0, 11.0, 16.0, 23.0, 25.0, 26.0, 33.0, 61.0, 42.0, 48.0, 46.0, 56.0, 66.0, 56.0, 58.0, 62.0, 43.0, 42.0, 50.0, 34.0, 25.0, 27.0, 22.0, 19.0, 15.0, 9.0, 13.0, 8.0, 4.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.921875, -18.205810546875, -17.48974609375, -16.773681640625, -16.0576171875, -15.341552734375, -14.62548828125, -13.909423828125, -13.193359375, -12.477294921875, -11.76123046875, -11.045166015625, -10.3291015625, -9.613037109375, -8.89697265625, -8.180908203125, -7.46484375, -6.748779296875, -6.03271484375, -5.316650390625, -4.6005859375, -3.884521484375, -3.16845703125, -2.452392578125, -1.736328125, -1.020263671875, -0.30419921875, 0.411865234375, 1.1279296875, 1.843994140625, 2.56005859375, 3.276123046875, 3.9921875, 4.708251953125, 5.42431640625, 6.140380859375, 6.8564453125, 7.572509765625, 8.28857421875, 9.004638671875, 9.720703125, 10.436767578125, 11.15283203125, 11.868896484375, 12.5849609375, 13.301025390625, 14.01708984375, 14.733154296875, 15.44921875, 16.165283203125, 16.88134765625, 17.597412109375, 18.3134765625, 19.029541015625, 19.74560546875, 20.461669921875, 21.177734375, 21.893798828125, 22.60986328125, 23.325927734375, 24.0419921875, 24.758056640625, 25.47412109375, 26.190185546875, 26.90625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 5.0, 5.0, 11.0, 6.0, 12.0, 22.0, 23.0, 39.0, 74.0, 88.0, 187.0, 243.0, 422.0, 783.0, 1483.0, 4084.0, 17238.0, 151091.0, 730729.0, 120401.0, 14614.0, 3710.0, 1501.0, 705.0, 385.0, 234.0, 156.0, 103.0, 64.0, 32.0, 30.0, 20.0, 12.0, 8.0, 8.0, 5.0, 5.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.375, -115.806640625, -112.23828125, -108.669921875, -105.1015625, -101.533203125, -97.96484375, -94.396484375, -90.828125, -87.259765625, -83.69140625, -80.123046875, -76.5546875, -72.986328125, -69.41796875, -65.849609375, -62.28125, -58.712890625, -55.14453125, -51.576171875, -48.0078125, -44.439453125, -40.87109375, -37.302734375, -33.734375, -30.166015625, -26.59765625, -23.029296875, -19.4609375, -15.892578125, -12.32421875, -8.755859375, -5.1875, -1.619140625, 1.94921875, 5.517578125, 9.0859375, 12.654296875, 16.22265625, 19.791015625, 23.359375, 26.927734375, 30.49609375, 34.064453125, 37.6328125, 41.201171875, 44.76953125, 48.337890625, 51.90625, 55.474609375, 59.04296875, 62.611328125, 66.1796875, 69.748046875, 73.31640625, 76.884765625, 80.453125, 84.021484375, 87.58984375, 91.158203125, 94.7265625, 98.294921875, 101.86328125, 105.431640625, 109.0]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 5.0, 6.0, 14.0, 21.0, 18.0, 23.0, 18.0, 33.0, 41.0, 41.0, 56.0, 54.0, 46.0, 51.0, 47.0, 71.0, 51.0, 56.0, 42.0, 46.0, 41.0, 47.0, 22.0, 26.0, 23.0, 31.0, 15.0, 7.0, 10.0, 9.0, 5.0, 8.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4375, -85.4072265625, -82.376953125, -79.3466796875, -76.31640625, -73.2861328125, -70.255859375, -67.2255859375, -64.1953125, -61.1650390625, -58.134765625, -55.1044921875, -52.07421875, -49.0439453125, -46.013671875, -42.9833984375, -39.953125, -36.9228515625, -33.892578125, -30.8623046875, -27.83203125, -24.8017578125, -21.771484375, -18.7412109375, -15.7109375, -12.6806640625, -9.650390625, -6.6201171875, -3.58984375, -0.5595703125, 2.470703125, 5.5009765625, 8.53125, 11.5615234375, 14.591796875, 17.6220703125, 20.65234375, 23.6826171875, 26.712890625, 29.7431640625, 32.7734375, 35.8037109375, 38.833984375, 41.8642578125, 44.89453125, 47.9248046875, 50.955078125, 53.9853515625, 57.015625, 60.0458984375, 63.076171875, 66.1064453125, 69.13671875, 72.1669921875, 75.197265625, 78.2275390625, 81.2578125, 84.2880859375, 87.318359375, 90.3486328125, 93.37890625, 96.4091796875, 99.439453125, 102.4697265625, 105.5]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 9.0, 13.0, 12.0, 14.0, 26.0, 21.0, 36.0, 42.0, 62.0, 109.0, 140.0, 287.0, 508.0, 993.0, 2525.0, 8341.0, 49811.0, 693336.0, 261697.0, 22065.0, 4852.0, 1755.0, 770.0, 411.0, 211.0, 139.0, 91.0, 74.0, 51.0, 28.0, 24.0, 27.0, 14.0, 10.0, 13.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-45.65625, -44.220703125, -42.78515625, -41.349609375, -39.9140625, -38.478515625, -37.04296875, -35.607421875, -34.171875, -32.736328125, -31.30078125, -29.865234375, -28.4296875, -26.994140625, -25.55859375, -24.123046875, -22.6875, -21.251953125, -19.81640625, -18.380859375, -16.9453125, -15.509765625, -14.07421875, -12.638671875, -11.203125, -9.767578125, -8.33203125, -6.896484375, -5.4609375, -4.025390625, -2.58984375, -1.154296875, 0.28125, 1.716796875, 3.15234375, 4.587890625, 6.0234375, 7.458984375, 8.89453125, 10.330078125, 11.765625, 13.201171875, 14.63671875, 16.072265625, 17.5078125, 18.943359375, 20.37890625, 21.814453125, 23.25, 24.685546875, 26.12109375, 27.556640625, 28.9921875, 30.427734375, 31.86328125, 33.298828125, 34.734375, 36.169921875, 37.60546875, 39.041015625, 40.4765625, 41.912109375, 43.34765625, 44.783203125, 46.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 17.0, 16.0, 9.0, 14.0, 24.0, 40.0, 54.0, 53.0, 75.0, 70.0, 106.0, 111.0, 86.0, 69.0, 55.0, 36.0, 32.0, 24.0, 19.0, 13.0, 11.0, 13.0, 8.0, 7.0, 5.0, 2.0, 5.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005535125732421875, -0.005357980728149414, -0.005180835723876953, -0.005003690719604492, -0.004826545715332031, -0.00464940071105957, -0.004472255706787109, -0.0042951107025146484, -0.0041179656982421875, -0.0039408206939697266, -0.0037636756896972656, -0.0035865306854248047, -0.0034093856811523438, -0.003232240676879883, -0.003055095672607422, -0.002877950668334961, -0.0027008056640625, -0.002523660659790039, -0.002346515655517578, -0.002169370651245117, -0.0019922256469726562, -0.0018150806427001953, -0.0016379356384277344, -0.0014607906341552734, -0.0012836456298828125, -0.0011065006256103516, -0.0009293556213378906, -0.0007522106170654297, -0.0005750656127929688, -0.0003979206085205078, -0.00022077560424804688, -4.363059997558594e-05, 0.000133514404296875, 0.00031065940856933594, 0.0004878044128417969, 0.0006649494171142578, 0.0008420944213867188, 0.0010192394256591797, 0.0011963844299316406, 0.0013735294342041016, 0.0015506744384765625, 0.0017278194427490234, 0.0019049644470214844, 0.0020821094512939453, 0.0022592544555664062, 0.002436399459838867, 0.002613544464111328, 0.002790689468383789, 0.00296783447265625, 0.003144979476928711, 0.003322124481201172, 0.003499269485473633, 0.0036764144897460938, 0.0038535594940185547, 0.004030704498291016, 0.0042078495025634766, 0.0043849945068359375, 0.0045621395111083984, 0.004739284515380859, 0.00491642951965332, 0.005093574523925781, 0.005270719528198242, 0.005447864532470703, 0.005625009536743164, 0.005802154541015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 9.0, 4.0, 5.0, 8.0, 9.0, 18.0, 39.0, 34.0, 42.0, 80.0, 97.0, 144.0, 242.0, 398.0, 711.0, 1594.0, 4307.0, 15714.0, 124204.0, 782295.0, 97723.0, 13657.0, 3969.0, 1507.0, 680.0, 371.0, 208.0, 129.0, 105.0, 57.0, 47.0, 26.0, 35.0, 25.0, 16.0, 7.0, 12.0, 10.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-52.59375, -51.1103515625, -49.626953125, -48.1435546875, -46.66015625, -45.1767578125, -43.693359375, -42.2099609375, -40.7265625, -39.2431640625, -37.759765625, -36.2763671875, -34.79296875, -33.3095703125, -31.826171875, -30.3427734375, -28.859375, -27.3759765625, -25.892578125, -24.4091796875, -22.92578125, -21.4423828125, -19.958984375, -18.4755859375, -16.9921875, -15.5087890625, -14.025390625, -12.5419921875, -11.05859375, -9.5751953125, -8.091796875, -6.6083984375, -5.125, -3.6416015625, -2.158203125, -0.6748046875, 0.80859375, 2.2919921875, 3.775390625, 5.2587890625, 6.7421875, 8.2255859375, 9.708984375, 11.1923828125, 12.67578125, 14.1591796875, 15.642578125, 17.1259765625, 18.609375, 20.0927734375, 21.576171875, 23.0595703125, 24.54296875, 26.0263671875, 27.509765625, 28.9931640625, 30.4765625, 31.9599609375, 33.443359375, 34.9267578125, 36.41015625, 37.8935546875, 39.376953125, 40.8603515625, 42.34375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 7.0, 7.0, 10.0, 6.0, 18.0, 25.0, 22.0, 54.0, 75.0, 98.0, 142.0, 134.0, 127.0, 82.0, 62.0, 32.0, 26.0, 14.0, 13.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.40625, -41.80712890625, -40.2080078125, -38.60888671875, -37.009765625, -35.41064453125, -33.8115234375, -32.21240234375, -30.61328125, -29.01416015625, -27.4150390625, -25.81591796875, -24.216796875, -22.61767578125, -21.0185546875, -19.41943359375, -17.8203125, -16.22119140625, -14.6220703125, -13.02294921875, -11.423828125, -9.82470703125, -8.2255859375, -6.62646484375, -5.02734375, -3.42822265625, -1.8291015625, -0.22998046875, 1.369140625, 2.96826171875, 4.5673828125, 6.16650390625, 7.765625, 9.36474609375, 10.9638671875, 12.56298828125, 14.162109375, 15.76123046875, 17.3603515625, 18.95947265625, 20.55859375, 22.15771484375, 23.7568359375, 25.35595703125, 26.955078125, 28.55419921875, 30.1533203125, 31.75244140625, 33.3515625, 34.95068359375, 36.5498046875, 38.14892578125, 39.748046875, 41.34716796875, 42.9462890625, 44.54541015625, 46.14453125, 47.74365234375, 49.3427734375, 50.94189453125, 52.541015625, 54.14013671875, 55.7392578125, 57.33837890625, 58.9375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 16.0, 46.0, 95.0, 136.0, 230.0, 215.0, 137.0, 60.0, 23.0, 18.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-635.205322265625, -603.095703125, -570.986083984375, -538.87646484375, -506.7668762207031, -474.6572570800781, -442.54766845703125, -410.43804931640625, -378.32843017578125, -346.21881103515625, -314.10919189453125, -281.9996032714844, -249.88998413085938, -217.78036499023438, -185.67076110839844, -153.5611572265625, -121.4515380859375, -89.34192657470703, -57.23231506347656, -25.122703552246094, 6.986907958984375, 39.096527099609375, 71.20613098144531, 103.31573486328125, 135.42535400390625, 167.53497314453125, 199.6445770263672, 231.75418090820312, 263.8638000488281, 295.9734191894531, 328.0830078125, 360.192626953125, 392.3023681640625, 424.4119873046875, 456.5216064453125, 488.6311950683594, 520.7408447265625, 552.8504638671875, 584.9600219726562, 617.0696411132812, 649.1792602539062, 681.2888793945312, 713.3984985351562, 745.5081176757812, 777.61767578125, 809.727294921875, 841.8369140625, 873.946533203125, 906.05615234375, 938.165771484375, 970.275390625, 1002.385009765625, 1034.49462890625, 1066.604248046875, 1098.7138671875, 1130.823486328125, 1162.93310546875, 1195.042724609375, 1227.15234375, 1259.261962890625, 1291.37158203125, 1323.481201171875, 1355.5908203125, 1387.700439453125, 1419.8099365234375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 8.0, 6.0, 8.0, 16.0, 16.0, 13.0, 18.0, 16.0, 24.0, 30.0, 29.0, 42.0, 50.0, 44.0, 56.0, 60.0, 62.0, 47.0, 57.0, 57.0, 42.0, 42.0, 35.0, 40.0, 41.0, 26.0, 24.0, 16.0, 19.0, 9.0, 14.0, 8.0, 8.0, 1.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-464.69232177734375, -450.9377136230469, -437.1830749511719, -423.428466796875, -409.673828125, -395.9192199707031, -382.16461181640625, -368.40997314453125, -354.6553649902344, -340.9007568359375, -327.1461181640625, -313.3915100097656, -299.6368713378906, -285.88226318359375, -272.12762451171875, -258.3730163574219, -244.61839294433594, -230.86376953125, -217.10914611816406, -203.35452270507812, -189.59991455078125, -175.8452911376953, -162.09066772460938, -148.3360595703125, -134.5814208984375, -120.82679748535156, -107.07218170166016, -93.31755828857422, -79.56294250488281, -65.80831909179688, -52.05369567871094, -38.29907989501953, -24.544464111328125, -10.789843559265137, 2.9647769927978516, 16.719398498535156, 30.474018096923828, 44.2286376953125, 57.98326110839844, 71.73787689208984, 85.49250030517578, 99.24712371826172, 113.00173950195312, 126.75636291503906, 140.510986328125, 154.26559448242188, 168.02023315429688, 181.77484130859375, 195.5294647216797, 209.28408813476562, 223.03871154785156, 236.7933349609375, 250.54794311523438, 264.30255126953125, 278.05718994140625, 291.8117980957031, 305.5664367675781, 319.321044921875, 333.07568359375, 346.8302917480469, 360.5849304199219, 374.33953857421875, 388.09417724609375, 401.8487854003906, 415.6033935546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 21.0, 25.0, 38.0, 58.0, 80.0, 118.0, 225.0, 443.0, 965.0, 2295.0, 5939.0, 18274.0, 71135.0, 849220.0, 3071013.0, 131416.0, 28367.0, 8798.0, 3102.0, 1363.0, 603.0, 311.0, 167.0, 103.0, 54.0, 33.0, 21.0, 20.0, 17.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.40625, -50.54638671875, -48.6865234375, -46.82666015625, -44.966796875, -43.10693359375, -41.2470703125, -39.38720703125, -37.52734375, -35.66748046875, -33.8076171875, -31.94775390625, -30.087890625, -28.22802734375, -26.3681640625, -24.50830078125, -22.6484375, -20.78857421875, -18.9287109375, -17.06884765625, -15.208984375, -13.34912109375, -11.4892578125, -9.62939453125, -7.76953125, -5.90966796875, -4.0498046875, -2.18994140625, -0.330078125, 1.52978515625, 3.3896484375, 5.24951171875, 7.109375, 8.96923828125, 10.8291015625, 12.68896484375, 14.548828125, 16.40869140625, 18.2685546875, 20.12841796875, 21.98828125, 23.84814453125, 25.7080078125, 27.56787109375, 29.427734375, 31.28759765625, 33.1474609375, 35.00732421875, 36.8671875, 38.72705078125, 40.5869140625, 42.44677734375, 44.306640625, 46.16650390625, 48.0263671875, 49.88623046875, 51.74609375, 53.60595703125, 55.4658203125, 57.32568359375, 59.185546875, 61.04541015625, 62.9052734375, 64.76513671875, 66.625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 5.0, 7.0, 8.0, 5.0, 13.0, 16.0, 18.0, 21.0, 29.0, 34.0, 36.0, 35.0, 45.0, 56.0, 50.0, 55.0, 43.0, 54.0, 64.0, 52.0, 50.0, 52.0, 43.0, 35.0, 32.0, 22.0, 22.0, 14.0, 11.0, 13.0, 13.0, 11.0, 7.0, 5.0, 6.0, 3.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.578125, -19.95703125, -19.3359375, -18.71484375, -18.09375, -17.47265625, -16.8515625, -16.23046875, -15.609375, -14.98828125, -14.3671875, -13.74609375, -13.125, -12.50390625, -11.8828125, -11.26171875, -10.640625, -10.01953125, -9.3984375, -8.77734375, -8.15625, -7.53515625, -6.9140625, -6.29296875, -5.671875, -5.05078125, -4.4296875, -3.80859375, -3.1875, -2.56640625, -1.9453125, -1.32421875, -0.703125, -0.08203125, 0.5390625, 1.16015625, 1.78125, 2.40234375, 3.0234375, 3.64453125, 4.265625, 4.88671875, 5.5078125, 6.12890625, 6.75, 7.37109375, 7.9921875, 8.61328125, 9.234375, 9.85546875, 10.4765625, 11.09765625, 11.71875, 12.33984375, 12.9609375, 13.58203125, 14.203125, 14.82421875, 15.4453125, 16.06640625, 16.6875, 17.30859375, 17.9296875, 18.55078125, 19.171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 9.0, 10.0, 29.0, 31.0, 59.0, 96.0, 133.0, 303.0, 762.0, 2128.0, 7103.0, 30157.0, 235541.0, 3682107.0, 198499.0, 27616.0, 6396.0, 1958.0, 688.0, 304.0, 124.0, 79.0, 32.0, 30.0, 22.0, 18.0, 7.0, 7.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-97.75, -95.2734375, -92.796875, -90.3203125, -87.84375, -85.3671875, -82.890625, -80.4140625, -77.9375, -75.4609375, -72.984375, -70.5078125, -68.03125, -65.5546875, -63.078125, -60.6015625, -58.125, -55.6484375, -53.171875, -50.6953125, -48.21875, -45.7421875, -43.265625, -40.7890625, -38.3125, -35.8359375, -33.359375, -30.8828125, -28.40625, -25.9296875, -23.453125, -20.9765625, -18.5, -16.0234375, -13.546875, -11.0703125, -8.59375, -6.1171875, -3.640625, -1.1640625, 1.3125, 3.7890625, 6.265625, 8.7421875, 11.21875, 13.6953125, 16.171875, 18.6484375, 21.125, 23.6015625, 26.078125, 28.5546875, 31.03125, 33.5078125, 35.984375, 38.4609375, 40.9375, 43.4140625, 45.890625, 48.3671875, 50.84375, 53.3203125, 55.796875, 58.2734375, 60.75]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 9.0, 5.0, 11.0, 6.0, 12.0, 18.0, 23.0, 37.0, 40.0, 67.0, 98.0, 174.0, 392.0, 934.0, 1173.0, 518.0, 206.0, 104.0, 65.0, 55.0, 40.0, 26.0, 21.0, 12.0, 10.0, 5.0, 5.0, 3.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.625, -61.515625, -59.40625, -57.296875, -55.1875, -53.078125, -50.96875, -48.859375, -46.75, -44.640625, -42.53125, -40.421875, -38.3125, -36.203125, -34.09375, -31.984375, -29.875, -27.765625, -25.65625, -23.546875, -21.4375, -19.328125, -17.21875, -15.109375, -13.0, -10.890625, -8.78125, -6.671875, -4.5625, -2.453125, -0.34375, 1.765625, 3.875, 5.984375, 8.09375, 10.203125, 12.3125, 14.421875, 16.53125, 18.640625, 20.75, 22.859375, 24.96875, 27.078125, 29.1875, 31.296875, 33.40625, 35.515625, 37.625, 39.734375, 41.84375, 43.953125, 46.0625, 48.171875, 50.28125, 52.390625, 54.5, 56.609375, 58.71875, 60.828125, 62.9375, 65.046875, 67.15625, 69.265625, 71.375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 5.0, 23.0, 34.0, 59.0, 136.0, 211.0, 215.0, 148.0, 80.0, 36.0, 15.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-595.4869384765625, -572.8504028320312, -550.2138061523438, -527.5772705078125, -504.94073486328125, -482.3041687011719, -459.6676025390625, -437.03106689453125, -414.3945007324219, -391.7579345703125, -369.12139892578125, -346.4848327636719, -323.8482666015625, -301.21173095703125, -278.5751647949219, -255.93861389160156, -233.30206298828125, -210.66551208496094, -188.02896118164062, -165.39239501953125, -142.75584411621094, -120.11929321289062, -97.48272705078125, -74.84617614746094, -52.209625244140625, -29.573070526123047, -6.936515808105469, 15.700042724609375, 38.33659362792969, 60.97314453125, 83.60971069335938, 106.24626159667969, 128.8828125, 151.5193634033203, 174.15591430664062, 196.79248046875, 219.4290313720703, 242.06558227539062, 264.7021484375, 287.33868408203125, 309.9752502441406, 332.61181640625, 355.24835205078125, 377.8849182128906, 400.521484375, 423.15802001953125, 445.7945861816406, 468.43115234375, 491.06768798828125, 513.7042236328125, 536.3408203125, 558.9773559570312, 581.6138916015625, 604.25048828125, 626.8870239257812, 649.5235595703125, 672.16015625, 694.7966918945312, 717.4332885742188, 740.06982421875, 762.7063598632812, 785.3428955078125, 807.9794921875, 830.6160278320312, 853.2525634765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 9.0, 8.0, 13.0, 10.0, 13.0, 23.0, 36.0, 26.0, 37.0, 30.0, 38.0, 38.0, 42.0, 41.0, 44.0, 47.0, 43.0, 55.0, 59.0, 39.0, 34.0, 43.0, 27.0, 27.0, 30.0, 27.0, 26.0, 17.0, 24.0, 19.0, 14.0, 6.0, 8.0, 3.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.61831665039062, -234.143798828125, -226.66928100585938, -219.1947479248047, -211.72023010253906, -204.24571228027344, -196.77117919921875, -189.29666137695312, -181.8221435546875, -174.34762573242188, -166.87310791015625, -159.39857482910156, -151.92405700683594, -144.4495391845703, -136.97500610351562, -129.50048828125, -122.02597045898438, -114.55145263671875, -107.0769271850586, -99.60240173339844, -92.12788391113281, -84.65336608886719, -77.17884063720703, -69.70431518554688, -62.22979736328125, -54.75527572631836, -47.28075408935547, -39.80623245239258, -32.33171081542969, -24.857189178466797, -17.382667541503906, -9.908145904541016, -2.433624267578125, 5.040897369384766, 12.515419006347656, 19.989940643310547, 27.464462280273438, 34.93898391723633, 42.41350555419922, 49.88802719116211, 57.362548828125, 64.83706665039062, 72.31159210205078, 79.78611755371094, 87.26063537597656, 94.73515319824219, 102.20967864990234, 109.6842041015625, 117.15872192382812, 124.63323974609375, 132.10775756835938, 139.58229064941406, 147.0568084716797, 154.5313262939453, 162.005859375, 169.48037719726562, 176.95489501953125, 184.42941284179688, 191.9039306640625, 199.3784637451172, 206.8529815673828, 214.32749938964844, 221.80203247070312, 229.27655029296875, 236.75106811523438]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 14.0, 9.0, 13.0, 26.0, 37.0, 67.0, 105.0, 145.0, 252.0, 528.0, 1242.0, 3326.0, 10165.0, 37341.0, 159266.0, 515420.0, 242928.0, 55747.0, 14480.0, 4358.0, 1576.0, 677.0, 289.0, 205.0, 113.0, 68.0, 37.0, 30.0, 21.0, 14.0, 7.0, 11.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-87.3125, -84.7919921875, -82.271484375, -79.7509765625, -77.23046875, -74.7099609375, -72.189453125, -69.6689453125, -67.1484375, -64.6279296875, -62.107421875, -59.5869140625, -57.06640625, -54.5458984375, -52.025390625, -49.5048828125, -46.984375, -44.4638671875, -41.943359375, -39.4228515625, -36.90234375, -34.3818359375, -31.861328125, -29.3408203125, -26.8203125, -24.2998046875, -21.779296875, -19.2587890625, -16.73828125, -14.2177734375, -11.697265625, -9.1767578125, -6.65625, -4.1357421875, -1.615234375, 0.9052734375, 3.42578125, 5.9462890625, 8.466796875, 10.9873046875, 13.5078125, 16.0283203125, 18.548828125, 21.0693359375, 23.58984375, 26.1103515625, 28.630859375, 31.1513671875, 33.671875, 36.1923828125, 38.712890625, 41.2333984375, 43.75390625, 46.2744140625, 48.794921875, 51.3154296875, 53.8359375, 56.3564453125, 58.876953125, 61.3974609375, 63.91796875, 66.4384765625, 68.958984375, 71.4794921875, 74.0]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 6.0, 5.0, 6.0, 12.0, 9.0, 9.0, 12.0, 22.0, 21.0, 24.0, 21.0, 44.0, 32.0, 46.0, 44.0, 52.0, 48.0, 48.0, 52.0, 44.0, 62.0, 48.0, 41.0, 40.0, 44.0, 44.0, 37.0, 21.0, 21.0, 18.0, 9.0, 12.0, 11.0, 6.0, 7.0, 6.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.53125, -19.88623046875, -19.2412109375, -18.59619140625, -17.951171875, -17.30615234375, -16.6611328125, -16.01611328125, -15.37109375, -14.72607421875, -14.0810546875, -13.43603515625, -12.791015625, -12.14599609375, -11.5009765625, -10.85595703125, -10.2109375, -9.56591796875, -8.9208984375, -8.27587890625, -7.630859375, -6.98583984375, -6.3408203125, -5.69580078125, -5.05078125, -4.40576171875, -3.7607421875, -3.11572265625, -2.470703125, -1.82568359375, -1.1806640625, -0.53564453125, 0.109375, 0.75439453125, 1.3994140625, 2.04443359375, 2.689453125, 3.33447265625, 3.9794921875, 4.62451171875, 5.26953125, 5.91455078125, 6.5595703125, 7.20458984375, 7.849609375, 8.49462890625, 9.1396484375, 9.78466796875, 10.4296875, 11.07470703125, 11.7197265625, 12.36474609375, 13.009765625, 13.65478515625, 14.2998046875, 14.94482421875, 15.58984375, 16.23486328125, 16.8798828125, 17.52490234375, 18.169921875, 18.81494140625, 19.4599609375, 20.10498046875, 20.75]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 4.0, 14.0, 15.0, 12.0, 21.0, 30.0, 46.0, 77.0, 137.0, 185.0, 325.0, 645.0, 1346.0, 3486.0, 14443.0, 155117.0, 796631.0, 62618.0, 8664.0, 2379.0, 1062.0, 515.0, 293.0, 172.0, 115.0, 59.0, 51.0, 28.0, 21.0, 12.0, 6.0, 6.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-142.375, -137.83203125, -133.2890625, -128.74609375, -124.203125, -119.66015625, -115.1171875, -110.57421875, -106.03125, -101.48828125, -96.9453125, -92.40234375, -87.859375, -83.31640625, -78.7734375, -74.23046875, -69.6875, -65.14453125, -60.6015625, -56.05859375, -51.515625, -46.97265625, -42.4296875, -37.88671875, -33.34375, -28.80078125, -24.2578125, -19.71484375, -15.171875, -10.62890625, -6.0859375, -1.54296875, 3.0, 7.54296875, 12.0859375, 16.62890625, 21.171875, 25.71484375, 30.2578125, 34.80078125, 39.34375, 43.88671875, 48.4296875, 52.97265625, 57.515625, 62.05859375, 66.6015625, 71.14453125, 75.6875, 80.23046875, 84.7734375, 89.31640625, 93.859375, 98.40234375, 102.9453125, 107.48828125, 112.03125, 116.57421875, 121.1171875, 125.66015625, 130.203125, 134.74609375, 139.2890625, 143.83203125, 148.375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 4.0, 3.0, 11.0, 17.0, 16.0, 13.0, 23.0, 26.0, 43.0, 36.0, 44.0, 44.0, 52.0, 70.0, 49.0, 62.0, 57.0, 51.0, 59.0, 47.0, 42.0, 38.0, 32.0, 33.0, 16.0, 19.0, 16.0, 18.0, 14.0, 4.0, 7.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.5, -85.2255859375, -81.951171875, -78.6767578125, -75.40234375, -72.1279296875, -68.853515625, -65.5791015625, -62.3046875, -59.0302734375, -55.755859375, -52.4814453125, -49.20703125, -45.9326171875, -42.658203125, -39.3837890625, -36.109375, -32.8349609375, -29.560546875, -26.2861328125, -23.01171875, -19.7373046875, -16.462890625, -13.1884765625, -9.9140625, -6.6396484375, -3.365234375, -0.0908203125, 3.18359375, 6.4580078125, 9.732421875, 13.0068359375, 16.28125, 19.5556640625, 22.830078125, 26.1044921875, 29.37890625, 32.6533203125, 35.927734375, 39.2021484375, 42.4765625, 45.7509765625, 49.025390625, 52.2998046875, 55.57421875, 58.8486328125, 62.123046875, 65.3974609375, 68.671875, 71.9462890625, 75.220703125, 78.4951171875, 81.76953125, 85.0439453125, 88.318359375, 91.5927734375, 94.8671875, 98.1416015625, 101.416015625, 104.6904296875, 107.96484375, 111.2392578125, 114.513671875, 117.7880859375, 121.0625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 1.0, 4.0, 1.0, 7.0, 10.0, 9.0, 14.0, 21.0, 27.0, 34.0, 73.0, 68.0, 145.0, 246.0, 458.0, 972.0, 2776.0, 11089.0, 100926.0, 846185.0, 72069.0, 9140.0, 2346.0, 893.0, 408.0, 225.0, 136.0, 76.0, 56.0, 32.0, 22.0, 17.0, 13.0, 20.0, 10.0, 3.0, 6.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.65625, -50.9814453125, -49.306640625, -47.6318359375, -45.95703125, -44.2822265625, -42.607421875, -40.9326171875, -39.2578125, -37.5830078125, -35.908203125, -34.2333984375, -32.55859375, -30.8837890625, -29.208984375, -27.5341796875, -25.859375, -24.1845703125, -22.509765625, -20.8349609375, -19.16015625, -17.4853515625, -15.810546875, -14.1357421875, -12.4609375, -10.7861328125, -9.111328125, -7.4365234375, -5.76171875, -4.0869140625, -2.412109375, -0.7373046875, 0.9375, 2.6123046875, 4.287109375, 5.9619140625, 7.63671875, 9.3115234375, 10.986328125, 12.6611328125, 14.3359375, 16.0107421875, 17.685546875, 19.3603515625, 21.03515625, 22.7099609375, 24.384765625, 26.0595703125, 27.734375, 29.4091796875, 31.083984375, 32.7587890625, 34.43359375, 36.1083984375, 37.783203125, 39.4580078125, 41.1328125, 42.8076171875, 44.482421875, 46.1572265625, 47.83203125, 49.5068359375, 51.181640625, 52.8564453125, 54.53125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 8.0, 7.0, 5.0, 13.0, 17.0, 22.0, 39.0, 54.0, 99.0, 167.0, 204.0, 160.0, 87.0, 38.0, 29.0, 18.0, 16.0, 8.0, 6.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01345062255859375, -0.013058662414550781, -0.012666702270507812, -0.012274742126464844, -0.011882781982421875, -0.011490821838378906, -0.011098861694335938, -0.010706901550292969, -0.01031494140625, -0.009922981262207031, -0.009531021118164062, -0.009139060974121094, -0.008747100830078125, -0.008355140686035156, -0.007963180541992188, -0.007571220397949219, -0.00717926025390625, -0.006787300109863281, -0.0063953399658203125, -0.006003379821777344, -0.005611419677734375, -0.005219459533691406, -0.0048274993896484375, -0.004435539245605469, -0.0040435791015625, -0.0036516189575195312, -0.0032596588134765625, -0.0028676986694335938, -0.002475738525390625, -0.0020837783813476562, -0.0016918182373046875, -0.0012998580932617188, -0.00090789794921875, -0.0005159378051757812, -0.0001239776611328125, 0.00026798248291015625, 0.000659942626953125, 0.0010519027709960938, 0.0014438629150390625, 0.0018358230590820312, 0.002227783203125, 0.0026197433471679688, 0.0030117034912109375, 0.0034036636352539062, 0.003795623779296875, 0.004187583923339844, 0.0045795440673828125, 0.004971504211425781, 0.00536346435546875, 0.005755424499511719, 0.0061473846435546875, 0.006539344787597656, 0.006931304931640625, 0.007323265075683594, 0.0077152252197265625, 0.008107185363769531, 0.0084991455078125, 0.008891105651855469, 0.009283065795898438, 0.009675025939941406, 0.010066986083984375, 0.010458946228027344, 0.010850906372070312, 0.011242866516113281, 0.01163482666015625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 14.0, 14.0, 21.0, 32.0, 34.0, 66.0, 103.0, 171.0, 304.0, 623.0, 1541.0, 4856.0, 25991.0, 611010.0, 376625.0, 20390.0, 4115.0, 1361.0, 574.0, 275.0, 128.0, 77.0, 65.0, 48.0, 30.0, 15.0, 12.0, 9.0, 10.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.15625, -47.39697265625, -45.6376953125, -43.87841796875, -42.119140625, -40.35986328125, -38.6005859375, -36.84130859375, -35.08203125, -33.32275390625, -31.5634765625, -29.80419921875, -28.044921875, -26.28564453125, -24.5263671875, -22.76708984375, -21.0078125, -19.24853515625, -17.4892578125, -15.72998046875, -13.970703125, -12.21142578125, -10.4521484375, -8.69287109375, -6.93359375, -5.17431640625, -3.4150390625, -1.65576171875, 0.103515625, 1.86279296875, 3.6220703125, 5.38134765625, 7.140625, 8.89990234375, 10.6591796875, 12.41845703125, 14.177734375, 15.93701171875, 17.6962890625, 19.45556640625, 21.21484375, 22.97412109375, 24.7333984375, 26.49267578125, 28.251953125, 30.01123046875, 31.7705078125, 33.52978515625, 35.2890625, 37.04833984375, 38.8076171875, 40.56689453125, 42.326171875, 44.08544921875, 45.8447265625, 47.60400390625, 49.36328125, 51.12255859375, 52.8818359375, 54.64111328125, 56.400390625, 58.15966796875, 59.9189453125, 61.67822265625, 63.4375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 12.0, 13.0, 12.0, 13.0, 30.0, 26.0, 51.0, 75.0, 70.0, 101.0, 123.0, 116.0, 72.0, 76.0, 59.0, 34.0, 26.0, 18.0, 13.0, 7.0, 8.0, 6.0, 6.0, 8.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.0625, -37.79296875, -36.5234375, -35.25390625, -33.984375, -32.71484375, -31.4453125, -30.17578125, -28.90625, -27.63671875, -26.3671875, -25.09765625, -23.828125, -22.55859375, -21.2890625, -20.01953125, -18.75, -17.48046875, -16.2109375, -14.94140625, -13.671875, -12.40234375, -11.1328125, -9.86328125, -8.59375, -7.32421875, -6.0546875, -4.78515625, -3.515625, -2.24609375, -0.9765625, 0.29296875, 1.5625, 2.83203125, 4.1015625, 5.37109375, 6.640625, 7.91015625, 9.1796875, 10.44921875, 11.71875, 12.98828125, 14.2578125, 15.52734375, 16.796875, 18.06640625, 19.3359375, 20.60546875, 21.875, 23.14453125, 24.4140625, 25.68359375, 26.953125, 28.22265625, 29.4921875, 30.76171875, 32.03125, 33.30078125, 34.5703125, 35.83984375, 37.109375, 38.37890625, 39.6484375, 40.91796875, 42.1875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 8.0, 15.0, 37.0, 70.0, 123.0, 195.0, 212.0, 160.0, 81.0, 40.0, 28.0, 12.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1059.01806640625, -1032.680908203125, -1006.3436279296875, -980.0064086914062, -953.669189453125, -927.33203125, -900.9948120117188, -874.6575927734375, -848.3203735351562, -821.983154296875, -795.6459350585938, -769.3087158203125, -742.9715576171875, -716.63427734375, -690.297119140625, -663.9598999023438, -637.6226806640625, -611.2854614257812, -584.9482421875, -558.6110229492188, -532.2738037109375, -505.9366149902344, -479.59942626953125, -453.26220703125, -426.92498779296875, -400.5877685546875, -374.25054931640625, -347.9133605957031, -321.5761413574219, -295.2389221191406, -268.9017333984375, -242.56451416015625, -216.227294921875, -189.89007568359375, -163.55287170410156, -137.21566772460938, -110.87844848632812, -84.54122924804688, -58.20402526855469, -31.8668212890625, -5.52960205078125, 20.80760955810547, 47.14482116699219, 73.4820327758789, 99.81924438476562, 126.15646362304688, 152.49366760253906, 178.83087158203125, 205.1680908203125, 231.50531005859375, 257.842529296875, 284.1797180175781, 310.5169372558594, 336.8541564941406, 363.19134521484375, 389.528564453125, 415.86578369140625, 442.2030029296875, 468.54022216796875, 494.8774108886719, 521.214599609375, 547.5518798828125, 573.8890380859375, 600.2262573242188, 626.5634765625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 12.0, 19.0, 15.0, 20.0, 40.0, 48.0, 58.0, 51.0, 55.0, 74.0, 96.0, 80.0, 74.0, 59.0, 66.0, 52.0, 44.0, 38.0, 19.0, 20.0, 21.0, 10.0, 10.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-653.1954345703125, -636.46875, -619.7420043945312, -603.0153198242188, -586.28857421875, -569.5618896484375, -552.8351440429688, -536.1084594726562, -519.3817138671875, -502.6549987792969, -485.92828369140625, -469.2015686035156, -452.474853515625, -435.7481689453125, -419.0214538574219, -402.29473876953125, -385.56805419921875, -368.8413391113281, -352.1146240234375, -335.3879089355469, -318.66119384765625, -301.93450927734375, -285.2077941894531, -268.4810791015625, -251.75436401367188, -235.02764892578125, -218.30093383789062, -201.57423400878906, -184.84751892089844, -168.1208038330078, -151.39410400390625, -134.66738891601562, -117.940673828125, -101.21395874023438, -84.48725128173828, -67.76054382324219, -51.03382873535156, -34.30711364746094, -17.580406188964844, -0.85369873046875, 15.873016357421875, 32.599727630615234, 49.326438903808594, 66.05314636230469, 82.77986145019531, 99.50657653808594, 116.23328399658203, 132.95999145507812, 149.68670654296875, 166.41342163085938, 183.14013671875, 199.86683654785156, 216.5935516357422, 233.3202667236328, 250.04696655273438, 266.773681640625, 283.5003967285156, 300.22711181640625, 316.9538269042969, 333.6805419921875, 350.4072265625, 367.13397216796875, 383.86065673828125, 400.5873718261719, 417.3140869140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 16.0, 12.0, 19.0, 24.0, 36.0, 57.0, 97.0, 185.0, 380.0, 902.0, 2639.0, 9081.0, 47235.0, 2144638.0, 1928712.0, 46502.0, 9393.0, 2685.0, 860.0, 348.0, 194.0, 122.0, 51.0, 32.0, 21.0, 12.0, 6.0, 3.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-90.0, -87.69189453125, -85.3837890625, -83.07568359375, -80.767578125, -78.45947265625, -76.1513671875, -73.84326171875, -71.53515625, -69.22705078125, -66.9189453125, -64.61083984375, -62.302734375, -59.99462890625, -57.6865234375, -55.37841796875, -53.0703125, -50.76220703125, -48.4541015625, -46.14599609375, -43.837890625, -41.52978515625, -39.2216796875, -36.91357421875, -34.60546875, -32.29736328125, -29.9892578125, -27.68115234375, -25.373046875, -23.06494140625, -20.7568359375, -18.44873046875, -16.140625, -13.83251953125, -11.5244140625, -9.21630859375, -6.908203125, -4.60009765625, -2.2919921875, 0.01611328125, 2.32421875, 4.63232421875, 6.9404296875, 9.24853515625, 11.556640625, 13.86474609375, 16.1728515625, 18.48095703125, 20.7890625, 23.09716796875, 25.4052734375, 27.71337890625, 30.021484375, 32.32958984375, 34.6376953125, 36.94580078125, 39.25390625, 41.56201171875, 43.8701171875, 46.17822265625, 48.486328125, 50.79443359375, 53.1025390625, 55.41064453125, 57.71875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 13.0, 20.0, 22.0, 52.0, 69.0, 105.0, 121.0, 141.0, 124.0, 104.0, 99.0, 45.0, 42.0, 24.0, 15.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.375, -73.76171875, -72.1484375, -70.53515625, -68.921875, -67.30859375, -65.6953125, -64.08203125, -62.46875, -60.85546875, -59.2421875, -57.62890625, -56.015625, -54.40234375, -52.7890625, -51.17578125, -49.5625, -47.94921875, -46.3359375, -44.72265625, -43.109375, -41.49609375, -39.8828125, -38.26953125, -36.65625, -35.04296875, -33.4296875, -31.81640625, -30.203125, -28.58984375, -26.9765625, -25.36328125, -23.75, -22.13671875, -20.5234375, -18.91015625, -17.296875, -15.68359375, -14.0703125, -12.45703125, -10.84375, -9.23046875, -7.6171875, -6.00390625, -4.390625, -2.77734375, -1.1640625, 0.44921875, 2.0625, 3.67578125, 5.2890625, 6.90234375, 8.515625, 10.12890625, 11.7421875, 13.35546875, 14.96875, 16.58203125, 18.1953125, 19.80859375, 21.421875, 23.03515625, 24.6484375, 26.26171875, 27.875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 9.0, 14.0, 12.0, 22.0, 30.0, 53.0, 57.0, 114.0, 201.0, 344.0, 625.0, 1137.0, 2238.0, 4686.0, 10106.0, 24165.0, 71291.0, 425621.0, 3227434.0, 322881.0, 62652.0, 22043.0, 9294.0, 4394.0, 2197.0, 1173.0, 615.0, 336.0, 204.0, 116.0, 73.0, 47.0, 30.0, 19.0, 16.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.25, -45.83740234375, -44.4248046875, -43.01220703125, -41.599609375, -40.18701171875, -38.7744140625, -37.36181640625, -35.94921875, -34.53662109375, -33.1240234375, -31.71142578125, -30.298828125, -28.88623046875, -27.4736328125, -26.06103515625, -24.6484375, -23.23583984375, -21.8232421875, -20.41064453125, -18.998046875, -17.58544921875, -16.1728515625, -14.76025390625, -13.34765625, -11.93505859375, -10.5224609375, -9.10986328125, -7.697265625, -6.28466796875, -4.8720703125, -3.45947265625, -2.046875, -0.63427734375, 0.7783203125, 2.19091796875, 3.603515625, 5.01611328125, 6.4287109375, 7.84130859375, 9.25390625, 10.66650390625, 12.0791015625, 13.49169921875, 14.904296875, 16.31689453125, 17.7294921875, 19.14208984375, 20.5546875, 21.96728515625, 23.3798828125, 24.79248046875, 26.205078125, 27.61767578125, 29.0302734375, 30.44287109375, 31.85546875, 33.26806640625, 34.6806640625, 36.09326171875, 37.505859375, 38.91845703125, 40.3310546875, 41.74365234375, 43.15625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 11.0, 12.0, 6.0, 19.0, 21.0, 21.0, 39.0, 48.0, 72.0, 99.0, 221.0, 377.0, 824.0, 1049.0, 533.0, 248.0, 141.0, 89.0, 73.0, 37.0, 25.0, 13.0, 14.0, 17.0, 5.0, 14.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.9375, -52.31982421875, -50.7021484375, -49.08447265625, -47.466796875, -45.84912109375, -44.2314453125, -42.61376953125, -40.99609375, -39.37841796875, -37.7607421875, -36.14306640625, -34.525390625, -32.90771484375, -31.2900390625, -29.67236328125, -28.0546875, -26.43701171875, -24.8193359375, -23.20166015625, -21.583984375, -19.96630859375, -18.3486328125, -16.73095703125, -15.11328125, -13.49560546875, -11.8779296875, -10.26025390625, -8.642578125, -7.02490234375, -5.4072265625, -3.78955078125, -2.171875, -0.55419921875, 1.0634765625, 2.68115234375, 4.298828125, 5.91650390625, 7.5341796875, 9.15185546875, 10.76953125, 12.38720703125, 14.0048828125, 15.62255859375, 17.240234375, 18.85791015625, 20.4755859375, 22.09326171875, 23.7109375, 25.32861328125, 26.9462890625, 28.56396484375, 30.181640625, 31.79931640625, 33.4169921875, 35.03466796875, 36.65234375, 38.27001953125, 39.8876953125, 41.50537109375, 43.123046875, 44.74072265625, 46.3583984375, 47.97607421875, 49.59375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 9.0, 18.0, 21.0, 39.0, 95.0, 182.0, 213.0, 196.0, 105.0, 66.0, 22.0, 14.0, 5.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-520.798583984375, -501.9437255859375, -483.0888671875, -464.2339782714844, -445.3791198730469, -426.5242614746094, -407.66937255859375, -388.81451416015625, -369.95965576171875, -351.10479736328125, -332.24993896484375, -313.3950500488281, -294.5401916503906, -275.6853332519531, -256.8304443359375, -237.9755859375, -219.1207275390625, -200.265869140625, -181.41099548339844, -162.55612182617188, -143.70126342773438, -124.84639739990234, -105.99153137207031, -87.13665771484375, -68.28179931640625, -49.42693328857422, -30.572067260742188, -11.717201232910156, 7.137664794921875, 25.992530822753906, 44.84739685058594, 63.7022705078125, 82.55712890625, 101.41199493408203, 120.26686096191406, 139.12173461914062, 157.97659301757812, 176.83145141601562, 195.6863250732422, 214.54119873046875, 233.39605712890625, 252.25091552734375, 271.10577392578125, 289.9606628417969, 308.8155212402344, 327.6703796386719, 346.5252685546875, 365.380126953125, 384.2349853515625, 403.08984375, 421.9447021484375, 440.7995910644531, 459.6544494628906, 478.5093078613281, 497.36419677734375, 516.2190551757812, 535.0739135742188, 553.9287719726562, 572.7836303710938, 591.6384887695312, 610.493408203125, 629.3482666015625, 648.203125, 667.0579833984375, 685.912841796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 7.0, 2.0, 11.0, 6.0, 15.0, 16.0, 16.0, 13.0, 20.0, 22.0, 26.0, 22.0, 26.0, 38.0, 24.0, 38.0, 39.0, 36.0, 32.0, 42.0, 43.0, 43.0, 45.0, 26.0, 31.0, 43.0, 28.0, 23.0, 31.0, 28.0, 27.0, 24.0, 25.0, 27.0, 24.0, 16.0, 13.0, 7.0, 6.0, 4.0, 9.0, 6.0, 4.0, 6.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-185.49554443359375, -179.41937255859375, -173.3431854248047, -167.2670135498047, -161.19082641601562, -155.11465454101562, -149.03846740722656, -142.96229553222656, -136.8861083984375, -130.8099365234375, -124.73374938964844, -118.6575698852539, -112.58139038085938, -106.50521087646484, -100.42903137207031, -94.35285949707031, -88.27667999267578, -82.20050048828125, -76.12432098388672, -70.04814147949219, -63.971961975097656, -57.895782470703125, -51.81960678100586, -45.74342727661133, -39.6672477722168, -33.591068267822266, -27.514888763427734, -21.438711166381836, -15.362531661987305, -9.286352157592773, -3.210174560546875, 2.8660049438476562, 8.942184448242188, 15.018363952636719, 21.09454345703125, 27.17072105407715, 33.24690246582031, 39.323081970214844, 45.39925765991211, 51.47543716430664, 57.55161666870117, 63.6277961730957, 69.70397186279297, 75.7801513671875, 81.85633087158203, 87.93251037597656, 94.0086898803711, 100.08486938476562, 106.16104888916016, 112.23722839355469, 118.31340789794922, 124.38958740234375, 130.46575927734375, 136.5419464111328, 142.6181182861328, 148.69430541992188, 154.77047729492188, 160.84664916992188, 166.92283630371094, 172.99900817871094, 179.0751953125, 185.1513671875, 191.22755432128906, 197.30372619628906, 203.37991333007812]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 10.0, 15.0, 19.0, 32.0, 57.0, 129.0, 265.0, 746.0, 2134.0, 8307.0, 41107.0, 266819.0, 590132.0, 113042.0, 19284.0, 4396.0, 1242.0, 429.0, 184.0, 88.0, 52.0, 27.0, 16.0, 11.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.0625, -88.0546875, -85.046875, -82.0390625, -79.03125, -76.0234375, -73.015625, -70.0078125, -67.0, -63.9921875, -60.984375, -57.9765625, -54.96875, -51.9609375, -48.953125, -45.9453125, -42.9375, -39.9296875, -36.921875, -33.9140625, -30.90625, -27.8984375, -24.890625, -21.8828125, -18.875, -15.8671875, -12.859375, -9.8515625, -6.84375, -3.8359375, -0.828125, 2.1796875, 5.1875, 8.1953125, 11.203125, 14.2109375, 17.21875, 20.2265625, 23.234375, 26.2421875, 29.25, 32.2578125, 35.265625, 38.2734375, 41.28125, 44.2890625, 47.296875, 50.3046875, 53.3125, 56.3203125, 59.328125, 62.3359375, 65.34375, 68.3515625, 71.359375, 74.3671875, 77.375, 80.3828125, 83.390625, 86.3984375, 89.40625, 92.4140625, 95.421875, 98.4296875, 101.4375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 4.0, 16.0, 27.0, 39.0, 45.0, 61.0, 59.0, 69.0, 72.0, 90.0, 77.0, 83.0, 68.0, 55.0, 56.0, 51.0, 34.0, 36.0, 13.0, 15.0, 12.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-47.53125, -46.4326171875, -45.333984375, -44.2353515625, -43.13671875, -42.0380859375, -40.939453125, -39.8408203125, -38.7421875, -37.6435546875, -36.544921875, -35.4462890625, -34.34765625, -33.2490234375, -32.150390625, -31.0517578125, -29.953125, -28.8544921875, -27.755859375, -26.6572265625, -25.55859375, -24.4599609375, -23.361328125, -22.2626953125, -21.1640625, -20.0654296875, -18.966796875, -17.8681640625, -16.76953125, -15.6708984375, -14.572265625, -13.4736328125, -12.375, -11.2763671875, -10.177734375, -9.0791015625, -7.98046875, -6.8818359375, -5.783203125, -4.6845703125, -3.5859375, -2.4873046875, -1.388671875, -0.2900390625, 0.80859375, 1.9072265625, 3.005859375, 4.1044921875, 5.203125, 6.3017578125, 7.400390625, 8.4990234375, 9.59765625, 10.6962890625, 11.794921875, 12.8935546875, 13.9921875, 15.0908203125, 16.189453125, 17.2880859375, 18.38671875, 19.4853515625, 20.583984375, 21.6826171875, 22.78125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 5.0, 22.0, 15.0, 35.0, 32.0, 49.0, 96.0, 132.0, 231.0, 381.0, 660.0, 1342.0, 2991.0, 7945.0, 27366.0, 124755.0, 616837.0, 205447.0, 41519.0, 11253.0, 3836.0, 1569.0, 812.0, 447.0, 289.0, 169.0, 95.0, 75.0, 48.0, 34.0, 12.0, 17.0, 10.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-93.9375, -91.3740234375, -88.810546875, -86.2470703125, -83.68359375, -81.1201171875, -78.556640625, -75.9931640625, -73.4296875, -70.8662109375, -68.302734375, -65.7392578125, -63.17578125, -60.6123046875, -58.048828125, -55.4853515625, -52.921875, -50.3583984375, -47.794921875, -45.2314453125, -42.66796875, -40.1044921875, -37.541015625, -34.9775390625, -32.4140625, -29.8505859375, -27.287109375, -24.7236328125, -22.16015625, -19.5966796875, -17.033203125, -14.4697265625, -11.90625, -9.3427734375, -6.779296875, -4.2158203125, -1.65234375, 0.9111328125, 3.474609375, 6.0380859375, 8.6015625, 11.1650390625, 13.728515625, 16.2919921875, 18.85546875, 21.4189453125, 23.982421875, 26.5458984375, 29.109375, 31.6728515625, 34.236328125, 36.7998046875, 39.36328125, 41.9267578125, 44.490234375, 47.0537109375, 49.6171875, 52.1806640625, 54.744140625, 57.3076171875, 59.87109375, 62.4345703125, 64.998046875, 67.5615234375, 70.125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 5.0, 15.0, 10.0, 17.0, 19.0, 13.0, 24.0, 23.0, 28.0, 35.0, 27.0, 29.0, 46.0, 40.0, 47.0, 50.0, 49.0, 42.0, 48.0, 47.0, 50.0, 35.0, 43.0, 25.0, 35.0, 27.0, 19.0, 28.0, 22.0, 9.0, 9.0, 18.0, 11.0, 5.0, 11.0, 0.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.9375, -74.3701171875, -71.802734375, -69.2353515625, -66.66796875, -64.1005859375, -61.533203125, -58.9658203125, -56.3984375, -53.8310546875, -51.263671875, -48.6962890625, -46.12890625, -43.5615234375, -40.994140625, -38.4267578125, -35.859375, -33.2919921875, -30.724609375, -28.1572265625, -25.58984375, -23.0224609375, -20.455078125, -17.8876953125, -15.3203125, -12.7529296875, -10.185546875, -7.6181640625, -5.05078125, -2.4833984375, 0.083984375, 2.6513671875, 5.21875, 7.7861328125, 10.353515625, 12.9208984375, 15.48828125, 18.0556640625, 20.623046875, 23.1904296875, 25.7578125, 28.3251953125, 30.892578125, 33.4599609375, 36.02734375, 38.5947265625, 41.162109375, 43.7294921875, 46.296875, 48.8642578125, 51.431640625, 53.9990234375, 56.56640625, 59.1337890625, 61.701171875, 64.2685546875, 66.8359375, 69.4033203125, 71.970703125, 74.5380859375, 77.10546875, 79.6728515625, 82.240234375, 84.8076171875, 87.375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 10.0, 11.0, 17.0, 25.0, 47.0, 45.0, 93.0, 171.0, 332.0, 871.0, 2737.0, 13679.0, 195415.0, 783156.0, 43740.0, 5583.0, 1486.0, 543.0, 255.0, 112.0, 85.0, 39.0, 31.0, 17.0, 11.0, 7.0, 8.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.25, -41.537109375, -39.82421875, -38.111328125, -36.3984375, -34.685546875, -32.97265625, -31.259765625, -29.546875, -27.833984375, -26.12109375, -24.408203125, -22.6953125, -20.982421875, -19.26953125, -17.556640625, -15.84375, -14.130859375, -12.41796875, -10.705078125, -8.9921875, -7.279296875, -5.56640625, -3.853515625, -2.140625, -0.427734375, 1.28515625, 2.998046875, 4.7109375, 6.423828125, 8.13671875, 9.849609375, 11.5625, 13.275390625, 14.98828125, 16.701171875, 18.4140625, 20.126953125, 21.83984375, 23.552734375, 25.265625, 26.978515625, 28.69140625, 30.404296875, 32.1171875, 33.830078125, 35.54296875, 37.255859375, 38.96875, 40.681640625, 42.39453125, 44.107421875, 45.8203125, 47.533203125, 49.24609375, 50.958984375, 52.671875, 54.384765625, 56.09765625, 57.810546875, 59.5234375, 61.236328125, 62.94921875, 64.662109375, 66.375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 11.0, 7.0, 7.0, 15.0, 24.0, 20.0, 34.0, 37.0, 65.0, 66.0, 73.0, 115.0, 114.0, 97.0, 61.0, 67.0, 55.0, 27.0, 22.0, 27.0, 12.0, 12.0, 10.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006763458251953125, -0.006570994853973389, -0.006378531455993652, -0.006186068058013916, -0.00599360466003418, -0.005801141262054443, -0.005608677864074707, -0.005416214466094971, -0.005223751068115234, -0.005031287670135498, -0.004838824272155762, -0.004646360874176025, -0.004453897476196289, -0.004261434078216553, -0.004068970680236816, -0.00387650728225708, -0.0036840438842773438, -0.0034915804862976074, -0.003299117088317871, -0.0031066536903381348, -0.0029141902923583984, -0.002721726894378662, -0.0025292634963989258, -0.0023368000984191895, -0.002144336700439453, -0.0019518733024597168, -0.0017594099044799805, -0.0015669465065002441, -0.0013744831085205078, -0.0011820197105407715, -0.0009895563125610352, -0.0007970929145812988, -0.0006046295166015625, -0.00041216611862182617, -0.00021970272064208984, -2.7239322662353516e-05, 0.0001652240753173828, 0.00035768747329711914, 0.0005501508712768555, 0.0007426142692565918, 0.0009350776672363281, 0.0011275410652160645, 0.0013200044631958008, 0.0015124678611755371, 0.0017049312591552734, 0.0018973946571350098, 0.002089858055114746, 0.0022823214530944824, 0.0024747848510742188, 0.002667248249053955, 0.0028597116470336914, 0.0030521750450134277, 0.003244638442993164, 0.0034371018409729004, 0.0036295652389526367, 0.003822028636932373, 0.004014492034912109, 0.004206955432891846, 0.004399418830871582, 0.004591882228851318, 0.004784345626831055, 0.004976809024810791, 0.005169272422790527, 0.005361735820770264, 0.00555419921875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 8.0, 17.0, 13.0, 24.0, 43.0, 46.0, 108.0, 155.0, 306.0, 577.0, 1079.0, 2475.0, 7036.0, 27665.0, 194920.0, 686138.0, 101728.0, 17272.0, 4911.0, 1998.0, 886.0, 460.0, 256.0, 145.0, 96.0, 61.0, 37.0, 23.0, 17.0, 12.0, 8.0, 5.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.90625, -32.82470703125, -31.7431640625, -30.66162109375, -29.580078125, -28.49853515625, -27.4169921875, -26.33544921875, -25.25390625, -24.17236328125, -23.0908203125, -22.00927734375, -20.927734375, -19.84619140625, -18.7646484375, -17.68310546875, -16.6015625, -15.52001953125, -14.4384765625, -13.35693359375, -12.275390625, -11.19384765625, -10.1123046875, -9.03076171875, -7.94921875, -6.86767578125, -5.7861328125, -4.70458984375, -3.623046875, -2.54150390625, -1.4599609375, -0.37841796875, 0.703125, 1.78466796875, 2.8662109375, 3.94775390625, 5.029296875, 6.11083984375, 7.1923828125, 8.27392578125, 9.35546875, 10.43701171875, 11.5185546875, 12.60009765625, 13.681640625, 14.76318359375, 15.8447265625, 16.92626953125, 18.0078125, 19.08935546875, 20.1708984375, 21.25244140625, 22.333984375, 23.41552734375, 24.4970703125, 25.57861328125, 26.66015625, 27.74169921875, 28.8232421875, 29.90478515625, 30.986328125, 32.06787109375, 33.1494140625, 34.23095703125, 35.3125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 16.0, 11.0, 31.0, 27.0, 44.0, 72.0, 102.0, 97.0, 126.0, 119.0, 104.0, 74.0, 53.0, 39.0, 16.0, 16.0, 15.0, 7.0, 6.0, 4.0, 8.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.59375, -35.322265625, -34.05078125, -32.779296875, -31.5078125, -30.236328125, -28.96484375, -27.693359375, -26.421875, -25.150390625, -23.87890625, -22.607421875, -21.3359375, -20.064453125, -18.79296875, -17.521484375, -16.25, -14.978515625, -13.70703125, -12.435546875, -11.1640625, -9.892578125, -8.62109375, -7.349609375, -6.078125, -4.806640625, -3.53515625, -2.263671875, -0.9921875, 0.279296875, 1.55078125, 2.822265625, 4.09375, 5.365234375, 6.63671875, 7.908203125, 9.1796875, 10.451171875, 11.72265625, 12.994140625, 14.265625, 15.537109375, 16.80859375, 18.080078125, 19.3515625, 20.623046875, 21.89453125, 23.166015625, 24.4375, 25.708984375, 26.98046875, 28.251953125, 29.5234375, 30.794921875, 32.06640625, 33.337890625, 34.609375, 35.880859375, 37.15234375, 38.423828125, 39.6953125, 40.966796875, 42.23828125, 43.509765625, 44.78125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 9.0, 13.0, 21.0, 65.0, 121.0, 193.0, 226.0, 162.0, 80.0, 50.0, 23.0, 14.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-844.7828369140625, -820.2403564453125, -795.6979370117188, -771.1554565429688, -746.6129760742188, -722.070556640625, -697.528076171875, -672.985595703125, -648.4431762695312, -623.9006958007812, -599.3582763671875, -574.8157958984375, -550.2733154296875, -525.7308959960938, -501.18841552734375, -476.6459655761719, -452.1034851074219, -427.56103515625, -403.0185546875, -378.4761047363281, -353.93365478515625, -329.39117431640625, -304.8487243652344, -280.3062744140625, -255.76380920410156, -231.22134399414062, -206.67889404296875, -182.1364288330078, -157.59396362304688, -133.051513671875, -108.50904846191406, -83.96659851074219, -59.42413330078125, -34.881675720214844, -10.339214324951172, 14.2032470703125, 38.745704650878906, 63.28816223144531, 87.83062744140625, 112.37307739257812, 136.91554260253906, 161.4580078125, 186.00045776367188, 210.5429229736328, 235.08538818359375, 259.6278381347656, 284.1702880859375, 308.7127685546875, 333.2552185058594, 357.79766845703125, 382.34014892578125, 406.8825988769531, 431.425048828125, 455.967529296875, 480.5099792480469, 505.05242919921875, 529.5949096679688, 554.1373901367188, 578.6798095703125, 603.2222900390625, 627.7647705078125, 652.3071899414062, 676.8496704101562, 701.39208984375, 725.9345703125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 4.0, 9.0, 14.0, 17.0, 15.0, 11.0, 18.0, 19.0, 30.0, 30.0, 35.0, 36.0, 35.0, 37.0, 47.0, 52.0, 65.0, 60.0, 53.0, 34.0, 43.0, 43.0, 47.0, 29.0, 23.0, 31.0, 23.0, 29.0, 21.0, 18.0, 21.0, 10.0, 10.0, 7.0, 6.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-310.74908447265625, -299.2730407714844, -287.7969970703125, -276.3209533691406, -264.84490966796875, -253.3688507080078, -241.89279174804688, -230.416748046875, -218.94070434570312, -207.46466064453125, -195.98861694335938, -184.51255798339844, -173.03651428222656, -161.5604705810547, -150.08441162109375, -138.60836791992188, -127.13232421875, -115.65628051757812, -104.18022918701172, -92.70417785644531, -81.22813415527344, -69.75209045410156, -58.276039123535156, -46.79998779296875, -35.323944091796875, -23.847896575927734, -12.371849060058594, -0.8958015441894531, 10.580245971679688, 22.056293487548828, 33.53234100341797, 45.008392333984375, 56.484405517578125, 67.96044921875, 79.4365005493164, 90.91255187988281, 102.38859558105469, 113.86463928222656, 125.34069061279297, 136.81674194335938, 148.29278564453125, 159.76882934570312, 171.244873046875, 182.72093200683594, 194.1969757080078, 205.6730194091797, 217.14907836914062, 228.6251220703125, 240.10116577148438, 251.57720947265625, 263.0532531738281, 274.529296875, 286.00537109375, 297.4814147949219, 308.95745849609375, 320.4335021972656, 331.9095458984375, 343.3855895996094, 354.86163330078125, 366.3376770019531, 377.813720703125, 389.289794921875, 400.7658386230469, 412.24188232421875, 423.7179260253906]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 23.0, 26.0, 43.0, 74.0, 169.0, 471.0, 1103.0, 3701.0, 15559.0, 94453.0, 2428740.0, 1562501.0, 69442.0, 12641.0, 3359.0, 1059.0, 421.0, 198.0, 87.0, 80.0, 33.0, 25.0, 14.0, 6.0, 6.0, 4.0, 3.0, 9.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-76.25, -74.29150390625, -72.3330078125, -70.37451171875, -68.416015625, -66.45751953125, -64.4990234375, -62.54052734375, -60.58203125, -58.62353515625, -56.6650390625, -54.70654296875, -52.748046875, -50.78955078125, -48.8310546875, -46.87255859375, -44.9140625, -42.95556640625, -40.9970703125, -39.03857421875, -37.080078125, -35.12158203125, -33.1630859375, -31.20458984375, -29.24609375, -27.28759765625, -25.3291015625, -23.37060546875, -21.412109375, -19.45361328125, -17.4951171875, -15.53662109375, -13.578125, -11.61962890625, -9.6611328125, -7.70263671875, -5.744140625, -3.78564453125, -1.8271484375, 0.13134765625, 2.08984375, 4.04833984375, 6.0068359375, 7.96533203125, 9.923828125, 11.88232421875, 13.8408203125, 15.79931640625, 17.7578125, 19.71630859375, 21.6748046875, 23.63330078125, 25.591796875, 27.55029296875, 29.5087890625, 31.46728515625, 33.42578125, 35.38427734375, 37.3427734375, 39.30126953125, 41.259765625, 43.21826171875, 45.1767578125, 47.13525390625, 49.09375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 7.0, 8.0, 11.0, 18.0, 17.0, 23.0, 25.0, 41.0, 40.0, 40.0, 32.0, 51.0, 52.0, 59.0, 60.0, 79.0, 56.0, 50.0, 54.0, 32.0, 46.0, 30.0, 33.0, 29.0, 21.0, 19.0, 14.0, 18.0, 10.0, 10.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-25.171875, -24.4755859375, -23.779296875, -23.0830078125, -22.38671875, -21.6904296875, -20.994140625, -20.2978515625, -19.6015625, -18.9052734375, -18.208984375, -17.5126953125, -16.81640625, -16.1201171875, -15.423828125, -14.7275390625, -14.03125, -13.3349609375, -12.638671875, -11.9423828125, -11.24609375, -10.5498046875, -9.853515625, -9.1572265625, -8.4609375, -7.7646484375, -7.068359375, -6.3720703125, -5.67578125, -4.9794921875, -4.283203125, -3.5869140625, -2.890625, -2.1943359375, -1.498046875, -0.8017578125, -0.10546875, 0.5908203125, 1.287109375, 1.9833984375, 2.6796875, 3.3759765625, 4.072265625, 4.7685546875, 5.46484375, 6.1611328125, 6.857421875, 7.5537109375, 8.25, 8.9462890625, 9.642578125, 10.3388671875, 11.03515625, 11.7314453125, 12.427734375, 13.1240234375, 13.8203125, 14.5166015625, 15.212890625, 15.9091796875, 16.60546875, 17.3017578125, 17.998046875, 18.6943359375, 19.390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 7.0, 10.0, 10.0, 17.0, 30.0, 36.0, 52.0, 63.0, 92.0, 128.0, 273.0, 455.0, 757.0, 1362.0, 2660.0, 5688.0, 12934.0, 33723.0, 105147.0, 583510.0, 2863722.0, 440730.0, 91615.0, 29529.0, 11505.0, 4946.0, 2303.0, 1190.0, 678.0, 368.0, 212.0, 157.0, 85.0, 76.0, 47.0, 43.0, 22.0, 21.0, 19.0, 9.0, 10.0, 6.0, 6.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.4375, -35.19970703125, -33.9619140625, -32.72412109375, -31.486328125, -30.24853515625, -29.0107421875, -27.77294921875, -26.53515625, -25.29736328125, -24.0595703125, -22.82177734375, -21.583984375, -20.34619140625, -19.1083984375, -17.87060546875, -16.6328125, -15.39501953125, -14.1572265625, -12.91943359375, -11.681640625, -10.44384765625, -9.2060546875, -7.96826171875, -6.73046875, -5.49267578125, -4.2548828125, -3.01708984375, -1.779296875, -0.54150390625, 0.6962890625, 1.93408203125, 3.171875, 4.40966796875, 5.6474609375, 6.88525390625, 8.123046875, 9.36083984375, 10.5986328125, 11.83642578125, 13.07421875, 14.31201171875, 15.5498046875, 16.78759765625, 18.025390625, 19.26318359375, 20.5009765625, 21.73876953125, 22.9765625, 24.21435546875, 25.4521484375, 26.68994140625, 27.927734375, 29.16552734375, 30.4033203125, 31.64111328125, 32.87890625, 34.11669921875, 35.3544921875, 36.59228515625, 37.830078125, 39.06787109375, 40.3056640625, 41.54345703125, 42.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 2.0, 5.0, 4.0, 6.0, 10.0, 11.0, 14.0, 19.0, 34.0, 31.0, 54.0, 62.0, 116.0, 179.0, 291.0, 665.0, 802.0, 699.0, 364.0, 231.0, 150.0, 91.0, 69.0, 44.0, 31.0, 26.0, 14.0, 12.0, 9.0, 9.0, 6.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.65625, -57.71533203125, -55.7744140625, -53.83349609375, -51.892578125, -49.95166015625, -48.0107421875, -46.06982421875, -44.12890625, -42.18798828125, -40.2470703125, -38.30615234375, -36.365234375, -34.42431640625, -32.4833984375, -30.54248046875, -28.6015625, -26.66064453125, -24.7197265625, -22.77880859375, -20.837890625, -18.89697265625, -16.9560546875, -15.01513671875, -13.07421875, -11.13330078125, -9.1923828125, -7.25146484375, -5.310546875, -3.36962890625, -1.4287109375, 0.51220703125, 2.453125, 4.39404296875, 6.3349609375, 8.27587890625, 10.216796875, 12.15771484375, 14.0986328125, 16.03955078125, 17.98046875, 19.92138671875, 21.8623046875, 23.80322265625, 25.744140625, 27.68505859375, 29.6259765625, 31.56689453125, 33.5078125, 35.44873046875, 37.3896484375, 39.33056640625, 41.271484375, 43.21240234375, 45.1533203125, 47.09423828125, 49.03515625, 50.97607421875, 52.9169921875, 54.85791015625, 56.798828125, 58.73974609375, 60.6806640625, 62.62158203125, 64.5625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 12.0, 43.0, 81.0, 210.0, 323.0, 200.0, 69.0, 26.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-433.897216796875, -401.48358154296875, -369.0699462890625, -336.65631103515625, -304.24267578125, -271.82904052734375, -239.41543579101562, -207.00180053710938, -174.58816528320312, -142.17453002929688, -109.76090240478516, -77.34727478027344, -44.93363952636719, -12.520004272460938, 19.89361572265625, 52.3072509765625, 84.72088623046875, 117.134521484375, 149.54815673828125, 181.96177673339844, 214.3754119873047, 246.78904724121094, 279.2026672363281, 311.6163024902344, 344.0299377441406, 376.4435729980469, 408.8572082519531, 441.27081298828125, 473.6844482421875, 506.09808349609375, 538.51171875, 570.9253540039062, 603.3389892578125, 635.7526245117188, 668.166259765625, 700.5798950195312, 732.9935302734375, 765.4071655273438, 797.82080078125, 830.234375, 862.6480712890625, 895.0617065429688, 927.475341796875, 959.8889770507812, 992.3026123046875, 1024.7161865234375, 1057.1298828125, 1089.54345703125, 1121.95703125, 1154.37060546875, 1186.7843017578125, 1219.1978759765625, 1251.611572265625, 1284.025146484375, 1316.4388427734375, 1348.8524169921875, 1381.26611328125, 1413.6796875, 1446.0933837890625, 1478.5069580078125, 1510.920654296875, 1543.334228515625, 1575.7479248046875, 1608.1614990234375, 1640.5751953125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 4.0, 5.0, 4.0, 5.0, 7.0, 7.0, 12.0, 8.0, 7.0, 16.0, 13.0, 21.0, 25.0, 21.0, 25.0, 35.0, 36.0, 37.0, 45.0, 45.0, 47.0, 35.0, 46.0, 52.0, 40.0, 43.0, 37.0, 47.0, 35.0, 41.0, 31.0, 21.0, 24.0, 21.0, 15.0, 15.0, 13.0, 19.0, 9.0, 9.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-301.70928955078125, -293.31610107421875, -284.9228820800781, -276.5296630859375, -268.136474609375, -259.7432861328125, -251.35006713867188, -242.9568634033203, -234.56365966796875, -226.1704559326172, -217.77725219726562, -209.38404846191406, -200.9908447265625, -192.59764099121094, -184.20443725585938, -175.8112335205078, -167.41802978515625, -159.0248260498047, -150.63162231445312, -142.23841857910156, -133.84521484375, -125.45201110839844, -117.05880737304688, -108.66560363769531, -100.27239990234375, -91.87919616699219, -83.48599243164062, -75.09278869628906, -66.6995849609375, -58.30638122558594, -49.913177490234375, -41.51997375488281, -33.12678527832031, -24.73358154296875, -16.340377807617188, -7.947174072265625, 0.4460296630859375, 8.8392333984375, 17.232437133789062, 25.625640869140625, 34.01884460449219, 42.41204833984375, 50.80525207519531, 59.198455810546875, 67.59165954589844, 75.98486328125, 84.37806701660156, 92.77127075195312, 101.16447448730469, 109.55767822265625, 117.95088195800781, 126.34408569335938, 134.73728942871094, 143.1304931640625, 151.52369689941406, 159.91690063476562, 168.3101043701172, 176.70330810546875, 185.0965118408203, 193.48971557617188, 201.88291931152344, 210.276123046875, 218.66932678222656, 227.06253051757812, 235.4557342529297]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 12.0, 6.0, 27.0, 39.0, 53.0, 102.0, 205.0, 518.0, 1687.0, 6403.0, 29905.0, 168116.0, 585459.0, 208659.0, 36712.0, 7495.0, 2001.0, 643.0, 234.0, 133.0, 50.0, 31.0, 20.0, 14.0, 10.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.1875, -102.310546875, -99.43359375, -96.556640625, -93.6796875, -90.802734375, -87.92578125, -85.048828125, -82.171875, -79.294921875, -76.41796875, -73.541015625, -70.6640625, -67.787109375, -64.91015625, -62.033203125, -59.15625, -56.279296875, -53.40234375, -50.525390625, -47.6484375, -44.771484375, -41.89453125, -39.017578125, -36.140625, -33.263671875, -30.38671875, -27.509765625, -24.6328125, -21.755859375, -18.87890625, -16.001953125, -13.125, -10.248046875, -7.37109375, -4.494140625, -1.6171875, 1.259765625, 4.13671875, 7.013671875, 9.890625, 12.767578125, 15.64453125, 18.521484375, 21.3984375, 24.275390625, 27.15234375, 30.029296875, 32.90625, 35.783203125, 38.66015625, 41.537109375, 44.4140625, 47.291015625, 50.16796875, 53.044921875, 55.921875, 58.798828125, 61.67578125, 64.552734375, 67.4296875, 70.306640625, 73.18359375, 76.060546875, 78.9375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 11.0, 8.0, 13.0, 15.0, 20.0, 24.0, 22.0, 39.0, 39.0, 42.0, 31.0, 53.0, 47.0, 50.0, 57.0, 66.0, 53.0, 53.0, 59.0, 40.0, 37.0, 38.0, 37.0, 27.0, 18.0, 25.0, 19.0, 13.0, 4.0, 15.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.90625, -24.20166015625, -23.4970703125, -22.79248046875, -22.087890625, -21.38330078125, -20.6787109375, -19.97412109375, -19.26953125, -18.56494140625, -17.8603515625, -17.15576171875, -16.451171875, -15.74658203125, -15.0419921875, -14.33740234375, -13.6328125, -12.92822265625, -12.2236328125, -11.51904296875, -10.814453125, -10.10986328125, -9.4052734375, -8.70068359375, -7.99609375, -7.29150390625, -6.5869140625, -5.88232421875, -5.177734375, -4.47314453125, -3.7685546875, -3.06396484375, -2.359375, -1.65478515625, -0.9501953125, -0.24560546875, 0.458984375, 1.16357421875, 1.8681640625, 2.57275390625, 3.27734375, 3.98193359375, 4.6865234375, 5.39111328125, 6.095703125, 6.80029296875, 7.5048828125, 8.20947265625, 8.9140625, 9.61865234375, 10.3232421875, 11.02783203125, 11.732421875, 12.43701171875, 13.1416015625, 13.84619140625, 14.55078125, 15.25537109375, 15.9599609375, 16.66455078125, 17.369140625, 18.07373046875, 18.7783203125, 19.48291015625, 20.1875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 10.0, 7.0, 22.0, 26.0, 33.0, 41.0, 51.0, 56.0, 96.0, 162.0, 200.0, 316.0, 411.0, 668.0, 1037.0, 1846.0, 3521.0, 8932.0, 32776.0, 178264.0, 660289.0, 121314.0, 23837.0, 7117.0, 2967.0, 1592.0, 971.0, 589.0, 413.0, 281.0, 181.0, 145.0, 98.0, 81.0, 58.0, 33.0, 20.0, 36.0, 17.0, 11.0, 6.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-95.1875, -92.3369140625, -89.486328125, -86.6357421875, -83.78515625, -80.9345703125, -78.083984375, -75.2333984375, -72.3828125, -69.5322265625, -66.681640625, -63.8310546875, -60.98046875, -58.1298828125, -55.279296875, -52.4287109375, -49.578125, -46.7275390625, -43.876953125, -41.0263671875, -38.17578125, -35.3251953125, -32.474609375, -29.6240234375, -26.7734375, -23.9228515625, -21.072265625, -18.2216796875, -15.37109375, -12.5205078125, -9.669921875, -6.8193359375, -3.96875, -1.1181640625, 1.732421875, 4.5830078125, 7.43359375, 10.2841796875, 13.134765625, 15.9853515625, 18.8359375, 21.6865234375, 24.537109375, 27.3876953125, 30.23828125, 33.0888671875, 35.939453125, 38.7900390625, 41.640625, 44.4912109375, 47.341796875, 50.1923828125, 53.04296875, 55.8935546875, 58.744140625, 61.5947265625, 64.4453125, 67.2958984375, 70.146484375, 72.9970703125, 75.84765625, 78.6982421875, 81.548828125, 84.3994140625, 87.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 9.0, 10.0, 18.0, 6.0, 16.0, 19.0, 23.0, 36.0, 34.0, 35.0, 39.0, 36.0, 55.0, 62.0, 46.0, 50.0, 54.0, 66.0, 40.0, 52.0, 48.0, 36.0, 45.0, 33.0, 23.0, 20.0, 25.0, 6.0, 14.0, 6.0, 12.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-117.0, -113.580078125, -110.16015625, -106.740234375, -103.3203125, -99.900390625, -96.48046875, -93.060546875, -89.640625, -86.220703125, -82.80078125, -79.380859375, -75.9609375, -72.541015625, -69.12109375, -65.701171875, -62.28125, -58.861328125, -55.44140625, -52.021484375, -48.6015625, -45.181640625, -41.76171875, -38.341796875, -34.921875, -31.501953125, -28.08203125, -24.662109375, -21.2421875, -17.822265625, -14.40234375, -10.982421875, -7.5625, -4.142578125, -0.72265625, 2.697265625, 6.1171875, 9.537109375, 12.95703125, 16.376953125, 19.796875, 23.216796875, 26.63671875, 30.056640625, 33.4765625, 36.896484375, 40.31640625, 43.736328125, 47.15625, 50.576171875, 53.99609375, 57.416015625, 60.8359375, 64.255859375, 67.67578125, 71.095703125, 74.515625, 77.935546875, 81.35546875, 84.775390625, 88.1953125, 91.615234375, 95.03515625, 98.455078125, 101.875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 11.0, 9.0, 6.0, 7.0, 10.0, 16.0, 11.0, 18.0, 36.0, 44.0, 48.0, 97.0, 178.0, 354.0, 968.0, 3706.0, 43336.0, 915200.0, 77201.0, 5190.0, 1140.0, 413.0, 170.0, 102.0, 68.0, 61.0, 37.0, 36.0, 9.0, 16.0, 6.0, 11.0, 9.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-59.4375, -57.61328125, -55.7890625, -53.96484375, -52.140625, -50.31640625, -48.4921875, -46.66796875, -44.84375, -43.01953125, -41.1953125, -39.37109375, -37.546875, -35.72265625, -33.8984375, -32.07421875, -30.25, -28.42578125, -26.6015625, -24.77734375, -22.953125, -21.12890625, -19.3046875, -17.48046875, -15.65625, -13.83203125, -12.0078125, -10.18359375, -8.359375, -6.53515625, -4.7109375, -2.88671875, -1.0625, 0.76171875, 2.5859375, 4.41015625, 6.234375, 8.05859375, 9.8828125, 11.70703125, 13.53125, 15.35546875, 17.1796875, 19.00390625, 20.828125, 22.65234375, 24.4765625, 26.30078125, 28.125, 29.94921875, 31.7734375, 33.59765625, 35.421875, 37.24609375, 39.0703125, 40.89453125, 42.71875, 44.54296875, 46.3671875, 48.19140625, 50.015625, 51.83984375, 53.6640625, 55.48828125, 57.3125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 6.0, 3.0, 6.0, 12.0, 12.0, 12.0, 10.0, 16.0, 24.0, 11.0, 33.0, 34.0, 45.0, 50.0, 74.0, 73.0, 82.0, 92.0, 70.0, 58.0, 50.0, 48.0, 33.0, 26.0, 22.0, 15.0, 14.0, 13.0, 14.0, 9.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004913330078125, -0.00474858283996582, -0.004583835601806641, -0.004419088363647461, -0.004254341125488281, -0.0040895938873291016, -0.003924846649169922, -0.003760099411010742, -0.0035953521728515625, -0.003430604934692383, -0.003265857696533203, -0.0031011104583740234, -0.0029363632202148438, -0.002771615982055664, -0.0026068687438964844, -0.0024421215057373047, -0.002277374267578125, -0.0021126270294189453, -0.0019478797912597656, -0.001783132553100586, -0.0016183853149414062, -0.0014536380767822266, -0.0012888908386230469, -0.0011241436004638672, -0.0009593963623046875, -0.0007946491241455078, -0.0006299018859863281, -0.00046515464782714844, -0.00030040740966796875, -0.00013566017150878906, 2.9087066650390625e-05, 0.0001938343048095703, 0.00035858154296875, 0.0005233287811279297, 0.0006880760192871094, 0.0008528232574462891, 0.0010175704956054688, 0.0011823177337646484, 0.0013470649719238281, 0.0015118122100830078, 0.0016765594482421875, 0.0018413066864013672, 0.002006053924560547, 0.0021708011627197266, 0.0023355484008789062, 0.002500295639038086, 0.0026650428771972656, 0.0028297901153564453, 0.002994537353515625, 0.0031592845916748047, 0.0033240318298339844, 0.003488779067993164, 0.0036535263061523438, 0.0038182735443115234, 0.003983020782470703, 0.004147768020629883, 0.0043125152587890625, 0.004477262496948242, 0.004642009735107422, 0.0048067569732666016, 0.004971504211425781, 0.005136251449584961, 0.005300998687744141, 0.00546574592590332, 0.0056304931640625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 11.0, 11.0, 31.0, 34.0, 75.0, 129.0, 252.0, 560.0, 1698.0, 7353.0, 261921.0, 763236.0, 9972.0, 2018.0, 665.0, 267.0, 133.0, 67.0, 42.0, 25.0, 19.0, 10.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.0625, -95.09765625, -92.1328125, -89.16796875, -86.203125, -83.23828125, -80.2734375, -77.30859375, -74.34375, -71.37890625, -68.4140625, -65.44921875, -62.484375, -59.51953125, -56.5546875, -53.58984375, -50.625, -47.66015625, -44.6953125, -41.73046875, -38.765625, -35.80078125, -32.8359375, -29.87109375, -26.90625, -23.94140625, -20.9765625, -18.01171875, -15.046875, -12.08203125, -9.1171875, -6.15234375, -3.1875, -0.22265625, 2.7421875, 5.70703125, 8.671875, 11.63671875, 14.6015625, 17.56640625, 20.53125, 23.49609375, 26.4609375, 29.42578125, 32.390625, 35.35546875, 38.3203125, 41.28515625, 44.25, 47.21484375, 50.1796875, 53.14453125, 56.109375, 59.07421875, 62.0390625, 65.00390625, 67.96875, 70.93359375, 73.8984375, 76.86328125, 79.828125, 82.79296875, 85.7578125, 88.72265625, 91.6875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 10.0, 5.0, 10.0, 13.0, 17.0, 25.0, 25.0, 30.0, 44.0, 54.0, 58.0, 86.0, 93.0, 116.0, 77.0, 76.0, 57.0, 39.0, 40.0, 26.0, 22.0, 27.0, 9.0, 7.0, 7.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.515625, -25.637451171875, -24.75927734375, -23.881103515625, -23.0029296875, -22.124755859375, -21.24658203125, -20.368408203125, -19.490234375, -18.612060546875, -17.73388671875, -16.855712890625, -15.9775390625, -15.099365234375, -14.22119140625, -13.343017578125, -12.46484375, -11.586669921875, -10.70849609375, -9.830322265625, -8.9521484375, -8.073974609375, -7.19580078125, -6.317626953125, -5.439453125, -4.561279296875, -3.68310546875, -2.804931640625, -1.9267578125, -1.048583984375, -0.17041015625, 0.707763671875, 1.5859375, 2.464111328125, 3.34228515625, 4.220458984375, 5.0986328125, 5.976806640625, 6.85498046875, 7.733154296875, 8.611328125, 9.489501953125, 10.36767578125, 11.245849609375, 12.1240234375, 13.002197265625, 13.88037109375, 14.758544921875, 15.63671875, 16.514892578125, 17.39306640625, 18.271240234375, 19.1494140625, 20.027587890625, 20.90576171875, 21.783935546875, 22.662109375, 23.540283203125, 24.41845703125, 25.296630859375, 26.1748046875, 27.052978515625, 27.93115234375, 28.809326171875, 29.6875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 12.0, 19.0, 35.0, 83.0, 147.0, 284.0, 200.0, 121.0, 57.0, 19.0, 7.0, 8.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-978.4988403320312, -950.3035888671875, -922.1082763671875, -893.9130249023438, -865.7177734375, -837.5225219726562, -809.3272705078125, -781.1319580078125, -752.9367065429688, -724.741455078125, -696.546142578125, -668.3508911132812, -640.1556396484375, -611.9603881835938, -583.76513671875, -555.56982421875, -527.3745727539062, -499.1793212890625, -470.9840393066406, -442.78875732421875, -414.593505859375, -386.39825439453125, -358.2029724121094, -330.0076904296875, -301.81243896484375, -273.6171875, -245.42190551757812, -217.2266387939453, -189.0313720703125, -160.8361053466797, -132.64083862304688, -104.44557189941406, -76.25030517578125, -48.05503845214844, -19.859771728515625, 8.335494995117188, 36.53076171875, 64.72602844238281, 92.92129516601562, 121.11656188964844, 149.31182861328125, 177.50709533691406, 205.70236206054688, 233.8976287841797, 262.0928955078125, 290.28814697265625, 318.4834289550781, 346.6787109375, 374.87396240234375, 403.0692138671875, 431.2644958496094, 459.45977783203125, 487.655029296875, 515.8502807617188, 544.0455322265625, 572.2408447265625, 600.4360961914062, 628.63134765625, 656.82666015625, 685.0219116210938, 713.2171630859375, 741.4124145507812, 769.607666015625, 797.802978515625, 825.9982299804688]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 9.0, 8.0, 6.0, 12.0, 13.0, 22.0, 17.0, 24.0, 22.0, 26.0, 32.0, 32.0, 34.0, 43.0, 40.0, 42.0, 57.0, 57.0, 70.0, 56.0, 52.0, 44.0, 38.0, 35.0, 25.0, 29.0, 29.0, 19.0, 21.0, 17.0, 13.0, 17.0, 9.0, 10.0, 4.0, 2.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-329.3806457519531, -318.7096862792969, -308.03875732421875, -297.3677978515625, -286.6968688964844, -276.0259094238281, -265.35498046875, -254.68402099609375, -244.01307678222656, -233.34213256835938, -222.6711883544922, -212.000244140625, -201.32928466796875, -190.65835571289062, -179.98739624023438, -169.3164520263672, -158.6455078125, -147.9745635986328, -137.30361938476562, -126.6326675415039, -115.96172332763672, -105.29077911376953, -94.61982727050781, -83.94888305664062, -73.27793884277344, -62.60699462890625, -51.9360466003418, -41.265098571777344, -30.594154357910156, -19.92321014404297, -9.25225830078125, 1.4186859130859375, 12.08966064453125, 22.76060676574707, 33.43155288696289, 44.102500915527344, 54.77344512939453, 65.44438934326172, 76.11534118652344, 86.78628540039062, 97.45722961425781, 108.128173828125, 118.79911804199219, 129.47006225585938, 140.14102172851562, 150.81195068359375, 161.48291015625, 172.1538543701172, 182.82479858398438, 193.49574279785156, 204.16668701171875, 214.837646484375, 225.50857543945312, 236.17953491210938, 246.85047912597656, 257.52142333984375, 268.1923828125, 278.86334228515625, 289.5342712402344, 300.2052307128906, 310.87615966796875, 321.547119140625, 332.21807861328125, 342.8890075683594, 353.5599365234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 12.0, 26.0, 36.0, 32.0, 58.0, 119.0, 299.0, 1475.0, 17344.0, 3696304.0, 470470.0, 6836.0, 816.0, 220.0, 103.0, 45.0, 34.0, 19.0, 11.0, 9.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-190.375, -186.0322265625, -181.689453125, -177.3466796875, -173.00390625, -168.6611328125, -164.318359375, -159.9755859375, -155.6328125, -151.2900390625, -146.947265625, -142.6044921875, -138.26171875, -133.9189453125, -129.576171875, -125.2333984375, -120.890625, -116.5478515625, -112.205078125, -107.8623046875, -103.51953125, -99.1767578125, -94.833984375, -90.4912109375, -86.1484375, -81.8056640625, -77.462890625, -73.1201171875, -68.77734375, -64.4345703125, -60.091796875, -55.7490234375, -51.40625, -47.0634765625, -42.720703125, -38.3779296875, -34.03515625, -29.6923828125, -25.349609375, -21.0068359375, -16.6640625, -12.3212890625, -7.978515625, -3.6357421875, 0.70703125, 5.0498046875, 9.392578125, 13.7353515625, 18.078125, 22.4208984375, 26.763671875, 31.1064453125, 35.44921875, 39.7919921875, 44.134765625, 48.4775390625, 52.8203125, 57.1630859375, 61.505859375, 65.8486328125, 70.19140625, 74.5341796875, 78.876953125, 83.2197265625, 87.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 10.0, 4.0, 13.0, 10.0, 10.0, 14.0, 20.0, 23.0, 20.0, 23.0, 32.0, 36.0, 40.0, 44.0, 47.0, 42.0, 39.0, 55.0, 55.0, 52.0, 42.0, 39.0, 39.0, 31.0, 39.0, 43.0, 33.0, 19.0, 23.0, 17.0, 11.0, 14.0, 15.0, 8.0, 11.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.53125, -16.9091796875, -16.287109375, -15.6650390625, -15.04296875, -14.4208984375, -13.798828125, -13.1767578125, -12.5546875, -11.9326171875, -11.310546875, -10.6884765625, -10.06640625, -9.4443359375, -8.822265625, -8.2001953125, -7.578125, -6.9560546875, -6.333984375, -5.7119140625, -5.08984375, -4.4677734375, -3.845703125, -3.2236328125, -2.6015625, -1.9794921875, -1.357421875, -0.7353515625, -0.11328125, 0.5087890625, 1.130859375, 1.7529296875, 2.375, 2.9970703125, 3.619140625, 4.2412109375, 4.86328125, 5.4853515625, 6.107421875, 6.7294921875, 7.3515625, 7.9736328125, 8.595703125, 9.2177734375, 9.83984375, 10.4619140625, 11.083984375, 11.7060546875, 12.328125, 12.9501953125, 13.572265625, 14.1943359375, 14.81640625, 15.4384765625, 16.060546875, 16.6826171875, 17.3046875, 17.9267578125, 18.548828125, 19.1708984375, 19.79296875, 20.4150390625, 21.037109375, 21.6591796875, 22.28125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 8.0, 15.0, 28.0, 29.0, 37.0, 71.0, 130.0, 234.0, 457.0, 983.0, 2187.0, 5604.0, 16324.0, 60457.0, 391637.0, 3237476.0, 390994.0, 60612.0, 16744.0, 5904.0, 2301.0, 1032.0, 477.0, 204.0, 120.0, 83.0, 45.0, 24.0, 18.0, 13.0, 9.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.78125, -56.1982421875, -54.615234375, -53.0322265625, -51.44921875, -49.8662109375, -48.283203125, -46.7001953125, -45.1171875, -43.5341796875, -41.951171875, -40.3681640625, -38.78515625, -37.2021484375, -35.619140625, -34.0361328125, -32.453125, -30.8701171875, -29.287109375, -27.7041015625, -26.12109375, -24.5380859375, -22.955078125, -21.3720703125, -19.7890625, -18.2060546875, -16.623046875, -15.0400390625, -13.45703125, -11.8740234375, -10.291015625, -8.7080078125, -7.125, -5.5419921875, -3.958984375, -2.3759765625, -0.79296875, 0.7900390625, 2.373046875, 3.9560546875, 5.5390625, 7.1220703125, 8.705078125, 10.2880859375, 11.87109375, 13.4541015625, 15.037109375, 16.6201171875, 18.203125, 19.7861328125, 21.369140625, 22.9521484375, 24.53515625, 26.1181640625, 27.701171875, 29.2841796875, 30.8671875, 32.4501953125, 34.033203125, 35.6162109375, 37.19921875, 38.7822265625, 40.365234375, 41.9482421875, 43.53125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 9.0, 2.0, 7.0, 7.0, 5.0, 6.0, 15.0, 18.0, 20.0, 29.0, 49.0, 47.0, 74.0, 124.0, 155.0, 275.0, 513.0, 723.0, 711.0, 431.0, 267.0, 167.0, 106.0, 85.0, 62.0, 49.0, 28.0, 21.0, 21.0, 6.0, 13.0, 4.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-55.4375, -53.75927734375, -52.0810546875, -50.40283203125, -48.724609375, -47.04638671875, -45.3681640625, -43.68994140625, -42.01171875, -40.33349609375, -38.6552734375, -36.97705078125, -35.298828125, -33.62060546875, -31.9423828125, -30.26416015625, -28.5859375, -26.90771484375, -25.2294921875, -23.55126953125, -21.873046875, -20.19482421875, -18.5166015625, -16.83837890625, -15.16015625, -13.48193359375, -11.8037109375, -10.12548828125, -8.447265625, -6.76904296875, -5.0908203125, -3.41259765625, -1.734375, -0.05615234375, 1.6220703125, 3.30029296875, 4.978515625, 6.65673828125, 8.3349609375, 10.01318359375, 11.69140625, 13.36962890625, 15.0478515625, 16.72607421875, 18.404296875, 20.08251953125, 21.7607421875, 23.43896484375, 25.1171875, 26.79541015625, 28.4736328125, 30.15185546875, 31.830078125, 33.50830078125, 35.1865234375, 36.86474609375, 38.54296875, 40.22119140625, 41.8994140625, 43.57763671875, 45.255859375, 46.93408203125, 48.6123046875, 50.29052734375, 51.96875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 21.0, 58.0, 200.0, 353.0, 227.0, 87.0, 24.0, 13.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-472.80474853515625, -440.0065002441406, -407.208251953125, -374.40997314453125, -341.6117248535156, -308.8134765625, -276.01519775390625, -243.21694946289062, -210.418701171875, -177.62045288085938, -144.8221893310547, -112.02393341064453, -79.22567749023438, -46.42742919921875, -13.629165649414062, 19.169097900390625, 51.96734619140625, 84.7656021118164, 117.56385803222656, 150.36212158203125, 183.16036987304688, 215.9586181640625, 248.7568817138672, 281.5551452636719, 314.3533935546875, 347.1516418457031, 379.94989013671875, 412.7481689453125, 445.5464172363281, 478.34466552734375, 511.1429443359375, 543.941162109375, 576.739501953125, 609.5377807617188, 642.3359985351562, 675.13427734375, 707.9324951171875, 740.7307739257812, 773.529052734375, 806.3272705078125, 839.1255493164062, 871.923828125, 904.7220458984375, 937.5203247070312, 970.318603515625, 1003.1168212890625, 1035.9150390625, 1068.71337890625, 1101.5115966796875, 1134.309814453125, 1167.108154296875, 1199.9063720703125, 1232.70458984375, 1265.5029296875, 1298.3011474609375, 1331.099365234375, 1363.897705078125, 1396.6959228515625, 1429.4942626953125, 1462.29248046875, 1495.0906982421875, 1527.888916015625, 1560.687255859375, 1593.4854736328125, 1626.28369140625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 6.0, 9.0, 8.0, 6.0, 15.0, 12.0, 26.0, 22.0, 34.0, 34.0, 44.0, 47.0, 38.0, 45.0, 60.0, 55.0, 61.0, 53.0, 45.0, 40.0, 40.0, 50.0, 35.0, 36.0, 25.0, 26.0, 18.0, 21.0, 14.0, 23.0, 12.0, 8.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-293.5535888671875, -284.6994934082031, -275.8453674316406, -266.99127197265625, -258.13714599609375, -249.28305053710938, -240.42893981933594, -231.5748291015625, -222.72071838378906, -213.86660766601562, -205.0124969482422, -196.15838623046875, -187.30429077148438, -178.45016479492188, -169.5960693359375, -160.74195861816406, -151.88784790039062, -143.0337371826172, -134.17962646484375, -125.32552337646484, -116.4714126586914, -107.61730194091797, -98.76319885253906, -89.90908813476562, -81.05497741699219, -72.20086669921875, -63.34675979614258, -54.492652893066406, -45.63854217529297, -36.78443145751953, -27.93032455444336, -19.076217651367188, -10.22210693359375, -1.3679981231689453, 7.486110687255859, 16.340219497680664, 25.19432830810547, 34.048439025878906, 42.90254592895508, 51.75665283203125, 60.61076354980469, 69.46487426757812, 78.31898498535156, 87.17308807373047, 96.0271987915039, 104.88130950927734, 113.73541259765625, 122.58952331542969, 131.44363403320312, 140.29774475097656, 149.15185546875, 158.00596618652344, 166.86007690429688, 175.71417236328125, 184.5682830810547, 193.42239379882812, 202.27650451660156, 211.130615234375, 219.98472595214844, 228.83883666992188, 237.69293212890625, 246.54705810546875, 255.40115356445312, 264.2552490234375, 273.109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 6.0, 6.0, 4.0, 10.0, 12.0, 18.0, 46.0, 65.0, 111.0, 228.0, 569.0, 1439.0, 3877.0, 11746.0, 46374.0, 244964.0, 571273.0, 128750.0, 27087.0, 7492.0, 2625.0, 985.0, 436.0, 179.0, 97.0, 46.0, 26.0, 18.0, 17.0, 12.0, 7.0, 6.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.53125, -61.02197265625, -58.5126953125, -56.00341796875, -53.494140625, -50.98486328125, -48.4755859375, -45.96630859375, -43.45703125, -40.94775390625, -38.4384765625, -35.92919921875, -33.419921875, -30.91064453125, -28.4013671875, -25.89208984375, -23.3828125, -20.87353515625, -18.3642578125, -15.85498046875, -13.345703125, -10.83642578125, -8.3271484375, -5.81787109375, -3.30859375, -0.79931640625, 1.7099609375, 4.21923828125, 6.728515625, 9.23779296875, 11.7470703125, 14.25634765625, 16.765625, 19.27490234375, 21.7841796875, 24.29345703125, 26.802734375, 29.31201171875, 31.8212890625, 34.33056640625, 36.83984375, 39.34912109375, 41.8583984375, 44.36767578125, 46.876953125, 49.38623046875, 51.8955078125, 54.40478515625, 56.9140625, 59.42333984375, 61.9326171875, 64.44189453125, 66.951171875, 69.46044921875, 71.9697265625, 74.47900390625, 76.98828125, 79.49755859375, 82.0068359375, 84.51611328125, 87.025390625, 89.53466796875, 92.0439453125, 94.55322265625, 97.0625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 4.0, 0.0, 6.0, 10.0, 11.0, 7.0, 14.0, 11.0, 15.0, 26.0, 20.0, 22.0, 18.0, 34.0, 19.0, 34.0, 28.0, 29.0, 38.0, 26.0, 43.0, 51.0, 44.0, 39.0, 56.0, 33.0, 30.0, 46.0, 38.0, 27.0, 29.0, 25.0, 19.0, 22.0, 15.0, 21.0, 13.0, 11.0, 10.0, 6.0, 7.0, 6.0, 8.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-19.09375, -18.533447265625, -17.97314453125, -17.412841796875, -16.8525390625, -16.292236328125, -15.73193359375, -15.171630859375, -14.611328125, -14.051025390625, -13.49072265625, -12.930419921875, -12.3701171875, -11.809814453125, -11.24951171875, -10.689208984375, -10.12890625, -9.568603515625, -9.00830078125, -8.447998046875, -7.8876953125, -7.327392578125, -6.76708984375, -6.206787109375, -5.646484375, -5.086181640625, -4.52587890625, -3.965576171875, -3.4052734375, -2.844970703125, -2.28466796875, -1.724365234375, -1.1640625, -0.603759765625, -0.04345703125, 0.516845703125, 1.0771484375, 1.637451171875, 2.19775390625, 2.758056640625, 3.318359375, 3.878662109375, 4.43896484375, 4.999267578125, 5.5595703125, 6.119873046875, 6.68017578125, 7.240478515625, 7.80078125, 8.361083984375, 8.92138671875, 9.481689453125, 10.0419921875, 10.602294921875, 11.16259765625, 11.722900390625, 12.283203125, 12.843505859375, 13.40380859375, 13.964111328125, 14.5244140625, 15.084716796875, 15.64501953125, 16.205322265625, 16.765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 9.0, 12.0, 19.0, 13.0, 23.0, 39.0, 56.0, 67.0, 99.0, 177.0, 289.0, 485.0, 1012.0, 2283.0, 7096.0, 40197.0, 732853.0, 235179.0, 20318.0, 4595.0, 1739.0, 815.0, 413.0, 285.0, 156.0, 98.0, 58.0, 40.0, 31.0, 30.0, 12.0, 10.0, 14.0, 5.0, 4.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-138.5, -134.1484375, -129.796875, -125.4453125, -121.09375, -116.7421875, -112.390625, -108.0390625, -103.6875, -99.3359375, -94.984375, -90.6328125, -86.28125, -81.9296875, -77.578125, -73.2265625, -68.875, -64.5234375, -60.171875, -55.8203125, -51.46875, -47.1171875, -42.765625, -38.4140625, -34.0625, -29.7109375, -25.359375, -21.0078125, -16.65625, -12.3046875, -7.953125, -3.6015625, 0.75, 5.1015625, 9.453125, 13.8046875, 18.15625, 22.5078125, 26.859375, 31.2109375, 35.5625, 39.9140625, 44.265625, 48.6171875, 52.96875, 57.3203125, 61.671875, 66.0234375, 70.375, 74.7265625, 79.078125, 83.4296875, 87.78125, 92.1328125, 96.484375, 100.8359375, 105.1875, 109.5390625, 113.890625, 118.2421875, 122.59375, 126.9453125, 131.296875, 135.6484375, 140.0]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 4.0, 13.0, 16.0, 9.0, 19.0, 22.0, 28.0, 44.0, 49.0, 38.0, 61.0, 68.0, 61.0, 73.0, 77.0, 61.0, 59.0, 55.0, 39.0, 42.0, 31.0, 27.0, 25.0, 10.0, 16.0, 7.0, 9.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.1875, -123.5283203125, -119.869140625, -116.2099609375, -112.55078125, -108.8916015625, -105.232421875, -101.5732421875, -97.9140625, -94.2548828125, -90.595703125, -86.9365234375, -83.27734375, -79.6181640625, -75.958984375, -72.2998046875, -68.640625, -64.9814453125, -61.322265625, -57.6630859375, -54.00390625, -50.3447265625, -46.685546875, -43.0263671875, -39.3671875, -35.7080078125, -32.048828125, -28.3896484375, -24.73046875, -21.0712890625, -17.412109375, -13.7529296875, -10.09375, -6.4345703125, -2.775390625, 0.8837890625, 4.54296875, 8.2021484375, 11.861328125, 15.5205078125, 19.1796875, 22.8388671875, 26.498046875, 30.1572265625, 33.81640625, 37.4755859375, 41.134765625, 44.7939453125, 48.453125, 52.1123046875, 55.771484375, 59.4306640625, 63.08984375, 66.7490234375, 70.408203125, 74.0673828125, 77.7265625, 81.3857421875, 85.044921875, 88.7041015625, 92.36328125, 96.0224609375, 99.681640625, 103.3408203125, 107.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 3.0, 10.0, 13.0, 21.0, 23.0, 31.0, 57.0, 85.0, 165.0, 362.0, 826.0, 2579.0, 12858.0, 257563.0, 746038.0, 22305.0, 3641.0, 1106.0, 399.0, 161.0, 98.0, 56.0, 29.0, 27.0, 14.0, 18.0, 7.0, 5.0, 10.0, 4.0, 5.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-48.59375, -47.0810546875, -45.568359375, -44.0556640625, -42.54296875, -41.0302734375, -39.517578125, -38.0048828125, -36.4921875, -34.9794921875, -33.466796875, -31.9541015625, -30.44140625, -28.9287109375, -27.416015625, -25.9033203125, -24.390625, -22.8779296875, -21.365234375, -19.8525390625, -18.33984375, -16.8271484375, -15.314453125, -13.8017578125, -12.2890625, -10.7763671875, -9.263671875, -7.7509765625, -6.23828125, -4.7255859375, -3.212890625, -1.7001953125, -0.1875, 1.3251953125, 2.837890625, 4.3505859375, 5.86328125, 7.3759765625, 8.888671875, 10.4013671875, 11.9140625, 13.4267578125, 14.939453125, 16.4521484375, 17.96484375, 19.4775390625, 20.990234375, 22.5029296875, 24.015625, 25.5283203125, 27.041015625, 28.5537109375, 30.06640625, 31.5791015625, 33.091796875, 34.6044921875, 36.1171875, 37.6298828125, 39.142578125, 40.6552734375, 42.16796875, 43.6806640625, 45.193359375, 46.7060546875, 48.21875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 4.0, 10.0, 14.0, 17.0, 25.0, 31.0, 30.0, 36.0, 71.0, 86.0, 142.0, 131.0, 138.0, 68.0, 43.0, 32.0, 26.0, 22.0, 9.0, 15.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00748443603515625, -0.007258474826812744, -0.007032513618469238, -0.006806552410125732, -0.0065805912017822266, -0.006354629993438721, -0.006128668785095215, -0.005902707576751709, -0.005676746368408203, -0.005450785160064697, -0.005224823951721191, -0.0049988627433776855, -0.00477290153503418, -0.004546940326690674, -0.004320979118347168, -0.004095017910003662, -0.0038690567016601562, -0.0036430954933166504, -0.0034171342849731445, -0.0031911730766296387, -0.002965211868286133, -0.002739250659942627, -0.002513289451599121, -0.0022873282432556152, -0.0020613670349121094, -0.0018354058265686035, -0.0016094446182250977, -0.0013834834098815918, -0.001157522201538086, -0.0009315609931945801, -0.0007055997848510742, -0.00047963857650756836, -0.0002536773681640625, -2.771615982055664e-05, 0.00019824504852294922, 0.0004242062568664551, 0.0006501674652099609, 0.0008761286735534668, 0.0011020898818969727, 0.0013280510902404785, 0.0015540122985839844, 0.0017799735069274902, 0.002005934715270996, 0.002231895923614502, 0.002457857131958008, 0.0026838183403015137, 0.0029097795486450195, 0.0031357407569885254, 0.0033617019653320312, 0.003587663173675537, 0.003813624382019043, 0.004039585590362549, 0.004265546798706055, 0.0044915080070495605, 0.004717469215393066, 0.004943430423736572, 0.005169391632080078, 0.005395352840423584, 0.00562131404876709, 0.005847275257110596, 0.0060732364654541016, 0.006299197673797607, 0.006525158882141113, 0.006751120090484619, 0.006977081298828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 6.0, 6.0, 9.0, 11.0, 14.0, 33.0, 26.0, 57.0, 81.0, 99.0, 177.0, 311.0, 599.0, 1257.0, 3324.0, 11923.0, 107438.0, 833029.0, 74622.0, 10103.0, 2986.0, 1108.0, 550.0, 269.0, 157.0, 100.0, 83.0, 50.0, 32.0, 21.0, 17.0, 13.0, 6.0, 14.0, 8.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.21875, -30.158203125, -29.09765625, -28.037109375, -26.9765625, -25.916015625, -24.85546875, -23.794921875, -22.734375, -21.673828125, -20.61328125, -19.552734375, -18.4921875, -17.431640625, -16.37109375, -15.310546875, -14.25, -13.189453125, -12.12890625, -11.068359375, -10.0078125, -8.947265625, -7.88671875, -6.826171875, -5.765625, -4.705078125, -3.64453125, -2.583984375, -1.5234375, -0.462890625, 0.59765625, 1.658203125, 2.71875, 3.779296875, 4.83984375, 5.900390625, 6.9609375, 8.021484375, 9.08203125, 10.142578125, 11.203125, 12.263671875, 13.32421875, 14.384765625, 15.4453125, 16.505859375, 17.56640625, 18.626953125, 19.6875, 20.748046875, 21.80859375, 22.869140625, 23.9296875, 24.990234375, 26.05078125, 27.111328125, 28.171875, 29.232421875, 30.29296875, 31.353515625, 32.4140625, 33.474609375, 34.53515625, 35.595703125, 36.65625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 4.0, 9.0, 13.0, 9.0, 24.0, 25.0, 29.0, 48.0, 62.0, 78.0, 78.0, 94.0, 103.0, 92.0, 70.0, 71.0, 39.0, 30.0, 26.0, 22.0, 16.0, 11.0, 8.0, 1.0, 10.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.500244140625, -20.67236328125, -19.844482421875, -19.0166015625, -18.188720703125, -17.36083984375, -16.532958984375, -15.705078125, -14.877197265625, -14.04931640625, -13.221435546875, -12.3935546875, -11.565673828125, -10.73779296875, -9.909912109375, -9.08203125, -8.254150390625, -7.42626953125, -6.598388671875, -5.7705078125, -4.942626953125, -4.11474609375, -3.286865234375, -2.458984375, -1.631103515625, -0.80322265625, 0.024658203125, 0.8525390625, 1.680419921875, 2.50830078125, 3.336181640625, 4.1640625, 4.991943359375, 5.81982421875, 6.647705078125, 7.4755859375, 8.303466796875, 9.13134765625, 9.959228515625, 10.787109375, 11.614990234375, 12.44287109375, 13.270751953125, 14.0986328125, 14.926513671875, 15.75439453125, 16.582275390625, 17.41015625, 18.238037109375, 19.06591796875, 19.893798828125, 20.7216796875, 21.549560546875, 22.37744140625, 23.205322265625, 24.033203125, 24.861083984375, 25.68896484375, 26.516845703125, 27.3447265625, 28.172607421875, 29.00048828125, 29.828369140625, 30.65625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 10.0, 26.0, 39.0, 143.0, 365.0, 275.0, 89.0, 22.0, 13.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-742.5076904296875, -706.910400390625, -671.3131103515625, -635.7158203125, -600.1185302734375, -564.521240234375, -528.9239501953125, -493.32666015625, -457.7293701171875, -422.132080078125, -386.5347900390625, -350.9375, -315.3402099609375, -279.742919921875, -244.1456298828125, -208.54833984375, -172.9510498046875, -137.353759765625, -101.7564697265625, -66.1591796875, -30.5618896484375, 5.035400390625, 40.6326904296875, 76.22998046875, 111.8272705078125, 147.424560546875, 183.0218505859375, 218.619140625, 254.2164306640625, 289.813720703125, 325.4110107421875, 361.00830078125, 396.605712890625, 432.2030029296875, 467.80029296875, 503.3975830078125, 538.994873046875, 574.5921630859375, 610.189453125, 645.7867431640625, 681.384033203125, 716.9813232421875, 752.57861328125, 788.1759033203125, 823.773193359375, 859.3704833984375, 894.9677734375, 930.5650634765625, 966.162353515625, 1001.7596435546875, 1037.35693359375, 1072.9542236328125, 1108.551513671875, 1144.1488037109375, 1179.74609375, 1215.3433837890625, 1250.940673828125, 1286.5379638671875, 1322.13525390625, 1357.7325439453125, 1393.329833984375, 1428.9271240234375, 1464.5244140625, 1500.1217041015625, 1535.718994140625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 9.0, 8.0, 10.0, 12.0, 11.0, 11.0, 16.0, 25.0, 24.0, 20.0, 24.0, 27.0, 26.0, 42.0, 37.0, 49.0, 60.0, 69.0, 64.0, 59.0, 53.0, 39.0, 44.0, 22.0, 24.0, 34.0, 20.0, 20.0, 29.0, 16.0, 18.0, 12.0, 16.0, 11.0, 4.0, 3.0, 5.0, 9.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-374.6380615234375, -363.3945007324219, -352.1509094238281, -340.9073486328125, -329.66375732421875, -318.4201965332031, -307.1766357421875, -295.93304443359375, -284.689453125, -273.4458923339844, -262.2023010253906, -250.958740234375, -239.71514892578125, -228.47158813476562, -217.22801208496094, -205.98443603515625, -194.74087524414062, -183.49729919433594, -172.25372314453125, -161.01016235351562, -149.76657104492188, -138.52301025390625, -127.27943420410156, -116.03585815429688, -104.79228210449219, -93.5487060546875, -82.30513000488281, -71.06156158447266, -59.81798553466797, -48.57440948486328, -37.330841064453125, -26.087265014648438, -14.84368896484375, -3.6001148223876953, 7.643459320068359, 18.88703155517578, 30.13060760498047, 41.374183654785156, 52.61775207519531, 63.861328125, 75.10490417480469, 86.34848022460938, 97.59205627441406, 108.83562469482422, 120.0792007446289, 131.32278442382812, 142.56634521484375, 153.80992126464844, 165.05349731445312, 176.2970733642578, 187.5406494140625, 198.78421020507812, 210.02780151367188, 221.2713623046875, 232.5149383544922, 243.75851440429688, 255.00209045410156, 266.24566650390625, 277.4892272949219, 288.7328186035156, 299.97637939453125, 311.219970703125, 322.4635314941406, 333.70709228515625, 344.95068359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 9.0, 2.0, 18.0, 25.0, 32.0, 35.0, 66.0, 116.0, 151.0, 235.0, 458.0, 999.0, 2493.0, 8428.0, 47529.0, 2387911.0, 1697011.0, 37312.0, 7227.0, 2228.0, 911.0, 435.0, 272.0, 137.0, 75.0, 45.0, 38.0, 25.0, 19.0, 13.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.84375, -49.76611328125, -47.6884765625, -45.61083984375, -43.533203125, -41.45556640625, -39.3779296875, -37.30029296875, -35.22265625, -33.14501953125, -31.0673828125, -28.98974609375, -26.912109375, -24.83447265625, -22.7568359375, -20.67919921875, -18.6015625, -16.52392578125, -14.4462890625, -12.36865234375, -10.291015625, -8.21337890625, -6.1357421875, -4.05810546875, -1.98046875, 0.09716796875, 2.1748046875, 4.25244140625, 6.330078125, 8.40771484375, 10.4853515625, 12.56298828125, 14.640625, 16.71826171875, 18.7958984375, 20.87353515625, 22.951171875, 25.02880859375, 27.1064453125, 29.18408203125, 31.26171875, 33.33935546875, 35.4169921875, 37.49462890625, 39.572265625, 41.64990234375, 43.7275390625, 45.80517578125, 47.8828125, 49.96044921875, 52.0380859375, 54.11572265625, 56.193359375, 58.27099609375, 60.3486328125, 62.42626953125, 64.50390625, 66.58154296875, 68.6591796875, 70.73681640625, 72.814453125, 74.89208984375, 76.9697265625, 79.04736328125, 81.125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 13.0, 10.0, 13.0, 11.0, 13.0, 22.0, 17.0, 26.0, 17.0, 28.0, 23.0, 31.0, 35.0, 34.0, 34.0, 35.0, 39.0, 39.0, 49.0, 42.0, 44.0, 34.0, 37.0, 34.0, 26.0, 34.0, 32.0, 36.0, 25.0, 24.0, 21.0, 19.0, 18.0, 14.0, 13.0, 7.0, 9.0, 12.0, 5.0, 2.0, 5.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-17.46875, -16.925537109375, -16.38232421875, -15.839111328125, -15.2958984375, -14.752685546875, -14.20947265625, -13.666259765625, -13.123046875, -12.579833984375, -12.03662109375, -11.493408203125, -10.9501953125, -10.406982421875, -9.86376953125, -9.320556640625, -8.77734375, -8.234130859375, -7.69091796875, -7.147705078125, -6.6044921875, -6.061279296875, -5.51806640625, -4.974853515625, -4.431640625, -3.888427734375, -3.34521484375, -2.802001953125, -2.2587890625, -1.715576171875, -1.17236328125, -0.629150390625, -0.0859375, 0.457275390625, 1.00048828125, 1.543701171875, 2.0869140625, 2.630126953125, 3.17333984375, 3.716552734375, 4.259765625, 4.802978515625, 5.34619140625, 5.889404296875, 6.4326171875, 6.975830078125, 7.51904296875, 8.062255859375, 8.60546875, 9.148681640625, 9.69189453125, 10.235107421875, 10.7783203125, 11.321533203125, 11.86474609375, 12.407958984375, 12.951171875, 13.494384765625, 14.03759765625, 14.580810546875, 15.1240234375, 15.667236328125, 16.21044921875, 16.753662109375, 17.296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 6.0, 7.0, 5.0, 12.0, 12.0, 22.0, 28.0, 44.0, 82.0, 141.0, 285.0, 506.0, 1157.0, 2915.0, 9518.0, 51201.0, 1931068.0, 2130171.0, 53247.0, 9217.0, 2550.0, 1021.0, 473.0, 252.0, 134.0, 79.0, 45.0, 32.0, 17.0, 7.0, 4.0, 5.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.875, -69.3974609375, -66.919921875, -64.4423828125, -61.96484375, -59.4873046875, -57.009765625, -54.5322265625, -52.0546875, -49.5771484375, -47.099609375, -44.6220703125, -42.14453125, -39.6669921875, -37.189453125, -34.7119140625, -32.234375, -29.7568359375, -27.279296875, -24.8017578125, -22.32421875, -19.8466796875, -17.369140625, -14.8916015625, -12.4140625, -9.9365234375, -7.458984375, -4.9814453125, -2.50390625, -0.0263671875, 2.451171875, 4.9287109375, 7.40625, 9.8837890625, 12.361328125, 14.8388671875, 17.31640625, 19.7939453125, 22.271484375, 24.7490234375, 27.2265625, 29.7041015625, 32.181640625, 34.6591796875, 37.13671875, 39.6142578125, 42.091796875, 44.5693359375, 47.046875, 49.5244140625, 52.001953125, 54.4794921875, 56.95703125, 59.4345703125, 61.912109375, 64.3896484375, 66.8671875, 69.3447265625, 71.822265625, 74.2998046875, 76.77734375, 79.2548828125, 81.732421875, 84.2099609375, 86.6875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 8.0, 10.0, 23.0, 28.0, 40.0, 61.0, 90.0, 183.0, 478.0, 1004.0, 1034.0, 560.0, 222.0, 98.0, 77.0, 40.0, 29.0, 23.0, 12.0, 15.0, 7.0, 1.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.625, -67.234375, -64.84375, -62.453125, -60.0625, -57.671875, -55.28125, -52.890625, -50.5, -48.109375, -45.71875, -43.328125, -40.9375, -38.546875, -36.15625, -33.765625, -31.375, -28.984375, -26.59375, -24.203125, -21.8125, -19.421875, -17.03125, -14.640625, -12.25, -9.859375, -7.46875, -5.078125, -2.6875, -0.296875, 2.09375, 4.484375, 6.875, 9.265625, 11.65625, 14.046875, 16.4375, 18.828125, 21.21875, 23.609375, 26.0, 28.390625, 30.78125, 33.171875, 35.5625, 37.953125, 40.34375, 42.734375, 45.125, 47.515625, 49.90625, 52.296875, 54.6875, 57.078125, 59.46875, 61.859375, 64.25, 66.640625, 69.03125, 71.421875, 73.8125, 76.203125, 78.59375, 80.984375, 83.375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 16.0, 17.0, 47.0, 126.0, 241.0, 261.0, 159.0, 58.0, 27.0, 9.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-789.8038330078125, -768.443115234375, -747.0823364257812, -725.7216186523438, -704.3609008789062, -683.0001831054688, -661.639404296875, -640.2786865234375, -618.91796875, -597.5572509765625, -576.1964721679688, -554.8357543945312, -533.4750366210938, -512.1143188476562, -490.7535400390625, -469.392822265625, -448.0320739746094, -426.67132568359375, -405.31060791015625, -383.9498596191406, -362.5891418457031, -341.2283935546875, -319.86767578125, -298.5069274902344, -277.14617919921875, -255.7854461669922, -234.42471313476562, -213.06396484375, -191.7032470703125, -170.34249877929688, -148.9817657470703, -127.62103271484375, -106.26031494140625, -84.89958190917969, -63.53884506225586, -42.17810821533203, -20.81737518310547, 0.5433578491210938, 21.904098510742188, 43.26483154296875, 64.62556457519531, 85.98629760742188, 107.34703063964844, 128.707763671875, 150.06851196289062, 171.42922973632812, 192.78997802734375, 214.1507110595703, 235.51144409179688, 256.8721923828125, 278.23291015625, 299.5936584472656, 320.9543762207031, 342.31512451171875, 363.67584228515625, 385.0365905761719, 406.3973388671875, 427.7580871582031, 449.1188049316406, 470.47955322265625, 491.84027099609375, 513.2009887695312, 534.561767578125, 555.9224853515625, 577.283203125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 14.0, 5.0, 11.0, 19.0, 19.0, 19.0, 39.0, 40.0, 48.0, 57.0, 62.0, 60.0, 81.0, 78.0, 55.0, 55.0, 57.0, 51.0, 51.0, 40.0, 33.0, 20.0, 19.0, 13.0, 13.0, 11.0, 7.0, 0.0, 5.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-317.19891357421875, -307.2953796386719, -297.391845703125, -287.4883117675781, -277.58477783203125, -267.6812438964844, -257.7777099609375, -247.87417602539062, -237.97064208984375, -228.06710815429688, -218.16357421875, -208.26004028320312, -198.35650634765625, -188.45297241210938, -178.5494384765625, -168.64590454101562, -158.74237060546875, -148.83883666992188, -138.935302734375, -129.03176879882812, -119.12823486328125, -109.22470092773438, -99.3211669921875, -89.41763305664062, -79.51409912109375, -69.61056518554688, -59.70703125, -49.803497314453125, -39.89996337890625, -29.996429443359375, -20.0928955078125, -10.189361572265625, -0.28582763671875, 9.617706298828125, 19.521240234375, 29.424774169921875, 39.32830810546875, 49.231842041015625, 59.1353759765625, 69.03890991210938, 78.94244384765625, 88.84597778320312, 98.74951171875, 108.65304565429688, 118.55657958984375, 128.46011352539062, 138.3636474609375, 148.26718139648438, 158.17071533203125, 168.07424926757812, 177.977783203125, 187.88131713867188, 197.78485107421875, 207.68838500976562, 217.5919189453125, 227.49545288085938, 237.39898681640625, 247.30252075195312, 257.2060546875, 267.1095886230469, 277.01312255859375, 286.9166564941406, 296.8201904296875, 306.7237243652344, 316.62725830078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 4.0, 4.0, 8.0, 12.0, 14.0, 22.0, 40.0, 44.0, 54.0, 147.0, 232.0, 402.0, 717.0, 1352.0, 2640.0, 5650.0, 12704.0, 31656.0, 84645.0, 223082.0, 351675.0, 205395.0, 76783.0, 28995.0, 11693.0, 5147.0, 2560.0, 1228.0, 672.0, 383.0, 225.0, 132.0, 87.0, 55.0, 31.0, 31.0, 13.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.5625, -24.51708984375, -23.4716796875, -22.42626953125, -21.380859375, -20.33544921875, -19.2900390625, -18.24462890625, -17.19921875, -16.15380859375, -15.1083984375, -14.06298828125, -13.017578125, -11.97216796875, -10.9267578125, -9.88134765625, -8.8359375, -7.79052734375, -6.7451171875, -5.69970703125, -4.654296875, -3.60888671875, -2.5634765625, -1.51806640625, -0.47265625, 0.57275390625, 1.6181640625, 2.66357421875, 3.708984375, 4.75439453125, 5.7998046875, 6.84521484375, 7.890625, 8.93603515625, 9.9814453125, 11.02685546875, 12.072265625, 13.11767578125, 14.1630859375, 15.20849609375, 16.25390625, 17.29931640625, 18.3447265625, 19.39013671875, 20.435546875, 21.48095703125, 22.5263671875, 23.57177734375, 24.6171875, 25.66259765625, 26.7080078125, 27.75341796875, 28.798828125, 29.84423828125, 30.8896484375, 31.93505859375, 32.98046875, 34.02587890625, 35.0712890625, 36.11669921875, 37.162109375, 38.20751953125, 39.2529296875, 40.29833984375, 41.34375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 7.0, 7.0, 7.0, 8.0, 10.0, 14.0, 7.0, 13.0, 13.0, 16.0, 19.0, 22.0, 33.0, 27.0, 31.0, 40.0, 34.0, 35.0, 38.0, 33.0, 28.0, 47.0, 46.0, 38.0, 38.0, 55.0, 33.0, 34.0, 34.0, 28.0, 28.0, 23.0, 21.0, 18.0, 19.0, 17.0, 11.0, 14.0, 12.0, 10.0, 5.0, 7.0, 5.0, 3.0, 3.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0], "bins": [-20.0, -19.427734375, -18.85546875, -18.283203125, -17.7109375, -17.138671875, -16.56640625, -15.994140625, -15.421875, -14.849609375, -14.27734375, -13.705078125, -13.1328125, -12.560546875, -11.98828125, -11.416015625, -10.84375, -10.271484375, -9.69921875, -9.126953125, -8.5546875, -7.982421875, -7.41015625, -6.837890625, -6.265625, -5.693359375, -5.12109375, -4.548828125, -3.9765625, -3.404296875, -2.83203125, -2.259765625, -1.6875, -1.115234375, -0.54296875, 0.029296875, 0.6015625, 1.173828125, 1.74609375, 2.318359375, 2.890625, 3.462890625, 4.03515625, 4.607421875, 5.1796875, 5.751953125, 6.32421875, 6.896484375, 7.46875, 8.041015625, 8.61328125, 9.185546875, 9.7578125, 10.330078125, 10.90234375, 11.474609375, 12.046875, 12.619140625, 13.19140625, 13.763671875, 14.3359375, 14.908203125, 15.48046875, 16.052734375, 16.625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 8.0, 10.0, 15.0, 28.0, 32.0, 45.0, 88.0, 122.0, 245.0, 474.0, 1111.0, 2751.0, 8605.0, 38384.0, 283995.0, 626165.0, 66977.0, 12929.0, 3788.0, 1459.0, 657.0, 280.0, 145.0, 84.0, 41.0, 29.0, 27.0, 16.0, 11.0, 10.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.78125, -60.62744140625, -58.4736328125, -56.31982421875, -54.166015625, -52.01220703125, -49.8583984375, -47.70458984375, -45.55078125, -43.39697265625, -41.2431640625, -39.08935546875, -36.935546875, -34.78173828125, -32.6279296875, -30.47412109375, -28.3203125, -26.16650390625, -24.0126953125, -21.85888671875, -19.705078125, -17.55126953125, -15.3974609375, -13.24365234375, -11.08984375, -8.93603515625, -6.7822265625, -4.62841796875, -2.474609375, -0.32080078125, 1.8330078125, 3.98681640625, 6.140625, 8.29443359375, 10.4482421875, 12.60205078125, 14.755859375, 16.90966796875, 19.0634765625, 21.21728515625, 23.37109375, 25.52490234375, 27.6787109375, 29.83251953125, 31.986328125, 34.14013671875, 36.2939453125, 38.44775390625, 40.6015625, 42.75537109375, 44.9091796875, 47.06298828125, 49.216796875, 51.37060546875, 53.5244140625, 55.67822265625, 57.83203125, 59.98583984375, 62.1396484375, 64.29345703125, 66.447265625, 68.60107421875, 70.7548828125, 72.90869140625, 75.0625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 2.0, 6.0, 19.0, 22.0, 23.0, 18.0, 28.0, 39.0, 34.0, 53.0, 47.0, 62.0, 71.0, 82.0, 75.0, 62.0, 59.0, 58.0, 54.0, 27.0, 36.0, 24.0, 23.0, 17.0, 13.0, 13.0, 11.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.9375, -101.7265625, -98.515625, -95.3046875, -92.09375, -88.8828125, -85.671875, -82.4609375, -79.25, -76.0390625, -72.828125, -69.6171875, -66.40625, -63.1953125, -59.984375, -56.7734375, -53.5625, -50.3515625, -47.140625, -43.9296875, -40.71875, -37.5078125, -34.296875, -31.0859375, -27.875, -24.6640625, -21.453125, -18.2421875, -15.03125, -11.8203125, -8.609375, -5.3984375, -2.1875, 1.0234375, 4.234375, 7.4453125, 10.65625, 13.8671875, 17.078125, 20.2890625, 23.5, 26.7109375, 29.921875, 33.1328125, 36.34375, 39.5546875, 42.765625, 45.9765625, 49.1875, 52.3984375, 55.609375, 58.8203125, 62.03125, 65.2421875, 68.453125, 71.6640625, 74.875, 78.0859375, 81.296875, 84.5078125, 87.71875, 90.9296875, 94.140625, 97.3515625, 100.5625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 2.0, 1.0, 10.0, 12.0, 24.0, 24.0, 34.0, 47.0, 79.0, 129.0, 221.0, 424.0, 842.0, 1859.0, 4467.0, 13687.0, 55007.0, 307289.0, 564560.0, 73267.0, 17015.0, 5253.0, 2192.0, 967.0, 478.0, 225.0, 140.0, 105.0, 63.0, 31.0, 31.0, 18.0, 7.0, 11.0, 7.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.765625, -16.226318359375, -15.68701171875, -15.147705078125, -14.6083984375, -14.069091796875, -13.52978515625, -12.990478515625, -12.451171875, -11.911865234375, -11.37255859375, -10.833251953125, -10.2939453125, -9.754638671875, -9.21533203125, -8.676025390625, -8.13671875, -7.597412109375, -7.05810546875, -6.518798828125, -5.9794921875, -5.440185546875, -4.90087890625, -4.361572265625, -3.822265625, -3.282958984375, -2.74365234375, -2.204345703125, -1.6650390625, -1.125732421875, -0.58642578125, -0.047119140625, 0.4921875, 1.031494140625, 1.57080078125, 2.110107421875, 2.6494140625, 3.188720703125, 3.72802734375, 4.267333984375, 4.806640625, 5.345947265625, 5.88525390625, 6.424560546875, 6.9638671875, 7.503173828125, 8.04248046875, 8.581787109375, 9.12109375, 9.660400390625, 10.19970703125, 10.739013671875, 11.2783203125, 11.817626953125, 12.35693359375, 12.896240234375, 13.435546875, 13.974853515625, 14.51416015625, 15.053466796875, 15.5927734375, 16.132080078125, 16.67138671875, 17.210693359375, 17.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 7.0, 5.0, 7.0, 11.0, 18.0, 31.0, 30.0, 67.0, 76.0, 95.0, 99.0, 147.0, 116.0, 89.0, 60.0, 41.0, 36.0, 16.0, 12.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00527191162109375, -0.005102992057800293, -0.004934072494506836, -0.004765152931213379, -0.004596233367919922, -0.004427313804626465, -0.004258394241333008, -0.004089474678039551, -0.003920555114746094, -0.0037516355514526367, -0.0035827159881591797, -0.0034137964248657227, -0.0032448768615722656, -0.0030759572982788086, -0.0029070377349853516, -0.0027381181716918945, -0.0025691986083984375, -0.0024002790451049805, -0.0022313594818115234, -0.0020624399185180664, -0.0018935203552246094, -0.0017246007919311523, -0.0015556812286376953, -0.0013867616653442383, -0.0012178421020507812, -0.0010489225387573242, -0.0008800029754638672, -0.0007110834121704102, -0.0005421638488769531, -0.0003732442855834961, -0.00020432472229003906, -3.540515899658203e-05, 0.000133514404296875, 0.00030243396759033203, 0.00047135353088378906, 0.0006402730941772461, 0.0008091926574707031, 0.0009781122207641602, 0.0011470317840576172, 0.0013159513473510742, 0.0014848709106445312, 0.0016537904739379883, 0.0018227100372314453, 0.0019916296005249023, 0.0021605491638183594, 0.0023294687271118164, 0.0024983882904052734, 0.0026673078536987305, 0.0028362274169921875, 0.0030051469802856445, 0.0031740665435791016, 0.0033429861068725586, 0.0035119056701660156, 0.0036808252334594727, 0.0038497447967529297, 0.004018664360046387, 0.004187583923339844, 0.004356503486633301, 0.004525423049926758, 0.004694342613220215, 0.004863262176513672, 0.005032181739807129, 0.005201101303100586, 0.005370020866394043, 0.0055389404296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 11.0, 13.0, 19.0, 20.0, 38.0, 63.0, 95.0, 133.0, 263.0, 526.0, 1161.0, 2984.0, 9561.0, 44456.0, 321187.0, 589623.0, 60321.0, 11847.0, 3443.0, 1416.0, 655.0, 288.0, 174.0, 97.0, 55.0, 32.0, 23.0, 18.0, 11.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.09375, -20.436279296875, -19.77880859375, -19.121337890625, -18.4638671875, -17.806396484375, -17.14892578125, -16.491455078125, -15.833984375, -15.176513671875, -14.51904296875, -13.861572265625, -13.2041015625, -12.546630859375, -11.88916015625, -11.231689453125, -10.57421875, -9.916748046875, -9.25927734375, -8.601806640625, -7.9443359375, -7.286865234375, -6.62939453125, -5.971923828125, -5.314453125, -4.656982421875, -3.99951171875, -3.342041015625, -2.6845703125, -2.027099609375, -1.36962890625, -0.712158203125, -0.0546875, 0.602783203125, 1.26025390625, 1.917724609375, 2.5751953125, 3.232666015625, 3.89013671875, 4.547607421875, 5.205078125, 5.862548828125, 6.52001953125, 7.177490234375, 7.8349609375, 8.492431640625, 9.14990234375, 9.807373046875, 10.46484375, 11.122314453125, 11.77978515625, 12.437255859375, 13.0947265625, 13.752197265625, 14.40966796875, 15.067138671875, 15.724609375, 16.382080078125, 17.03955078125, 17.697021484375, 18.3544921875, 19.011962890625, 19.66943359375, 20.326904296875, 20.984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 12.0, 19.0, 25.0, 33.0, 42.0, 73.0, 89.0, 102.0, 108.0, 114.0, 94.0, 63.0, 53.0, 42.0, 29.0, 28.0, 11.0, 18.0, 7.0, 7.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -17.277099609375, -16.55419921875, -15.831298828125, -15.1083984375, -14.385498046875, -13.66259765625, -12.939697265625, -12.216796875, -11.493896484375, -10.77099609375, -10.048095703125, -9.3251953125, -8.602294921875, -7.87939453125, -7.156494140625, -6.43359375, -5.710693359375, -4.98779296875, -4.264892578125, -3.5419921875, -2.819091796875, -2.09619140625, -1.373291015625, -0.650390625, 0.072509765625, 0.79541015625, 1.518310546875, 2.2412109375, 2.964111328125, 3.68701171875, 4.409912109375, 5.1328125, 5.855712890625, 6.57861328125, 7.301513671875, 8.0244140625, 8.747314453125, 9.47021484375, 10.193115234375, 10.916015625, 11.638916015625, 12.36181640625, 13.084716796875, 13.8076171875, 14.530517578125, 15.25341796875, 15.976318359375, 16.69921875, 17.422119140625, 18.14501953125, 18.867919921875, 19.5908203125, 20.313720703125, 21.03662109375, 21.759521484375, 22.482421875, 23.205322265625, 23.92822265625, 24.651123046875, 25.3740234375, 26.096923828125, 26.81982421875, 27.542724609375, 28.265625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 13.0, 18.0, 58.0, 209.0, 464.0, 170.0, 45.0, 14.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1135.611083984375, -1105.9742431640625, -1076.3372802734375, -1046.700439453125, -1017.0634765625, -987.4266357421875, -957.7897338867188, -928.15283203125, -898.5159301757812, -868.8790283203125, -839.2421264648438, -809.605224609375, -779.9683837890625, -750.3314208984375, -720.694580078125, -691.0576782226562, -661.4207763671875, -631.7838745117188, -602.14697265625, -572.5100708007812, -542.8731689453125, -513.236328125, -483.59942626953125, -453.9625244140625, -424.32562255859375, -394.688720703125, -365.05181884765625, -335.4149475097656, -305.7780456542969, -276.1411437988281, -246.50425720214844, -216.86737060546875, -187.23046875, -157.59356689453125, -127.95668029785156, -98.31978607177734, -68.68289184570312, -39.045989990234375, -9.409103393554688, 20.227783203125, 49.86468505859375, 79.50157928466797, 109.13847351074219, 138.77536010742188, 168.41226196289062, 198.04916381835938, 227.68605041503906, 257.32293701171875, 286.9598388671875, 316.59674072265625, 346.233642578125, 375.8705139160156, 405.5074157714844, 435.1443176269531, 464.78118896484375, 494.4180908203125, 524.0549926757812, 553.69189453125, 583.3287963867188, 612.9656982421875, 642.6025390625, 672.239501953125, 701.8763427734375, 731.5132446289062, 761.150146484375]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 9.0, 19.0, 11.0, 13.0, 13.0, 16.0, 18.0, 23.0, 29.0, 26.0, 33.0, 40.0, 40.0, 50.0, 64.0, 63.0, 65.0, 52.0, 57.0, 36.0, 40.0, 29.0, 33.0, 23.0, 28.0, 26.0, 17.0, 16.0, 12.0, 15.0, 13.0, 7.0, 11.0, 6.0, 10.0, 6.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-331.1248779296875, -322.1282958984375, -313.1317138671875, -304.1351623535156, -295.1385803222656, -286.1419982910156, -277.14544677734375, -268.14886474609375, -259.15228271484375, -250.15570068359375, -241.1591339111328, -232.16256713867188, -223.16598510742188, -214.16940307617188, -205.17283630371094, -196.17626953125, -187.1796875, -178.18310546875, -169.18653869628906, -160.18997192382812, -151.19338989257812, -142.19680786132812, -133.2002410888672, -124.20366668701172, -115.20709228515625, -106.21051788330078, -97.21394348144531, -88.21736907958984, -79.22079467773438, -70.2242202758789, -61.22764587402344, -52.23107147216797, -43.2344970703125, -34.23792266845703, -25.241348266601562, -16.244773864746094, -7.248199462890625, 1.7483749389648438, 10.744949340820312, 19.74152374267578, 28.73809814453125, 37.73467254638672, 46.73124694824219, 55.727821350097656, 64.72439575195312, 73.7209701538086, 82.71754455566406, 91.71411895751953, 100.710693359375, 109.70726776123047, 118.70384216308594, 127.7004165649414, 136.69699096679688, 145.69357299804688, 154.6901397705078, 163.68670654296875, 172.68328857421875, 181.67987060546875, 190.6764373779297, 199.67300415039062, 208.66958618164062, 217.66616821289062, 226.66273498535156, 235.6593017578125, 244.6558837890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 5.0, 14.0, 13.0, 18.0, 15.0, 16.0, 47.0, 62.0, 115.0, 210.0, 362.0, 713.0, 1651.0, 4895.0, 21015.0, 338934.0, 3430574.0, 364740.0, 22576.0, 5099.0, 1674.0, 706.0, 347.0, 160.0, 96.0, 80.0, 46.0, 27.0, 18.0, 11.0, 7.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-48.8125, -47.31103515625, -45.8095703125, -44.30810546875, -42.806640625, -41.30517578125, -39.8037109375, -38.30224609375, -36.80078125, -35.29931640625, -33.7978515625, -32.29638671875, -30.794921875, -29.29345703125, -27.7919921875, -26.29052734375, -24.7890625, -23.28759765625, -21.7861328125, -20.28466796875, -18.783203125, -17.28173828125, -15.7802734375, -14.27880859375, -12.77734375, -11.27587890625, -9.7744140625, -8.27294921875, -6.771484375, -5.27001953125, -3.7685546875, -2.26708984375, -0.765625, 0.73583984375, 2.2373046875, 3.73876953125, 5.240234375, 6.74169921875, 8.2431640625, 9.74462890625, 11.24609375, 12.74755859375, 14.2490234375, 15.75048828125, 17.251953125, 18.75341796875, 20.2548828125, 21.75634765625, 23.2578125, 24.75927734375, 26.2607421875, 27.76220703125, 29.263671875, 30.76513671875, 32.2666015625, 33.76806640625, 35.26953125, 36.77099609375, 38.2724609375, 39.77392578125, 41.275390625, 42.77685546875, 44.2783203125, 45.77978515625, 47.28125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 10.0, 9.0, 17.0, 8.0, 19.0, 18.0, 21.0, 30.0, 24.0, 33.0, 34.0, 37.0, 43.0, 44.0, 42.0, 55.0, 51.0, 41.0, 52.0, 38.0, 43.0, 43.0, 37.0, 39.0, 29.0, 23.0, 20.0, 12.0, 21.0, 18.0, 11.0, 15.0, 11.0, 10.0, 5.0, 5.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-21.609375, -21.002685546875, -20.39599609375, -19.789306640625, -19.1826171875, -18.575927734375, -17.96923828125, -17.362548828125, -16.755859375, -16.149169921875, -15.54248046875, -14.935791015625, -14.3291015625, -13.722412109375, -13.11572265625, -12.509033203125, -11.90234375, -11.295654296875, -10.68896484375, -10.082275390625, -9.4755859375, -8.868896484375, -8.26220703125, -7.655517578125, -7.048828125, -6.442138671875, -5.83544921875, -5.228759765625, -4.6220703125, -4.015380859375, -3.40869140625, -2.802001953125, -2.1953125, -1.588623046875, -0.98193359375, -0.375244140625, 0.2314453125, 0.838134765625, 1.44482421875, 2.051513671875, 2.658203125, 3.264892578125, 3.87158203125, 4.478271484375, 5.0849609375, 5.691650390625, 6.29833984375, 6.905029296875, 7.51171875, 8.118408203125, 8.72509765625, 9.331787109375, 9.9384765625, 10.545166015625, 11.15185546875, 11.758544921875, 12.365234375, 12.971923828125, 13.57861328125, 14.185302734375, 14.7919921875, 15.398681640625, 16.00537109375, 16.612060546875, 17.21875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 12.0, 22.0, 36.0, 36.0, 66.0, 165.0, 376.0, 992.0, 3671.0, 22665.0, 1471148.0, 2661548.0, 27546.0, 4134.0, 1124.0, 345.0, 176.0, 66.0, 51.0, 29.0, 12.0, 14.0, 7.0, 3.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.5, -90.48828125, -87.4765625, -84.46484375, -81.453125, -78.44140625, -75.4296875, -72.41796875, -69.40625, -66.39453125, -63.3828125, -60.37109375, -57.359375, -54.34765625, -51.3359375, -48.32421875, -45.3125, -42.30078125, -39.2890625, -36.27734375, -33.265625, -30.25390625, -27.2421875, -24.23046875, -21.21875, -18.20703125, -15.1953125, -12.18359375, -9.171875, -6.16015625, -3.1484375, -0.13671875, 2.875, 5.88671875, 8.8984375, 11.91015625, 14.921875, 17.93359375, 20.9453125, 23.95703125, 26.96875, 29.98046875, 32.9921875, 36.00390625, 39.015625, 42.02734375, 45.0390625, 48.05078125, 51.0625, 54.07421875, 57.0859375, 60.09765625, 63.109375, 66.12109375, 69.1328125, 72.14453125, 75.15625, 78.16796875, 81.1796875, 84.19140625, 87.203125, 90.21484375, 93.2265625, 96.23828125, 99.25]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 8.0, 10.0, 20.0, 20.0, 41.0, 72.0, 100.0, 221.0, 511.0, 1024.0, 986.0, 561.0, 211.0, 104.0, 51.0, 45.0, 17.0, 11.0, 10.0, 7.0, 8.0, 9.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-87.875, -85.62255859375, -83.3701171875, -81.11767578125, -78.865234375, -76.61279296875, -74.3603515625, -72.10791015625, -69.85546875, -67.60302734375, -65.3505859375, -63.09814453125, -60.845703125, -58.59326171875, -56.3408203125, -54.08837890625, -51.8359375, -49.58349609375, -47.3310546875, -45.07861328125, -42.826171875, -40.57373046875, -38.3212890625, -36.06884765625, -33.81640625, -31.56396484375, -29.3115234375, -27.05908203125, -24.806640625, -22.55419921875, -20.3017578125, -18.04931640625, -15.796875, -13.54443359375, -11.2919921875, -9.03955078125, -6.787109375, -4.53466796875, -2.2822265625, -0.02978515625, 2.22265625, 4.47509765625, 6.7275390625, 8.97998046875, 11.232421875, 13.48486328125, 15.7373046875, 17.98974609375, 20.2421875, 22.49462890625, 24.7470703125, 26.99951171875, 29.251953125, 31.50439453125, 33.7568359375, 36.00927734375, 38.26171875, 40.51416015625, 42.7666015625, 45.01904296875, 47.271484375, 49.52392578125, 51.7763671875, 54.02880859375, 56.28125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 23.0, 57.0, 149.0, 312.0, 234.0, 122.0, 48.0, 22.0, 12.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-877.1295166015625, -855.1187744140625, -833.1080322265625, -811.0972900390625, -789.0865478515625, -767.0758666992188, -745.0651245117188, -723.0543823242188, -701.0436401367188, -679.0328979492188, -657.0221557617188, -635.0114135742188, -613.000732421875, -590.989990234375, -568.979248046875, -546.968505859375, -524.957763671875, -502.947021484375, -480.936279296875, -458.9255676269531, -436.9148254394531, -414.9040832519531, -392.89337158203125, -370.88262939453125, -348.87188720703125, -326.86114501953125, -304.85040283203125, -282.8396911621094, -260.8289489746094, -238.81820678710938, -216.80747985839844, -194.7967529296875, -172.7860107421875, -150.7752685546875, -128.76454162597656, -106.7538070678711, -84.74307250976562, -62.732337951660156, -40.72160339355469, -18.71087646484375, 3.29986572265625, 25.31060028076172, 47.32133483886719, 69.33206939697266, 91.34280395507812, 113.3535385131836, 135.36427307128906, 157.375, 179.3857421875, 201.396484375, 223.40721130371094, 245.41793823242188, 267.4286804199219, 289.4394226074219, 311.45013427734375, 333.46087646484375, 355.47161865234375, 377.48236083984375, 399.49310302734375, 421.5038146972656, 443.5145568847656, 465.5252990722656, 487.5360107421875, 509.5467529296875, 531.5574951171875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 1.0, 7.0, 3.0, 12.0, 14.0, 12.0, 12.0, 29.0, 31.0, 28.0, 36.0, 38.0, 45.0, 43.0, 53.0, 51.0, 53.0, 61.0, 51.0, 60.0, 48.0, 35.0, 45.0, 35.0, 28.0, 28.0, 25.0, 18.0, 22.0, 8.0, 15.0, 15.0, 8.0, 5.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-238.19119262695312, -229.75479125976562, -221.31837463378906, -212.8819580078125, -204.445556640625, -196.0091552734375, -187.57273864746094, -179.13632202148438, -170.69992065429688, -162.26351928710938, -153.8271026611328, -145.39068603515625, -136.95428466796875, -128.51788330078125, -120.08146667480469, -111.64505767822266, -103.20864868164062, -94.7722396850586, -86.33583068847656, -77.89942169189453, -69.4630126953125, -61.02660369873047, -52.59019470214844, -44.153785705566406, -35.717376708984375, -27.280967712402344, -18.844558715820312, -10.408149719238281, -1.97174072265625, 6.464668273925781, 14.901077270507812, 23.337486267089844, 31.773895263671875, 40.210304260253906, 48.64671325683594, 57.08312225341797, 65.51953125, 73.95594024658203, 82.39234924316406, 90.8287582397461, 99.26516723632812, 107.70157623291016, 116.13798522949219, 124.57439422607422, 133.01080322265625, 141.44720458984375, 149.8836212158203, 158.32003784179688, 166.75643920898438, 175.19284057617188, 183.62925720214844, 192.065673828125, 200.5020751953125, 208.9384765625, 217.37489318847656, 225.81130981445312, 234.24771118164062, 242.68411254882812, 251.1205291748047, 259.55694580078125, 267.99334716796875, 276.42974853515625, 284.86614990234375, 293.3025817871094, 301.7389831542969]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 8.0, 11.0, 13.0, 27.0, 38.0, 61.0, 115.0, 187.0, 328.0, 625.0, 1085.0, 2090.0, 4489.0, 10411.0, 25269.0, 67704.0, 193627.0, 383143.0, 227872.0, 79756.0, 29504.0, 11946.0, 5156.0, 2387.0, 1166.0, 640.0, 356.0, 213.0, 115.0, 83.0, 57.0, 25.0, 12.0, 14.0, 10.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.40625, -37.38427734375, -36.3623046875, -35.34033203125, -34.318359375, -33.29638671875, -32.2744140625, -31.25244140625, -30.23046875, -29.20849609375, -28.1865234375, -27.16455078125, -26.142578125, -25.12060546875, -24.0986328125, -23.07666015625, -22.0546875, -21.03271484375, -20.0107421875, -18.98876953125, -17.966796875, -16.94482421875, -15.9228515625, -14.90087890625, -13.87890625, -12.85693359375, -11.8349609375, -10.81298828125, -9.791015625, -8.76904296875, -7.7470703125, -6.72509765625, -5.703125, -4.68115234375, -3.6591796875, -2.63720703125, -1.615234375, -0.59326171875, 0.4287109375, 1.45068359375, 2.47265625, 3.49462890625, 4.5166015625, 5.53857421875, 6.560546875, 7.58251953125, 8.6044921875, 9.62646484375, 10.6484375, 11.67041015625, 12.6923828125, 13.71435546875, 14.736328125, 15.75830078125, 16.7802734375, 17.80224609375, 18.82421875, 19.84619140625, 20.8681640625, 21.89013671875, 22.912109375, 23.93408203125, 24.9560546875, 25.97802734375, 27.0]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 1.0, 4.0, 6.0, 11.0, 9.0, 12.0, 8.0, 25.0, 16.0, 13.0, 28.0, 23.0, 31.0, 26.0, 33.0, 33.0, 35.0, 41.0, 47.0, 53.0, 36.0, 32.0, 44.0, 33.0, 34.0, 39.0, 38.0, 30.0, 34.0, 27.0, 29.0, 23.0, 26.0, 16.0, 14.0, 16.0, 10.0, 14.0, 6.0, 11.0, 5.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.6533203125, -18.072265625, -17.4912109375, -16.91015625, -16.3291015625, -15.748046875, -15.1669921875, -14.5859375, -14.0048828125, -13.423828125, -12.8427734375, -12.26171875, -11.6806640625, -11.099609375, -10.5185546875, -9.9375, -9.3564453125, -8.775390625, -8.1943359375, -7.61328125, -7.0322265625, -6.451171875, -5.8701171875, -5.2890625, -4.7080078125, -4.126953125, -3.5458984375, -2.96484375, -2.3837890625, -1.802734375, -1.2216796875, -0.640625, -0.0595703125, 0.521484375, 1.1025390625, 1.68359375, 2.2646484375, 2.845703125, 3.4267578125, 4.0078125, 4.5888671875, 5.169921875, 5.7509765625, 6.33203125, 6.9130859375, 7.494140625, 8.0751953125, 8.65625, 9.2373046875, 9.818359375, 10.3994140625, 10.98046875, 11.5615234375, 12.142578125, 12.7236328125, 13.3046875, 13.8857421875, 14.466796875, 15.0478515625, 15.62890625, 16.2099609375, 16.791015625, 17.3720703125, 17.953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 6.0, 5.0, 8.0, 13.0, 28.0, 44.0, 73.0, 133.0, 250.0, 587.0, 1708.0, 8662.0, 108895.0, 871550.0, 49018.0, 5382.0, 1264.0, 476.0, 200.0, 108.0, 50.0, 29.0, 16.0, 20.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.1875, -96.7763671875, -93.365234375, -89.9541015625, -86.54296875, -83.1318359375, -79.720703125, -76.3095703125, -72.8984375, -69.4873046875, -66.076171875, -62.6650390625, -59.25390625, -55.8427734375, -52.431640625, -49.0205078125, -45.609375, -42.1982421875, -38.787109375, -35.3759765625, -31.96484375, -28.5537109375, -25.142578125, -21.7314453125, -18.3203125, -14.9091796875, -11.498046875, -8.0869140625, -4.67578125, -1.2646484375, 2.146484375, 5.5576171875, 8.96875, 12.3798828125, 15.791015625, 19.2021484375, 22.61328125, 26.0244140625, 29.435546875, 32.8466796875, 36.2578125, 39.6689453125, 43.080078125, 46.4912109375, 49.90234375, 53.3134765625, 56.724609375, 60.1357421875, 63.546875, 66.9580078125, 70.369140625, 73.7802734375, 77.19140625, 80.6025390625, 84.013671875, 87.4248046875, 90.8359375, 94.2470703125, 97.658203125, 101.0693359375, 104.48046875, 107.8916015625, 111.302734375, 114.7138671875, 118.125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 2.0, 7.0, 6.0, 11.0, 9.0, 17.0, 14.0, 20.0, 17.0, 19.0, 27.0, 29.0, 24.0, 28.0, 40.0, 47.0, 58.0, 60.0, 61.0, 53.0, 62.0, 56.0, 56.0, 32.0, 48.0, 39.0, 23.0, 25.0, 15.0, 12.0, 14.0, 12.0, 12.0, 12.0, 9.0, 8.0, 4.0, 8.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.25, -65.7080078125, -63.166015625, -60.6240234375, -58.08203125, -55.5400390625, -52.998046875, -50.4560546875, -47.9140625, -45.3720703125, -42.830078125, -40.2880859375, -37.74609375, -35.2041015625, -32.662109375, -30.1201171875, -27.578125, -25.0361328125, -22.494140625, -19.9521484375, -17.41015625, -14.8681640625, -12.326171875, -9.7841796875, -7.2421875, -4.7001953125, -2.158203125, 0.3837890625, 2.92578125, 5.4677734375, 8.009765625, 10.5517578125, 13.09375, 15.6357421875, 18.177734375, 20.7197265625, 23.26171875, 25.8037109375, 28.345703125, 30.8876953125, 33.4296875, 35.9716796875, 38.513671875, 41.0556640625, 43.59765625, 46.1396484375, 48.681640625, 51.2236328125, 53.765625, 56.3076171875, 58.849609375, 61.3916015625, 63.93359375, 66.4755859375, 69.017578125, 71.5595703125, 74.1015625, 76.6435546875, 79.185546875, 81.7275390625, 84.26953125, 86.8115234375, 89.353515625, 91.8955078125, 94.4375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 10.0, 9.0, 20.0, 24.0, 54.0, 77.0, 156.0, 284.0, 551.0, 1178.0, 2848.0, 8314.0, 31542.0, 236327.0, 694184.0, 53925.0, 12105.0, 4000.0, 1503.0, 658.0, 346.0, 166.0, 108.0, 57.0, 32.0, 22.0, 15.0, 11.0, 7.0, 5.0, 7.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.640625, -21.0582275390625, -20.475830078125, -19.8934326171875, -19.31103515625, -18.7286376953125, -18.146240234375, -17.5638427734375, -16.9814453125, -16.3990478515625, -15.816650390625, -15.2342529296875, -14.65185546875, -14.0694580078125, -13.487060546875, -12.9046630859375, -12.322265625, -11.7398681640625, -11.157470703125, -10.5750732421875, -9.99267578125, -9.4102783203125, -8.827880859375, -8.2454833984375, -7.6630859375, -7.0806884765625, -6.498291015625, -5.9158935546875, -5.33349609375, -4.7510986328125, -4.168701171875, -3.5863037109375, -3.00390625, -2.4215087890625, -1.839111328125, -1.2567138671875, -0.67431640625, -0.0919189453125, 0.490478515625, 1.0728759765625, 1.6552734375, 2.2376708984375, 2.820068359375, 3.4024658203125, 3.98486328125, 4.5672607421875, 5.149658203125, 5.7320556640625, 6.314453125, 6.8968505859375, 7.479248046875, 8.0616455078125, 8.64404296875, 9.2264404296875, 9.808837890625, 10.3912353515625, 10.9736328125, 11.5560302734375, 12.138427734375, 12.7208251953125, 13.30322265625, 13.8856201171875, 14.468017578125, 15.0504150390625, 15.6328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 3.0, 10.0, 11.0, 12.0, 18.0, 21.0, 37.0, 49.0, 58.0, 89.0, 142.0, 134.0, 99.0, 79.0, 64.0, 32.0, 29.0, 20.0, 20.0, 9.0, 10.0, 10.0, 7.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003986358642578125, -0.003850281238555908, -0.0037142038345336914, -0.0035781264305114746, -0.003442049026489258, -0.003305971622467041, -0.0031698942184448242, -0.0030338168144226074, -0.0028977394104003906, -0.002761662006378174, -0.002625584602355957, -0.0024895071983337402, -0.0023534297943115234, -0.0022173523902893066, -0.00208127498626709, -0.001945197582244873, -0.0018091201782226562, -0.0016730427742004395, -0.0015369653701782227, -0.0014008879661560059, -0.001264810562133789, -0.0011287331581115723, -0.0009926557540893555, -0.0008565783500671387, -0.0007205009460449219, -0.0005844235420227051, -0.0004483461380004883, -0.0003122687339782715, -0.0001761913299560547, -4.011392593383789e-05, 9.59634780883789e-05, 0.0002320408821105957, 0.0003681182861328125, 0.0005041956901550293, 0.0006402730941772461, 0.0007763504981994629, 0.0009124279022216797, 0.0010485053062438965, 0.0011845827102661133, 0.00132066011428833, 0.0014567375183105469, 0.0015928149223327637, 0.0017288923263549805, 0.0018649697303771973, 0.002001047134399414, 0.002137124538421631, 0.0022732019424438477, 0.0024092793464660645, 0.0025453567504882812, 0.002681434154510498, 0.002817511558532715, 0.0029535889625549316, 0.0030896663665771484, 0.0032257437705993652, 0.003361821174621582, 0.003497898578643799, 0.0036339759826660156, 0.0037700533866882324, 0.0039061307907104492, 0.004042208194732666, 0.004178285598754883, 0.0043143630027771, 0.004450440406799316, 0.004586517810821533, 0.00472259521484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 10.0, 11.0, 18.0, 25.0, 39.0, 63.0, 118.0, 226.0, 520.0, 1243.0, 3651.0, 16319.0, 128189.0, 807510.0, 74795.0, 11073.0, 2801.0, 978.0, 440.0, 193.0, 120.0, 54.0, 40.0, 35.0, 15.0, 16.0, 10.0, 10.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.830078125, -20.14453125, -19.458984375, -18.7734375, -18.087890625, -17.40234375, -16.716796875, -16.03125, -15.345703125, -14.66015625, -13.974609375, -13.2890625, -12.603515625, -11.91796875, -11.232421875, -10.546875, -9.861328125, -9.17578125, -8.490234375, -7.8046875, -7.119140625, -6.43359375, -5.748046875, -5.0625, -4.376953125, -3.69140625, -3.005859375, -2.3203125, -1.634765625, -0.94921875, -0.263671875, 0.421875, 1.107421875, 1.79296875, 2.478515625, 3.1640625, 3.849609375, 4.53515625, 5.220703125, 5.90625, 6.591796875, 7.27734375, 7.962890625, 8.6484375, 9.333984375, 10.01953125, 10.705078125, 11.390625, 12.076171875, 12.76171875, 13.447265625, 14.1328125, 14.818359375, 15.50390625, 16.189453125, 16.875, 17.560546875, 18.24609375, 18.931640625, 19.6171875, 20.302734375, 20.98828125, 21.673828125, 22.359375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 1.0, 4.0, 4.0, 8.0, 7.0, 16.0, 18.0, 18.0, 28.0, 25.0, 34.0, 45.0, 80.0, 94.0, 108.0, 105.0, 96.0, 69.0, 55.0, 43.0, 33.0, 24.0, 14.0, 17.0, 5.0, 10.0, 9.0, 9.0, 8.0, 0.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.265625, -16.76123046875, -16.2568359375, -15.75244140625, -15.248046875, -14.74365234375, -14.2392578125, -13.73486328125, -13.23046875, -12.72607421875, -12.2216796875, -11.71728515625, -11.212890625, -10.70849609375, -10.2041015625, -9.69970703125, -9.1953125, -8.69091796875, -8.1865234375, -7.68212890625, -7.177734375, -6.67333984375, -6.1689453125, -5.66455078125, -5.16015625, -4.65576171875, -4.1513671875, -3.64697265625, -3.142578125, -2.63818359375, -2.1337890625, -1.62939453125, -1.125, -0.62060546875, -0.1162109375, 0.38818359375, 0.892578125, 1.39697265625, 1.9013671875, 2.40576171875, 2.91015625, 3.41455078125, 3.9189453125, 4.42333984375, 4.927734375, 5.43212890625, 5.9365234375, 6.44091796875, 6.9453125, 7.44970703125, 7.9541015625, 8.45849609375, 8.962890625, 9.46728515625, 9.9716796875, 10.47607421875, 10.98046875, 11.48486328125, 11.9892578125, 12.49365234375, 12.998046875, 13.50244140625, 14.0068359375, 14.51123046875, 15.015625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 12.0, 5.0, 5.0, 16.0, 28.0, 39.0, 84.0, 120.0, 260.0, 165.0, 98.0, 62.0, 38.0, 27.0, 16.0, 12.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-469.0545654296875, -457.233642578125, -445.4126892089844, -433.59173583984375, -421.77081298828125, -409.94989013671875, -398.1289367675781, -386.3079833984375, -374.487060546875, -362.6661376953125, -350.8451843261719, -339.02423095703125, -327.20330810546875, -315.38238525390625, -303.5614318847656, -291.740478515625, -279.9195556640625, -268.0986328125, -256.2776794433594, -244.4567413330078, -232.63580322265625, -220.8148651123047, -208.99392700195312, -197.17298889160156, -185.35205078125, -173.53111267089844, -161.71017456054688, -149.8892364501953, -138.06829833984375, -126.24736022949219, -114.42642211914062, -102.60548400878906, -90.7845458984375, -78.96360778808594, -67.14266967773438, -55.32173156738281, -43.50079345703125, -31.679855346679688, -19.858917236328125, -8.037979125976562, 3.782958984375, 15.603897094726562, 27.424835205078125, 39.24577331542969, 51.06671142578125, 62.88764953613281, 74.70858764648438, 86.52952575683594, 98.3504638671875, 110.17140197753906, 121.99234008789062, 133.8132781982422, 145.63421630859375, 157.4551544189453, 169.27609252929688, 181.09703063964844, 192.91796875, 204.73890686035156, 216.55984497070312, 228.3807830810547, 240.20172119140625, 252.0226593017578, 263.8435974121094, 275.66455078125, 287.4854736328125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 10.0, 7.0, 15.0, 8.0, 17.0, 17.0, 18.0, 27.0, 32.0, 22.0, 36.0, 30.0, 39.0, 38.0, 68.0, 100.0, 114.0, 67.0, 41.0, 30.0, 28.0, 28.0, 27.0, 33.0, 13.0, 16.0, 16.0, 15.0, 14.0, 6.0, 7.0, 8.0, 8.0, 3.0, 5.0, 3.0, 9.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-267.234619140625, -257.72015380859375, -248.20567321777344, -238.6912078857422, -229.17672729492188, -219.66226196289062, -210.14779663085938, -200.63333129882812, -191.1188507080078, -181.60438537597656, -172.08990478515625, -162.575439453125, -153.06097412109375, -143.54649353027344, -134.0320281982422, -124.5175552368164, -115.00308227539062, -105.48860931396484, -95.97413635253906, -86.45967102050781, -76.94519805908203, -67.43072509765625, -57.916255950927734, -48.40178680419922, -38.88731384277344, -29.37284278869629, -19.85837173461914, -10.343900680541992, -0.8294296264648438, 8.685043334960938, 18.199512481689453, 27.71398162841797, 37.228485107421875, 46.742958068847656, 56.25742721557617, 65.77189636230469, 75.28636932373047, 84.80084228515625, 94.3153076171875, 103.82978057861328, 113.34425354003906, 122.85872650146484, 132.37319946289062, 141.88766479492188, 151.40213012695312, 160.91661071777344, 170.4310760498047, 179.945556640625, 189.46002197265625, 198.9744873046875, 208.4889678955078, 218.00343322753906, 227.51791381835938, 237.03237915039062, 246.54684448242188, 256.0613098144531, 265.5758056640625, 275.09027099609375, 284.604736328125, 294.1192321777344, 303.6336975097656, 313.1481628417969, 322.6626281738281, 332.1770935058594, 341.6915588378906]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 10.0, 8.0, 14.0, 19.0, 28.0, 27.0, 58.0, 100.0, 144.0, 254.0, 413.0, 658.0, 1139.0, 1925.0, 3760.0, 8007.0, 20099.0, 68044.0, 287965.0, 1157140.0, 1822745.0, 611785.0, 145623.0, 39060.0, 13254.0, 5623.0, 2813.0, 1481.0, 843.0, 474.0, 293.0, 159.0, 111.0, 73.0, 48.0, 27.0, 17.0, 15.0, 8.0, 7.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-19.59375, -18.9462890625, -18.298828125, -17.6513671875, -17.00390625, -16.3564453125, -15.708984375, -15.0615234375, -14.4140625, -13.7666015625, -13.119140625, -12.4716796875, -11.82421875, -11.1767578125, -10.529296875, -9.8818359375, -9.234375, -8.5869140625, -7.939453125, -7.2919921875, -6.64453125, -5.9970703125, -5.349609375, -4.7021484375, -4.0546875, -3.4072265625, -2.759765625, -2.1123046875, -1.46484375, -0.8173828125, -0.169921875, 0.4775390625, 1.125, 1.7724609375, 2.419921875, 3.0673828125, 3.71484375, 4.3623046875, 5.009765625, 5.6572265625, 6.3046875, 6.9521484375, 7.599609375, 8.2470703125, 8.89453125, 9.5419921875, 10.189453125, 10.8369140625, 11.484375, 12.1318359375, 12.779296875, 13.4267578125, 14.07421875, 14.7216796875, 15.369140625, 16.0166015625, 16.6640625, 17.3115234375, 17.958984375, 18.6064453125, 19.25390625, 19.9013671875, 20.548828125, 21.1962890625, 21.84375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 4.0, 15.0, 7.0, 9.0, 18.0, 12.0, 10.0, 19.0, 29.0, 25.0, 26.0, 32.0, 32.0, 29.0, 45.0, 44.0, 45.0, 39.0, 38.0, 53.0, 35.0, 40.0, 38.0, 38.0, 29.0, 37.0, 26.0, 36.0, 35.0, 25.0, 19.0, 15.0, 16.0, 9.0, 9.0, 9.0, 6.0, 9.0, 1.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.9453125, -16.375, -15.8046875, -15.234375, -14.6640625, -14.09375, -13.5234375, -12.953125, -12.3828125, -11.8125, -11.2421875, -10.671875, -10.1015625, -9.53125, -8.9609375, -8.390625, -7.8203125, -7.25, -6.6796875, -6.109375, -5.5390625, -4.96875, -4.3984375, -3.828125, -3.2578125, -2.6875, -2.1171875, -1.546875, -0.9765625, -0.40625, 0.1640625, 0.734375, 1.3046875, 1.875, 2.4453125, 3.015625, 3.5859375, 4.15625, 4.7265625, 5.296875, 5.8671875, 6.4375, 7.0078125, 7.578125, 8.1484375, 8.71875, 9.2890625, 9.859375, 10.4296875, 11.0, 11.5703125, 12.140625, 12.7109375, 13.28125, 13.8515625, 14.421875, 14.9921875, 15.5625, 16.1328125, 16.703125, 17.2734375, 17.84375, 18.4140625, 18.984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 2.0, 7.0, 7.0, 11.0, 17.0, 21.0, 28.0, 54.0, 96.0, 159.0, 336.0, 818.0, 2648.0, 14058.0, 185421.0, 3809034.0, 164675.0, 12804.0, 2497.0, 816.0, 325.0, 174.0, 97.0, 57.0, 36.0, 17.0, 14.0, 10.0, 9.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-73.0625, -70.94384765625, -68.8251953125, -66.70654296875, -64.587890625, -62.46923828125, -60.3505859375, -58.23193359375, -56.11328125, -53.99462890625, -51.8759765625, -49.75732421875, -47.638671875, -45.52001953125, -43.4013671875, -41.28271484375, -39.1640625, -37.04541015625, -34.9267578125, -32.80810546875, -30.689453125, -28.57080078125, -26.4521484375, -24.33349609375, -22.21484375, -20.09619140625, -17.9775390625, -15.85888671875, -13.740234375, -11.62158203125, -9.5029296875, -7.38427734375, -5.265625, -3.14697265625, -1.0283203125, 1.09033203125, 3.208984375, 5.32763671875, 7.4462890625, 9.56494140625, 11.68359375, 13.80224609375, 15.9208984375, 18.03955078125, 20.158203125, 22.27685546875, 24.3955078125, 26.51416015625, 28.6328125, 30.75146484375, 32.8701171875, 34.98876953125, 37.107421875, 39.22607421875, 41.3447265625, 43.46337890625, 45.58203125, 47.70068359375, 49.8193359375, 51.93798828125, 54.056640625, 56.17529296875, 58.2939453125, 60.41259765625, 62.53125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 7.0, 11.0, 15.0, 26.0, 30.0, 47.0, 73.0, 111.0, 204.0, 350.0, 680.0, 851.0, 707.0, 413.0, 231.0, 117.0, 86.0, 27.0, 20.0, 21.0, 13.0, 10.0, 6.0, 2.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.84375, -55.95361328125, -54.0634765625, -52.17333984375, -50.283203125, -48.39306640625, -46.5029296875, -44.61279296875, -42.72265625, -40.83251953125, -38.9423828125, -37.05224609375, -35.162109375, -33.27197265625, -31.3818359375, -29.49169921875, -27.6015625, -25.71142578125, -23.8212890625, -21.93115234375, -20.041015625, -18.15087890625, -16.2607421875, -14.37060546875, -12.48046875, -10.59033203125, -8.7001953125, -6.81005859375, -4.919921875, -3.02978515625, -1.1396484375, 0.75048828125, 2.640625, 4.53076171875, 6.4208984375, 8.31103515625, 10.201171875, 12.09130859375, 13.9814453125, 15.87158203125, 17.76171875, 19.65185546875, 21.5419921875, 23.43212890625, 25.322265625, 27.21240234375, 29.1025390625, 30.99267578125, 32.8828125, 34.77294921875, 36.6630859375, 38.55322265625, 40.443359375, 42.33349609375, 44.2236328125, 46.11376953125, 48.00390625, 49.89404296875, 51.7841796875, 53.67431640625, 55.564453125, 57.45458984375, 59.3447265625, 61.23486328125, 63.125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 12.0, 9.0, 38.0, 105.0, 231.0, 263.0, 208.0, 88.0, 25.0, 10.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-776.28076171875, -757.06201171875, -737.84326171875, -718.62451171875, -699.40576171875, -680.18701171875, -660.96826171875, -641.74951171875, -622.53076171875, -603.31201171875, -584.09326171875, -564.87451171875, -545.65576171875, -526.43701171875, -507.2182312011719, -487.9994812011719, -468.78070068359375, -449.56195068359375, -430.34320068359375, -411.12445068359375, -391.90570068359375, -372.68695068359375, -353.4681701660156, -334.2494201660156, -315.0306701660156, -295.8119201660156, -276.5931701660156, -257.3744201660156, -238.15565490722656, -218.93690490722656, -199.7181396484375, -180.4993896484375, -161.28067016601562, -142.06192016601562, -122.8431625366211, -103.62440490722656, -84.40565490722656, -65.18690490722656, -45.96814727783203, -26.7493896484375, -7.5306396484375, 11.688114166259766, 30.90686798095703, 50.1256217956543, 69.34437561035156, 88.56312561035156, 107.7818832397461, 127.00064086914062, 146.21939086914062, 165.43814086914062, 184.65689086914062, 203.8756561279297, 223.0944061279297, 242.3131561279297, 261.53192138671875, 280.75067138671875, 299.96942138671875, 319.18817138671875, 338.40692138671875, 357.62567138671875, 376.84442138671875, 396.06317138671875, 415.2819519042969, 434.5007019042969, 453.7194519042969]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 12.0, 13.0, 10.0, 17.0, 15.0, 26.0, 25.0, 33.0, 29.0, 44.0, 39.0, 35.0, 47.0, 51.0, 54.0, 62.0, 47.0, 45.0, 49.0, 35.0, 40.0, 41.0, 29.0, 25.0, 20.0, 20.0, 18.0, 10.0, 13.0, 10.0, 15.0, 12.0, 10.0, 7.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.3595733642578, -177.9515380859375, -171.54351806640625, -165.13548278808594, -158.72744750976562, -152.31942749023438, -145.91139221191406, -139.50335693359375, -133.0953369140625, -126.68730926513672, -120.27928161621094, -113.87124633789062, -107.46321868896484, -101.05519104003906, -94.64715576171875, -88.23912811279297, -81.83110046386719, -75.4230728149414, -69.01504516601562, -62.60700988769531, -56.19898223876953, -49.79095458984375, -43.3829231262207, -36.974891662597656, -30.566864013671875, -24.15883445739746, -17.750804901123047, -11.342775344848633, -4.934745788574219, 1.4732818603515625, 7.881313323974609, 14.289344787597656, 20.6973876953125, 27.105417251586914, 33.51344680786133, 39.921478271484375, 46.329505920410156, 52.73753356933594, 59.145565032958984, 65.55359649658203, 71.96162414550781, 78.3696517944336, 84.77767944335938, 91.18571472167969, 97.59374237060547, 104.00177001953125, 110.40980529785156, 116.81783294677734, 123.22586059570312, 129.63389587402344, 136.0419158935547, 142.449951171875, 148.85797119140625, 155.26600646972656, 161.67404174804688, 168.08206176757812, 174.49009704589844, 180.89813232421875, 187.30615234375, 193.7141876220703, 200.12222290039062, 206.53024291992188, 212.9382781982422, 219.3463134765625, 225.75433349609375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 6.0, 0.0, 5.0, 5.0, 8.0, 10.0, 19.0, 20.0, 27.0, 49.0, 85.0, 92.0, 165.0, 247.0, 389.0, 680.0, 1115.0, 1954.0, 3648.0, 6598.0, 13110.0, 26472.0, 57669.0, 134841.0, 303143.0, 277816.0, 119799.0, 51065.0, 23776.0, 11777.0, 6124.0, 3254.0, 1815.0, 1099.0, 622.0, 354.0, 237.0, 144.0, 105.0, 73.0, 42.0, 37.0, 14.0, 17.0, 12.0, 13.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.45703125, -22.5859375, -21.71484375, -20.84375, -19.97265625, -19.1015625, -18.23046875, -17.359375, -16.48828125, -15.6171875, -14.74609375, -13.875, -13.00390625, -12.1328125, -11.26171875, -10.390625, -9.51953125, -8.6484375, -7.77734375, -6.90625, -6.03515625, -5.1640625, -4.29296875, -3.421875, -2.55078125, -1.6796875, -0.80859375, 0.0625, 0.93359375, 1.8046875, 2.67578125, 3.546875, 4.41796875, 5.2890625, 6.16015625, 7.03125, 7.90234375, 8.7734375, 9.64453125, 10.515625, 11.38671875, 12.2578125, 13.12890625, 14.0, 14.87109375, 15.7421875, 16.61328125, 17.484375, 18.35546875, 19.2265625, 20.09765625, 20.96875, 21.83984375, 22.7109375, 23.58203125, 24.453125, 25.32421875, 26.1953125, 27.06640625, 27.9375, 28.80859375, 29.6796875, 30.55078125, 31.421875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 4.0, 4.0, 9.0, 5.0, 11.0, 7.0, 9.0, 21.0, 15.0, 21.0, 22.0, 26.0, 16.0, 21.0, 30.0, 34.0, 28.0, 35.0, 43.0, 45.0, 37.0, 39.0, 37.0, 33.0, 43.0, 45.0, 30.0, 43.0, 39.0, 17.0, 32.0, 26.0, 27.0, 26.0, 25.0, 15.0, 13.0, 10.0, 6.0, 5.0, 7.0, 11.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-17.3125, -16.755615234375, -16.19873046875, -15.641845703125, -15.0849609375, -14.528076171875, -13.97119140625, -13.414306640625, -12.857421875, -12.300537109375, -11.74365234375, -11.186767578125, -10.6298828125, -10.072998046875, -9.51611328125, -8.959228515625, -8.40234375, -7.845458984375, -7.28857421875, -6.731689453125, -6.1748046875, -5.617919921875, -5.06103515625, -4.504150390625, -3.947265625, -3.390380859375, -2.83349609375, -2.276611328125, -1.7197265625, -1.162841796875, -0.60595703125, -0.049072265625, 0.5078125, 1.064697265625, 1.62158203125, 2.178466796875, 2.7353515625, 3.292236328125, 3.84912109375, 4.406005859375, 4.962890625, 5.519775390625, 6.07666015625, 6.633544921875, 7.1904296875, 7.747314453125, 8.30419921875, 8.861083984375, 9.41796875, 9.974853515625, 10.53173828125, 11.088623046875, 11.6455078125, 12.202392578125, 12.75927734375, 13.316162109375, 13.873046875, 14.429931640625, 14.98681640625, 15.543701171875, 16.1005859375, 16.657470703125, 17.21435546875, 17.771240234375, 18.328125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 9.0, 6.0, 15.0, 6.0, 22.0, 25.0, 40.0, 63.0, 99.0, 149.0, 241.0, 406.0, 721.0, 1385.0, 3698.0, 14757.0, 128216.0, 824261.0, 60088.0, 9130.0, 2620.0, 1096.0, 562.0, 348.0, 202.0, 117.0, 74.0, 64.0, 25.0, 23.0, 19.0, 13.0, 14.0, 12.0, 7.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-77.0, -74.462890625, -71.92578125, -69.388671875, -66.8515625, -64.314453125, -61.77734375, -59.240234375, -56.703125, -54.166015625, -51.62890625, -49.091796875, -46.5546875, -44.017578125, -41.48046875, -38.943359375, -36.40625, -33.869140625, -31.33203125, -28.794921875, -26.2578125, -23.720703125, -21.18359375, -18.646484375, -16.109375, -13.572265625, -11.03515625, -8.498046875, -5.9609375, -3.423828125, -0.88671875, 1.650390625, 4.1875, 6.724609375, 9.26171875, 11.798828125, 14.3359375, 16.873046875, 19.41015625, 21.947265625, 24.484375, 27.021484375, 29.55859375, 32.095703125, 34.6328125, 37.169921875, 39.70703125, 42.244140625, 44.78125, 47.318359375, 49.85546875, 52.392578125, 54.9296875, 57.466796875, 60.00390625, 62.541015625, 65.078125, 67.615234375, 70.15234375, 72.689453125, 75.2265625, 77.763671875, 80.30078125, 82.837890625, 85.375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 15.0, 4.0, 13.0, 13.0, 22.0, 31.0, 30.0, 42.0, 34.0, 57.0, 65.0, 66.0, 84.0, 77.0, 62.0, 70.0, 57.0, 53.0, 42.0, 33.0, 23.0, 25.0, 21.0, 19.0, 7.0, 8.0, 7.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.6875, -69.4482421875, -66.208984375, -62.9697265625, -59.73046875, -56.4912109375, -53.251953125, -50.0126953125, -46.7734375, -43.5341796875, -40.294921875, -37.0556640625, -33.81640625, -30.5771484375, -27.337890625, -24.0986328125, -20.859375, -17.6201171875, -14.380859375, -11.1416015625, -7.90234375, -4.6630859375, -1.423828125, 1.8154296875, 5.0546875, 8.2939453125, 11.533203125, 14.7724609375, 18.01171875, 21.2509765625, 24.490234375, 27.7294921875, 30.96875, 34.2080078125, 37.447265625, 40.6865234375, 43.92578125, 47.1650390625, 50.404296875, 53.6435546875, 56.8828125, 60.1220703125, 63.361328125, 66.6005859375, 69.83984375, 73.0791015625, 76.318359375, 79.5576171875, 82.796875, 86.0361328125, 89.275390625, 92.5146484375, 95.75390625, 98.9931640625, 102.232421875, 105.4716796875, 108.7109375, 111.9501953125, 115.189453125, 118.4287109375, 121.66796875, 124.9072265625, 128.146484375, 131.3857421875, 134.625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 7.0, 19.0, 15.0, 28.0, 24.0, 28.0, 57.0, 82.0, 144.0, 193.0, 317.0, 508.0, 944.0, 2026.0, 5238.0, 16516.0, 79030.0, 779738.0, 128406.0, 23123.0, 6814.0, 2525.0, 1168.0, 579.0, 336.0, 222.0, 129.0, 97.0, 58.0, 57.0, 26.0, 17.0, 20.0, 12.0, 9.0, 7.0, 5.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0], "bins": [-13.8671875, -13.4547119140625, -13.042236328125, -12.6297607421875, -12.21728515625, -11.8048095703125, -11.392333984375, -10.9798583984375, -10.5673828125, -10.1549072265625, -9.742431640625, -9.3299560546875, -8.91748046875, -8.5050048828125, -8.092529296875, -7.6800537109375, -7.267578125, -6.8551025390625, -6.442626953125, -6.0301513671875, -5.61767578125, -5.2052001953125, -4.792724609375, -4.3802490234375, -3.9677734375, -3.5552978515625, -3.142822265625, -2.7303466796875, -2.31787109375, -1.9053955078125, -1.492919921875, -1.0804443359375, -0.66796875, -0.2554931640625, 0.156982421875, 0.5694580078125, 0.98193359375, 1.3944091796875, 1.806884765625, 2.2193603515625, 2.6318359375, 3.0443115234375, 3.456787109375, 3.8692626953125, 4.28173828125, 4.6942138671875, 5.106689453125, 5.5191650390625, 5.931640625, 6.3441162109375, 6.756591796875, 7.1690673828125, 7.58154296875, 7.9940185546875, 8.406494140625, 8.8189697265625, 9.2314453125, 9.6439208984375, 10.056396484375, 10.4688720703125, 10.88134765625, 11.2938232421875, 11.706298828125, 12.1187744140625, 12.53125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 5.0, 2.0, 5.0, 5.0, 17.0, 12.0, 19.0, 22.0, 21.0, 26.0, 43.0, 61.0, 78.0, 110.0, 118.0, 90.0, 93.0, 56.0, 37.0, 35.0, 26.0, 18.0, 16.0, 10.0, 12.0, 6.0, 11.0, 8.0, 6.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0031890869140625, -0.0030842721462249756, -0.002979457378387451, -0.0028746426105499268, -0.0027698278427124023, -0.002665013074874878, -0.0025601983070373535, -0.002455383539199829, -0.0023505687713623047, -0.0022457540035247803, -0.002140939235687256, -0.0020361244678497314, -0.001931309700012207, -0.0018264949321746826, -0.0017216801643371582, -0.0016168653964996338, -0.0015120506286621094, -0.001407235860824585, -0.0013024210929870605, -0.0011976063251495361, -0.0010927915573120117, -0.0009879767894744873, -0.0008831620216369629, -0.0007783472537994385, -0.0006735324859619141, -0.0005687177181243896, -0.00046390295028686523, -0.0003590881824493408, -0.0002542734146118164, -0.000149458646774292, -4.464387893676758e-05, 6.0170888900756836e-05, 0.00016498565673828125, 0.00026980042457580566, 0.0003746151924133301, 0.0004794299602508545, 0.0005842447280883789, 0.0006890594959259033, 0.0007938742637634277, 0.0008986890316009521, 0.0010035037994384766, 0.001108318567276001, 0.0012131333351135254, 0.0013179481029510498, 0.0014227628707885742, 0.0015275776386260986, 0.001632392406463623, 0.0017372071743011475, 0.0018420219421386719, 0.0019468367099761963, 0.0020516514778137207, 0.002156466245651245, 0.0022612810134887695, 0.002366095781326294, 0.0024709105491638184, 0.0025757253170013428, 0.002680540084838867, 0.0027853548526763916, 0.002890169620513916, 0.0029949843883514404, 0.003099799156188965, 0.0032046139240264893, 0.0033094286918640137, 0.003414243459701538, 0.0035190582275390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 8.0, 5.0, 5.0, 1.0, 6.0, 13.0, 21.0, 28.0, 41.0, 70.0, 96.0, 127.0, 238.0, 455.0, 1006.0, 2695.0, 8818.0, 56526.0, 858362.0, 101678.0, 12439.0, 3266.0, 1295.0, 575.0, 308.0, 171.0, 112.0, 56.0, 53.0, 22.0, 13.0, 15.0, 10.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.821044921875, -16.18896484375, -15.556884765625, -14.9248046875, -14.292724609375, -13.66064453125, -13.028564453125, -12.396484375, -11.764404296875, -11.13232421875, -10.500244140625, -9.8681640625, -9.236083984375, -8.60400390625, -7.971923828125, -7.33984375, -6.707763671875, -6.07568359375, -5.443603515625, -4.8115234375, -4.179443359375, -3.54736328125, -2.915283203125, -2.283203125, -1.651123046875, -1.01904296875, -0.386962890625, 0.2451171875, 0.877197265625, 1.50927734375, 2.141357421875, 2.7734375, 3.405517578125, 4.03759765625, 4.669677734375, 5.3017578125, 5.933837890625, 6.56591796875, 7.197998046875, 7.830078125, 8.462158203125, 9.09423828125, 9.726318359375, 10.3583984375, 10.990478515625, 11.62255859375, 12.254638671875, 12.88671875, 13.518798828125, 14.15087890625, 14.782958984375, 15.4150390625, 16.047119140625, 16.67919921875, 17.311279296875, 17.943359375, 18.575439453125, 19.20751953125, 19.839599609375, 20.4716796875, 21.103759765625, 21.73583984375, 22.367919921875, 23.0]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 1.0, 7.0, 7.0, 11.0, 7.0, 8.0, 11.0, 21.0, 25.0, 28.0, 31.0, 34.0, 34.0, 49.0, 61.0, 78.0, 82.0, 88.0, 73.0, 72.0, 48.0, 34.0, 39.0, 28.0, 20.0, 18.0, 12.0, 12.0, 12.0, 6.0, 9.0, 4.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.7578125, -10.440185546875, -10.12255859375, -9.804931640625, -9.4873046875, -9.169677734375, -8.85205078125, -8.534423828125, -8.216796875, -7.899169921875, -7.58154296875, -7.263916015625, -6.9462890625, -6.628662109375, -6.31103515625, -5.993408203125, -5.67578125, -5.358154296875, -5.04052734375, -4.722900390625, -4.4052734375, -4.087646484375, -3.77001953125, -3.452392578125, -3.134765625, -2.817138671875, -2.49951171875, -2.181884765625, -1.8642578125, -1.546630859375, -1.22900390625, -0.911376953125, -0.59375, -0.276123046875, 0.04150390625, 0.359130859375, 0.6767578125, 0.994384765625, 1.31201171875, 1.629638671875, 1.947265625, 2.264892578125, 2.58251953125, 2.900146484375, 3.2177734375, 3.535400390625, 3.85302734375, 4.170654296875, 4.48828125, 4.805908203125, 5.12353515625, 5.441162109375, 5.7587890625, 6.076416015625, 6.39404296875, 6.711669921875, 7.029296875, 7.346923828125, 7.66455078125, 7.982177734375, 8.2998046875, 8.617431640625, 8.93505859375, 9.252685546875, 9.5703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 35.0, 48.0, 97.0, 257.0, 267.0, 111.0, 78.0, 33.0, 22.0, 11.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-506.16717529296875, -492.85101318359375, -479.53485107421875, -466.21868896484375, -452.9024963378906, -439.5863342285156, -426.2701721191406, -412.9540100097656, -399.6378479003906, -386.3216857910156, -373.0055236816406, -359.6893310546875, -346.3731689453125, -333.0570068359375, -319.7408447265625, -306.4246826171875, -293.1085205078125, -279.7923583984375, -266.4761962890625, -253.16001892089844, -239.84385681152344, -226.52767944335938, -213.21151733398438, -199.89535522460938, -186.57916259765625, -173.26300048828125, -159.9468231201172, -146.6306610107422, -133.3144989013672, -119.99832916259766, -106.68215942382812, -93.36599731445312, -80.04983520507812, -66.7336654663086, -53.417503356933594, -40.10133361816406, -26.785167694091797, -13.469001770019531, -0.15283203125, 13.163330078125, 26.47949981689453, 39.7956657409668, 53.11183166503906, 66.4280014038086, 79.74417114257812, 93.06033325195312, 106.37650299072266, 119.69266510009766, 133.0088348388672, 146.3249969482422, 159.64117431640625, 172.95733642578125, 186.27349853515625, 199.58966064453125, 212.9058380126953, 226.2220001220703, 239.53817749023438, 252.85433959960938, 266.1705017089844, 279.4866943359375, 292.8028564453125, 306.1190185546875, 319.4351806640625, 332.7513427734375, 346.0675048828125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 12.0, 10.0, 11.0, 11.0, 20.0, 24.0, 22.0, 26.0, 23.0, 25.0, 39.0, 40.0, 51.0, 109.0, 158.0, 82.0, 60.0, 39.0, 31.0, 24.0, 27.0, 24.0, 20.0, 18.0, 10.0, 17.0, 16.0, 9.0, 7.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-376.76458740234375, -367.212646484375, -357.6606750488281, -348.1087341308594, -338.5567932128906, -329.00482177734375, -319.452880859375, -309.90093994140625, -300.3489990234375, -290.79705810546875, -281.2450866699219, -271.6931457519531, -262.1412048339844, -252.58924865722656, -243.03729248046875, -233.4853515625, -223.93338012695312, -214.3814239501953, -204.82948303222656, -195.27752685546875, -185.7255859375, -176.1736297607422, -166.62167358398438, -157.06973266601562, -147.5177764892578, -137.9658203125, -128.41387939453125, -118.86192321777344, -109.30997467041016, -99.75802612304688, -90.20606994628906, -80.65412139892578, -71.1021728515625, -61.55022430419922, -51.99827194213867, -42.446319580078125, -32.894371032714844, -23.342422485351562, -13.790470123291016, -4.238517761230469, 5.3134307861328125, 14.865381240844727, 24.41733169555664, 33.96928405761719, 43.52123260498047, 53.07318115234375, 62.6251335144043, 72.17708587646484, 81.72903442382812, 91.2809829711914, 100.83293151855469, 110.3848876953125, 119.93683624267578, 129.48878479003906, 139.04074096679688, 148.59268188476562, 158.14463806152344, 167.69659423828125, 177.24853515625, 186.8004913330078, 196.35244750976562, 205.90438842773438, 215.4563446044922, 225.00830078125, 234.56024169921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 13.0, 12.0, 20.0, 29.0, 48.0, 52.0, 74.0, 103.0, 178.0, 275.0, 440.0, 877.0, 1768.0, 4305.0, 14571.0, 102867.0, 1713810.0, 2190659.0, 138283.0, 16874.0, 4825.0, 2000.0, 909.0, 456.0, 294.0, 171.0, 108.0, 68.0, 53.0, 35.0, 32.0, 17.0, 15.0, 8.0, 4.0, 8.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.96875, -52.3359375, -50.703125, -49.0703125, -47.4375, -45.8046875, -44.171875, -42.5390625, -40.90625, -39.2734375, -37.640625, -36.0078125, -34.375, -32.7421875, -31.109375, -29.4765625, -27.84375, -26.2109375, -24.578125, -22.9453125, -21.3125, -19.6796875, -18.046875, -16.4140625, -14.78125, -13.1484375, -11.515625, -9.8828125, -8.25, -6.6171875, -4.984375, -3.3515625, -1.71875, -0.0859375, 1.546875, 3.1796875, 4.8125, 6.4453125, 8.078125, 9.7109375, 11.34375, 12.9765625, 14.609375, 16.2421875, 17.875, 19.5078125, 21.140625, 22.7734375, 24.40625, 26.0390625, 27.671875, 29.3046875, 30.9375, 32.5703125, 34.203125, 35.8359375, 37.46875, 39.1015625, 40.734375, 42.3671875, 44.0, 45.6328125, 47.265625, 48.8984375, 50.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 8.0, 9.0, 5.0, 7.0, 6.0, 9.0, 10.0, 20.0, 27.0, 9.0, 28.0, 21.0, 28.0, 25.0, 36.0, 34.0, 39.0, 30.0, 43.0, 32.0, 43.0, 50.0, 40.0, 44.0, 40.0, 40.0, 33.0, 46.0, 19.0, 30.0, 23.0, 27.0, 21.0, 17.0, 20.0, 9.0, 17.0, 11.0, 8.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.9375, -16.412841796875, -15.88818359375, -15.363525390625, -14.8388671875, -14.314208984375, -13.78955078125, -13.264892578125, -12.740234375, -12.215576171875, -11.69091796875, -11.166259765625, -10.6416015625, -10.116943359375, -9.59228515625, -9.067626953125, -8.54296875, -8.018310546875, -7.49365234375, -6.968994140625, -6.4443359375, -5.919677734375, -5.39501953125, -4.870361328125, -4.345703125, -3.821044921875, -3.29638671875, -2.771728515625, -2.2470703125, -1.722412109375, -1.19775390625, -0.673095703125, -0.1484375, 0.376220703125, 0.90087890625, 1.425537109375, 1.9501953125, 2.474853515625, 2.99951171875, 3.524169921875, 4.048828125, 4.573486328125, 5.09814453125, 5.622802734375, 6.1474609375, 6.672119140625, 7.19677734375, 7.721435546875, 8.24609375, 8.770751953125, 9.29541015625, 9.820068359375, 10.3447265625, 10.869384765625, 11.39404296875, 11.918701171875, 12.443359375, 12.968017578125, 13.49267578125, 14.017333984375, 14.5419921875, 15.066650390625, 15.59130859375, 16.115966796875, 16.640625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 8.0, 8.0, 18.0, 19.0, 42.0, 65.0, 125.0, 244.0, 480.0, 1376.0, 7559.0, 726264.0, 3443099.0, 11890.0, 1836.0, 617.0, 269.0, 143.0, 82.0, 47.0, 29.0, 19.0, 14.0, 9.0, 1.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-168.625, -163.52734375, -158.4296875, -153.33203125, -148.234375, -143.13671875, -138.0390625, -132.94140625, -127.84375, -122.74609375, -117.6484375, -112.55078125, -107.453125, -102.35546875, -97.2578125, -92.16015625, -87.0625, -81.96484375, -76.8671875, -71.76953125, -66.671875, -61.57421875, -56.4765625, -51.37890625, -46.28125, -41.18359375, -36.0859375, -30.98828125, -25.890625, -20.79296875, -15.6953125, -10.59765625, -5.5, -0.40234375, 4.6953125, 9.79296875, 14.890625, 19.98828125, 25.0859375, 30.18359375, 35.28125, 40.37890625, 45.4765625, 50.57421875, 55.671875, 60.76953125, 65.8671875, 70.96484375, 76.0625, 81.16015625, 86.2578125, 91.35546875, 96.453125, 101.55078125, 106.6484375, 111.74609375, 116.84375, 121.94140625, 127.0390625, 132.13671875, 137.234375, 142.33203125, 147.4296875, 152.52734375, 157.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 10.0, 15.0, 27.0, 42.0, 64.0, 91.0, 169.0, 348.0, 731.0, 1113.0, 678.0, 334.0, 168.0, 104.0, 69.0, 35.0, 29.0, 24.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.0625, -84.0, -80.9375, -77.875, -74.8125, -71.75, -68.6875, -65.625, -62.5625, -59.5, -56.4375, -53.375, -50.3125, -47.25, -44.1875, -41.125, -38.0625, -35.0, -31.9375, -28.875, -25.8125, -22.75, -19.6875, -16.625, -13.5625, -10.5, -7.4375, -4.375, -1.3125, 1.75, 4.8125, 7.875, 10.9375, 14.0, 17.0625, 20.125, 23.1875, 26.25, 29.3125, 32.375, 35.4375, 38.5, 41.5625, 44.625, 47.6875, 50.75, 53.8125, 56.875, 59.9375, 63.0, 66.0625, 69.125, 72.1875, 75.25, 78.3125, 81.375, 84.4375, 87.5, 90.5625, 93.625, 96.6875, 99.75, 102.8125, 105.875, 108.9375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 7.0, 24.0, 62.0, 148.0, 332.0, 234.0, 101.0, 44.0, 22.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1322.56689453125, -1285.486328125, -1248.4056396484375, -1211.3250732421875, -1174.244384765625, -1137.163818359375, -1100.083251953125, -1063.002685546875, -1025.9219970703125, -988.8413696289062, -951.7607421875, -914.68017578125, -877.5995483398438, -840.5189208984375, -803.4383544921875, -766.3577270507812, -729.277099609375, -692.1964721679688, -655.1158447265625, -618.0352783203125, -580.9546508789062, -543.8740234375, -506.7934265136719, -469.71282958984375, -432.6322021484375, -395.55157470703125, -358.4709777832031, -321.390380859375, -284.30975341796875, -247.22914123535156, -210.14852905273438, -173.06793212890625, -135.9874267578125, -98.90681457519531, -61.826202392578125, -24.745590209960938, 12.33502197265625, 49.41563415527344, 86.49624633789062, 123.57684326171875, 160.657470703125, 197.7380828857422, 234.81869506835938, 271.8992919921875, 308.97991943359375, 346.060546875, 383.1411437988281, 420.22174072265625, 457.3023681640625, 494.38299560546875, 531.463623046875, 568.544189453125, 605.6248168945312, 642.7054443359375, 679.7860107421875, 716.8666381835938, 753.947265625, 791.0278930664062, 828.1085205078125, 865.1890869140625, 902.2697143554688, 939.350341796875, 976.430908203125, 1013.5115356445312, 1050.5921630859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 3.0, 8.0, 7.0, 9.0, 11.0, 7.0, 18.0, 16.0, 29.0, 22.0, 27.0, 31.0, 31.0, 32.0, 55.0, 38.0, 51.0, 41.0, 49.0, 70.0, 41.0, 52.0, 48.0, 31.0, 41.0, 39.0, 19.0, 31.0, 21.0, 28.0, 15.0, 17.0, 9.0, 8.0, 6.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-370.226318359375, -359.552001953125, -348.8777160644531, -338.2033996582031, -327.52911376953125, -316.85479736328125, -306.18048095703125, -295.5061950683594, -284.8319091796875, -274.1575927734375, -263.4833068847656, -252.80899047851562, -242.13470458984375, -231.46038818359375, -220.7860870361328, -210.11178588867188, -199.43746948242188, -188.76316833496094, -178.0888671875, -167.41455078125, -156.74026489257812, -146.06594848632812, -135.3916473388672, -124.71734619140625, -114.04304504394531, -103.36874389648438, -92.69444274902344, -82.02013397216797, -71.34583282470703, -60.671531677246094, -49.997222900390625, -39.32292175292969, -28.648590087890625, -17.974287033081055, -7.299983978271484, 3.3743209838867188, 14.048622131347656, 24.722923278808594, 35.39723205566406, 46.071533203125, 56.74583435058594, 67.42013549804688, 78.09443664550781, 88.76874542236328, 99.44304656982422, 110.11734771728516, 120.79165649414062, 131.46595764160156, 142.1402587890625, 152.81455993652344, 163.48886108398438, 174.16317749023438, 184.83746337890625, 195.51177978515625, 206.1860809326172, 216.86038208007812, 227.53468322753906, 238.208984375, 248.88328552246094, 259.5575866699219, 270.2319030761719, 280.90618896484375, 291.58050537109375, 302.25482177734375, 312.9291076660156]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 7.0, 19.0, 52.0, 67.0, 144.0, 270.0, 514.0, 1288.0, 3365.0, 10512.0, 46824.0, 371099.0, 532735.0, 61926.0, 13219.0, 3853.0, 1458.0, 579.0, 303.0, 126.0, 93.0, 41.0, 16.0, 16.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-78.375, -76.41943359375, -74.4638671875, -72.50830078125, -70.552734375, -68.59716796875, -66.6416015625, -64.68603515625, -62.73046875, -60.77490234375, -58.8193359375, -56.86376953125, -54.908203125, -52.95263671875, -50.9970703125, -49.04150390625, -47.0859375, -45.13037109375, -43.1748046875, -41.21923828125, -39.263671875, -37.30810546875, -35.3525390625, -33.39697265625, -31.44140625, -29.48583984375, -27.5302734375, -25.57470703125, -23.619140625, -21.66357421875, -19.7080078125, -17.75244140625, -15.796875, -13.84130859375, -11.8857421875, -9.93017578125, -7.974609375, -6.01904296875, -4.0634765625, -2.10791015625, -0.15234375, 1.80322265625, 3.7587890625, 5.71435546875, 7.669921875, 9.62548828125, 11.5810546875, 13.53662109375, 15.4921875, 17.44775390625, 19.4033203125, 21.35888671875, 23.314453125, 25.27001953125, 27.2255859375, 29.18115234375, 31.13671875, 33.09228515625, 35.0478515625, 37.00341796875, 38.958984375, 40.91455078125, 42.8701171875, 44.82568359375, 46.78125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 10.0, 4.0, 3.0, 5.0, 9.0, 11.0, 11.0, 19.0, 18.0, 26.0, 33.0, 18.0, 30.0, 38.0, 25.0, 51.0, 40.0, 39.0, 50.0, 45.0, 50.0, 31.0, 53.0, 39.0, 34.0, 42.0, 30.0, 40.0, 28.0, 26.0, 32.0, 21.0, 19.0, 9.0, 8.0, 13.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.96875, -22.26953125, -21.5703125, -20.87109375, -20.171875, -19.47265625, -18.7734375, -18.07421875, -17.375, -16.67578125, -15.9765625, -15.27734375, -14.578125, -13.87890625, -13.1796875, -12.48046875, -11.78125, -11.08203125, -10.3828125, -9.68359375, -8.984375, -8.28515625, -7.5859375, -6.88671875, -6.1875, -5.48828125, -4.7890625, -4.08984375, -3.390625, -2.69140625, -1.9921875, -1.29296875, -0.59375, 0.10546875, 0.8046875, 1.50390625, 2.203125, 2.90234375, 3.6015625, 4.30078125, 5.0, 5.69921875, 6.3984375, 7.09765625, 7.796875, 8.49609375, 9.1953125, 9.89453125, 10.59375, 11.29296875, 11.9921875, 12.69140625, 13.390625, 14.08984375, 14.7890625, 15.48828125, 16.1875, 16.88671875, 17.5859375, 18.28515625, 18.984375, 19.68359375, 20.3828125, 21.08203125, 21.78125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 17.0, 32.0, 41.0, 68.0, 109.0, 240.0, 486.0, 1357.0, 6214.0, 108303.0, 907870.0, 19727.0, 2593.0, 764.0, 335.0, 150.0, 87.0, 52.0, 33.0, 16.0, 16.0, 9.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.1875, -90.2978515625, -87.408203125, -84.5185546875, -81.62890625, -78.7392578125, -75.849609375, -72.9599609375, -70.0703125, -67.1806640625, -64.291015625, -61.4013671875, -58.51171875, -55.6220703125, -52.732421875, -49.8427734375, -46.953125, -44.0634765625, -41.173828125, -38.2841796875, -35.39453125, -32.5048828125, -29.615234375, -26.7255859375, -23.8359375, -20.9462890625, -18.056640625, -15.1669921875, -12.27734375, -9.3876953125, -6.498046875, -3.6083984375, -0.71875, 2.1708984375, 5.060546875, 7.9501953125, 10.83984375, 13.7294921875, 16.619140625, 19.5087890625, 22.3984375, 25.2880859375, 28.177734375, 31.0673828125, 33.95703125, 36.8466796875, 39.736328125, 42.6259765625, 45.515625, 48.4052734375, 51.294921875, 54.1845703125, 57.07421875, 59.9638671875, 62.853515625, 65.7431640625, 68.6328125, 71.5224609375, 74.412109375, 77.3017578125, 80.19140625, 83.0810546875, 85.970703125, 88.8603515625, 91.75]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 8.0, 3.0, 5.0, 3.0, 5.0, 8.0, 9.0, 13.0, 14.0, 15.0, 23.0, 13.0, 29.0, 29.0, 34.0, 36.0, 51.0, 62.0, 61.0, 63.0, 63.0, 70.0, 59.0, 52.0, 45.0, 29.0, 32.0, 24.0, 28.0, 19.0, 13.0, 16.0, 13.0, 6.0, 14.0, 6.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.0, -77.26171875, -74.5234375, -71.78515625, -69.046875, -66.30859375, -63.5703125, -60.83203125, -58.09375, -55.35546875, -52.6171875, -49.87890625, -47.140625, -44.40234375, -41.6640625, -38.92578125, -36.1875, -33.44921875, -30.7109375, -27.97265625, -25.234375, -22.49609375, -19.7578125, -17.01953125, -14.28125, -11.54296875, -8.8046875, -6.06640625, -3.328125, -0.58984375, 2.1484375, 4.88671875, 7.625, 10.36328125, 13.1015625, 15.83984375, 18.578125, 21.31640625, 24.0546875, 26.79296875, 29.53125, 32.26953125, 35.0078125, 37.74609375, 40.484375, 43.22265625, 45.9609375, 48.69921875, 51.4375, 54.17578125, 56.9140625, 59.65234375, 62.390625, 65.12890625, 67.8671875, 70.60546875, 73.34375, 76.08203125, 78.8203125, 81.55859375, 84.296875, 87.03515625, 89.7734375, 92.51171875, 95.25]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 9.0, 12.0, 31.0, 35.0, 71.0, 143.0, 384.0, 1892.0, 19130.0, 982898.0, 40313.0, 2715.0, 548.0, 196.0, 72.0, 41.0, 24.0, 14.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.578125, -18.893798828125, -18.20947265625, -17.525146484375, -16.8408203125, -16.156494140625, -15.47216796875, -14.787841796875, -14.103515625, -13.419189453125, -12.73486328125, -12.050537109375, -11.3662109375, -10.681884765625, -9.99755859375, -9.313232421875, -8.62890625, -7.944580078125, -7.26025390625, -6.575927734375, -5.8916015625, -5.207275390625, -4.52294921875, -3.838623046875, -3.154296875, -2.469970703125, -1.78564453125, -1.101318359375, -0.4169921875, 0.267333984375, 0.95166015625, 1.635986328125, 2.3203125, 3.004638671875, 3.68896484375, 4.373291015625, 5.0576171875, 5.741943359375, 6.42626953125, 7.110595703125, 7.794921875, 8.479248046875, 9.16357421875, 9.847900390625, 10.5322265625, 11.216552734375, 11.90087890625, 12.585205078125, 13.26953125, 13.953857421875, 14.63818359375, 15.322509765625, 16.0068359375, 16.691162109375, 17.37548828125, 18.059814453125, 18.744140625, 19.428466796875, 20.11279296875, 20.797119140625, 21.4814453125, 22.165771484375, 22.85009765625, 23.534423828125, 24.21875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 11.0, 17.0, 14.0, 26.0, 29.0, 40.0, 31.0, 48.0, 81.0, 89.0, 114.0, 109.0, 91.0, 82.0, 49.0, 32.0, 29.0, 20.0, 22.0, 13.0, 8.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028228759765625, -0.002737104892730713, -0.0026513338088989258, -0.0025655627250671387, -0.0024797916412353516, -0.0023940205574035645, -0.0023082494735717773, -0.0022224783897399902, -0.002136707305908203, -0.002050936222076416, -0.001965165138244629, -0.0018793940544128418, -0.0017936229705810547, -0.0017078518867492676, -0.0016220808029174805, -0.0015363097190856934, -0.0014505386352539062, -0.0013647675514221191, -0.001278996467590332, -0.001193225383758545, -0.0011074542999267578, -0.0010216832160949707, -0.0009359121322631836, -0.0008501410484313965, -0.0007643699645996094, -0.0006785988807678223, -0.0005928277969360352, -0.000507056713104248, -0.00042128562927246094, -0.00033551454544067383, -0.0002497434616088867, -0.0001639723777770996, -7.82012939453125e-05, 7.569789886474609e-06, 9.334087371826172e-05, 0.00017911195755004883, 0.00026488304138183594, 0.00035065412521362305, 0.00043642520904541016, 0.0005221962928771973, 0.0006079673767089844, 0.0006937384605407715, 0.0007795095443725586, 0.0008652806282043457, 0.0009510517120361328, 0.00103682279586792, 0.001122593879699707, 0.0012083649635314941, 0.0012941360473632812, 0.0013799071311950684, 0.0014656782150268555, 0.0015514492988586426, 0.0016372203826904297, 0.0017229914665222168, 0.001808762550354004, 0.001894533634185791, 0.001980304718017578, 0.0020660758018493652, 0.0021518468856811523, 0.0022376179695129395, 0.0023233890533447266, 0.0024091601371765137, 0.0024949312210083008, 0.002580702304840088, 0.002666473388671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 7.0, 10.0, 14.0, 18.0, 51.0, 97.0, 244.0, 994.0, 11301.0, 999518.0, 33933.0, 1763.0, 348.0, 123.0, 69.0, 23.0, 10.0, 4.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.8125, -31.98486328125, -31.1572265625, -30.32958984375, -29.501953125, -28.67431640625, -27.8466796875, -27.01904296875, -26.19140625, -25.36376953125, -24.5361328125, -23.70849609375, -22.880859375, -22.05322265625, -21.2255859375, -20.39794921875, -19.5703125, -18.74267578125, -17.9150390625, -17.08740234375, -16.259765625, -15.43212890625, -14.6044921875, -13.77685546875, -12.94921875, -12.12158203125, -11.2939453125, -10.46630859375, -9.638671875, -8.81103515625, -7.9833984375, -7.15576171875, -6.328125, -5.50048828125, -4.6728515625, -3.84521484375, -3.017578125, -2.18994140625, -1.3623046875, -0.53466796875, 0.29296875, 1.12060546875, 1.9482421875, 2.77587890625, 3.603515625, 4.43115234375, 5.2587890625, 6.08642578125, 6.9140625, 7.74169921875, 8.5693359375, 9.39697265625, 10.224609375, 11.05224609375, 11.8798828125, 12.70751953125, 13.53515625, 14.36279296875, 15.1904296875, 16.01806640625, 16.845703125, 17.67333984375, 18.5009765625, 19.32861328125, 20.15625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 6.0, 10.0, 6.0, 14.0, 21.0, 20.0, 44.0, 52.0, 75.0, 86.0, 140.0, 120.0, 107.0, 86.0, 65.0, 46.0, 28.0, 19.0, 9.0, 8.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.8203125, -9.5064697265625, -9.192626953125, -8.8787841796875, -8.56494140625, -8.2510986328125, -7.937255859375, -7.6234130859375, -7.3095703125, -6.9957275390625, -6.681884765625, -6.3680419921875, -6.05419921875, -5.7403564453125, -5.426513671875, -5.1126708984375, -4.798828125, -4.4849853515625, -4.171142578125, -3.8572998046875, -3.54345703125, -3.2296142578125, -2.915771484375, -2.6019287109375, -2.2880859375, -1.9742431640625, -1.660400390625, -1.3465576171875, -1.03271484375, -0.7188720703125, -0.405029296875, -0.0911865234375, 0.22265625, 0.5364990234375, 0.850341796875, 1.1641845703125, 1.47802734375, 1.7918701171875, 2.105712890625, 2.4195556640625, 2.7333984375, 3.0472412109375, 3.361083984375, 3.6749267578125, 3.98876953125, 4.3026123046875, 4.616455078125, 4.9302978515625, 5.244140625, 5.5579833984375, 5.871826171875, 6.1856689453125, 6.49951171875, 6.8133544921875, 7.127197265625, 7.4410400390625, 7.7548828125, 8.0687255859375, 8.382568359375, 8.6964111328125, 9.01025390625, 9.3240966796875, 9.637939453125, 9.9517822265625, 10.265625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 11.0, 31.0, 67.0, 324.0, 455.0, 80.0, 19.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1020.0196533203125, -994.6287231445312, -969.23779296875, -943.846923828125, -918.4559936523438, -893.0650634765625, -867.6741333007812, -842.283203125, -816.892333984375, -791.5014038085938, -766.1104736328125, -740.7196044921875, -715.3286743164062, -689.937744140625, -664.5468139648438, -639.1558837890625, -613.7650146484375, -588.3740844726562, -562.983154296875, -537.59228515625, -512.2013549804688, -486.8104248046875, -461.41949462890625, -436.0285949707031, -410.63763427734375, -385.2467041015625, -359.8558044433594, -334.4648742675781, -309.073974609375, -283.68304443359375, -258.2921142578125, -232.90121459960938, -207.51031494140625, -182.11940002441406, -156.72848510742188, -131.33755493164062, -105.94664764404297, -80.55573272705078, -55.16481018066406, -29.773895263671875, -4.3829803466796875, 21.007936477661133, 46.39885330200195, 71.7897720336914, 97.1806869506836, 122.57160186767578, 147.9625244140625, 173.3534393310547, 198.74435424804688, 224.13526916503906, 249.52618408203125, 274.9171142578125, 300.3080139160156, 325.6989440917969, 351.08984375, 376.48077392578125, 401.8717041015625, 427.26263427734375, 452.6535339355469, 478.0444641113281, 503.43536376953125, 528.8262939453125, 554.2172241210938, 579.608154296875, 604.9990234375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 8.0, 5.0, 12.0, 11.0, 7.0, 10.0, 16.0, 15.0, 13.0, 13.0, 18.0, 33.0, 62.0, 105.0, 71.0, 70.0, 60.0, 58.0, 65.0, 118.0, 51.0, 29.0, 30.0, 21.0, 14.0, 22.0, 21.0, 7.0, 7.0, 4.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-309.3206787109375, -300.3393249511719, -291.35797119140625, -282.3766174316406, -273.395263671875, -264.4139099121094, -255.4325714111328, -246.4512176513672, -237.46986389160156, -228.48851013183594, -219.5071563720703, -210.5258026123047, -201.54446411132812, -192.5631103515625, -183.58175659179688, -174.60040283203125, -165.61904907226562, -156.6376953125, -147.65634155273438, -138.67498779296875, -129.69363403320312, -120.71228790283203, -111.73094177246094, -102.74958801269531, -93.76823425292969, -84.78688049316406, -75.80552673339844, -66.82418060302734, -57.84282684326172, -48.861473083496094, -39.880123138427734, -30.898773193359375, -21.917449951171875, -12.936098098754883, -3.9547462463378906, 5.026605606079102, 14.007957458496094, 22.98931121826172, 31.970661163330078, 40.95201110839844, 49.93336486816406, 58.91471862792969, 67.89607238769531, 76.8774185180664, 85.85877227783203, 94.84012603759766, 103.82147216796875, 112.80282592773438, 121.7841796875, 130.76553344726562, 139.74688720703125, 148.72824096679688, 157.7095947265625, 166.69094848632812, 175.6722869873047, 184.6536407470703, 193.63499450683594, 202.61634826660156, 211.5977020263672, 220.5790557861328, 229.56039428710938, 238.541748046875, 247.52310180664062, 256.50445556640625, 265.4858093261719]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 10.0, 10.0, 16.0, 15.0, 23.0, 34.0, 31.0, 32.0, 30.0, 58.0, 138.0, 238.0, 59.0, 48.0, 42.0, 29.0, 33.0, 19.0, 16.0, 16.0, 18.0, 16.0, 9.0, 6.0, 6.0, 12.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.984375, -25.178466796875, -24.37255859375, -23.566650390625, -22.7607421875, -21.954833984375, -21.14892578125, -20.343017578125, -19.537109375, -18.731201171875, -17.92529296875, -17.119384765625, -16.3134765625, -15.507568359375, -14.70166015625, -13.895751953125, -13.08984375, -12.283935546875, -11.47802734375, -10.672119140625, -9.8662109375, -9.060302734375, -8.25439453125, -7.448486328125, -6.642578125, -5.836669921875, -5.03076171875, -4.224853515625, -3.4189453125, -2.613037109375, -1.80712890625, -1.001220703125, -0.1953125, 0.610595703125, 1.41650390625, 2.222412109375, 3.0283203125, 3.834228515625, 4.64013671875, 5.446044921875, 6.251953125, 7.057861328125, 7.86376953125, 8.669677734375, 9.4755859375, 10.281494140625, 11.08740234375, 11.893310546875, 12.69921875, 13.505126953125, 14.31103515625, 15.116943359375, 15.9228515625, 16.728759765625, 17.53466796875, 18.340576171875, 19.146484375, 19.952392578125, 20.75830078125, 21.564208984375, 22.3701171875, 23.176025390625, 23.98193359375, 24.787841796875, 25.59375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 8.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 5.0, 2.0, 11.0, 10.0, 20.0, 13.0, 28.0, 48.0, 80.0, 209.0, 611.0, 3383.0, 7849317.0, 530555.0, 3227.0, 632.0, 171.0, 73.0, 32.0, 33.0, 26.0, 29.0, 13.0, 10.0, 8.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-325.1297607421875, -313.08160400390625, -301.0334777832031, -288.9853210449219, -276.93719482421875, -264.8890380859375, -252.84091186523438, -240.79275512695312, -228.74462890625, -216.6964874267578, -204.64834594726562, -192.60020446777344, -180.55206298828125, -168.50392150878906, -156.45578002929688, -144.40762329101562, -132.35948181152344, -120.31134033203125, -108.26319885253906, -96.21505737304688, -84.16691589355469, -72.1187744140625, -60.07062530517578, -48.022483825683594, -35.974342346191406, -23.92620086669922, -11.878057479858398, 0.17008590698242188, 12.21822738647461, 24.266368865966797, 36.31451416015625, 48.36265563964844, 60.410797119140625, 72.45893859863281, 84.507080078125, 96.55522155761719, 108.60336303710938, 120.65150451660156, 132.69964599609375, 144.747802734375, 156.79592895507812, 168.8440704345703, 180.8922119140625, 192.9403533935547, 204.98849487304688, 217.03663635253906, 229.08477783203125, 241.1329345703125, 253.1810760498047, 265.2292175292969, 277.2773742675781, 289.32550048828125, 301.3736572265625, 313.4217834472656, 325.4699401855469, 337.51806640625, 349.56622314453125, 361.6143798828125, 373.6625061035156, 385.7106628417969, 397.7587890625, 409.80694580078125, 421.8550720214844, 433.9032287597656, 445.95135498046875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 6.0, 8.0, 10.0, 7.0, 5.0, 5.0, 2.0, 4.0, 10.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-575.4168090820312, -561.3034057617188, -547.1900634765625, -533.07666015625, -518.9633178710938, -504.84991455078125, -490.7365417480469, -476.6231689453125, -462.509765625, -448.3963928222656, -434.28302001953125, -420.16961669921875, -406.0562438964844, -391.94287109375, -377.8294982910156, -363.71612548828125, -349.6027526855469, -335.4893798828125, -321.3760070800781, -307.26263427734375, -293.14923095703125, -279.0358581542969, -264.9224853515625, -250.80911254882812, -236.6957244873047, -222.5823516845703, -208.46896362304688, -194.3555908203125, -180.24221801757812, -166.1288299560547, -152.0154571533203, -137.90206909179688, -123.78872680664062, -109.67534637451172, -95.56196594238281, -81.44859313964844, -67.33521270751953, -53.221832275390625, -39.10845947265625, -24.995079040527344, -10.881698608398438, 3.231679916381836, 17.34505844116211, 31.45843505859375, 45.571815490722656, 59.68519592285156, 73.79856872558594, 87.91194915771484, 102.02532958984375, 116.13871002197266, 130.25209045410156, 144.36546325683594, 158.47885131835938, 172.59222412109375, 186.70559692382812, 200.8189697265625, 214.93235778808594, 229.0457305908203, 243.15911865234375, 257.2724914550781, 271.3858642578125, 285.499267578125, 299.61260986328125, 313.72601318359375, 327.8393859863281]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 4.0, 7.0, 15.0, 24.0, 32.0, 32.0, 46.0, 84.0, 127.0, 205.0, 364.0, 566.0, 1265.0, 2893.0, 7531.0, 21454.0, 65663.0, 179675.0, 161210.0, 55019.0, 17413.0, 6110.0, 2344.0, 1054.0, 506.0, 252.0, 151.0, 67.0, 58.0, 34.0, 10.0, 12.0, 12.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.5, -200.751953125, -195.00390625, -189.255859375, -183.5078125, -177.759765625, -172.01171875, -166.263671875, -160.515625, -154.767578125, -149.01953125, -143.271484375, -137.5234375, -131.775390625, -126.02734375, -120.279296875, -114.53125, -108.783203125, -103.03515625, -97.287109375, -91.5390625, -85.791015625, -80.04296875, -74.294921875, -68.546875, -62.798828125, -57.05078125, -51.302734375, -45.5546875, -39.806640625, -34.05859375, -28.310546875, -22.5625, -16.814453125, -11.06640625, -5.318359375, 0.4296875, 6.177734375, 11.92578125, 17.673828125, 23.421875, 29.169921875, 34.91796875, 40.666015625, 46.4140625, 52.162109375, 57.91015625, 63.658203125, 69.40625, 75.154296875, 80.90234375, 86.650390625, 92.3984375, 98.146484375, 103.89453125, 109.642578125, 115.390625, 121.138671875, 126.88671875, 132.634765625, 138.3828125, 144.130859375, 149.87890625, 155.626953125, 161.375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 2.0, 9.0, 5.0, 8.0, 10.0, 10.0, 11.0, 20.0, 7.0, 9.0, 16.0, 23.0, 23.0, 29.0, 27.0, 37.0, 37.0, 56.0, 45.0, 60.0, 65.0, 57.0, 48.0, 32.0, 45.0, 52.0, 37.0, 35.0, 30.0, 26.0, 29.0, 16.0, 22.0, 12.0, 13.0, 11.0, 7.0, 5.0, 4.0, 5.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-27.640625, -26.92138671875, -26.2021484375, -25.48291015625, -24.763671875, -24.04443359375, -23.3251953125, -22.60595703125, -21.88671875, -21.16748046875, -20.4482421875, -19.72900390625, -19.009765625, -18.29052734375, -17.5712890625, -16.85205078125, -16.1328125, -15.41357421875, -14.6943359375, -13.97509765625, -13.255859375, -12.53662109375, -11.8173828125, -11.09814453125, -10.37890625, -9.65966796875, -8.9404296875, -8.22119140625, -7.501953125, -6.78271484375, -6.0634765625, -5.34423828125, -4.625, -3.90576171875, -3.1865234375, -2.46728515625, -1.748046875, -1.02880859375, -0.3095703125, 0.40966796875, 1.12890625, 1.84814453125, 2.5673828125, 3.28662109375, 4.005859375, 4.72509765625, 5.4443359375, 6.16357421875, 6.8828125, 7.60205078125, 8.3212890625, 9.04052734375, 9.759765625, 10.47900390625, 11.1982421875, 11.91748046875, 12.63671875, 13.35595703125, 14.0751953125, 14.79443359375, 15.513671875, 16.23291015625, 16.9521484375, 17.67138671875, 18.390625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 5.0, 6.0, 7.0, 9.0, 13.0, 22.0, 32.0, 66.0, 80.0, 104.0, 75.0, 41.0, 8.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.3271484375, -208.95359802246094, -199.58004760742188, -190.2064971923828, -180.83294677734375, -171.45938110351562, -162.08583068847656, -152.7122802734375, -143.33872985839844, -133.96517944335938, -124.59162902832031, -115.21807098388672, -105.84452056884766, -96.4709701538086, -87.097412109375, -77.72386169433594, -68.35031127929688, -58.97676086425781, -49.603206634521484, -40.229652404785156, -30.856101989746094, -21.48255157470703, -12.108997344970703, -2.735443115234375, 6.6381072998046875, 16.011659622192383, 25.385211944580078, 34.758766174316406, 44.13231658935547, 53.50586700439453, 62.87942123413086, 72.25297546386719, 81.62652587890625, 91.00007629394531, 100.37362670898438, 109.74718475341797, 119.12073516845703, 128.49429321289062, 137.8678436279297, 147.24139404296875, 156.6149444580078, 165.98849487304688, 175.36204528808594, 184.735595703125, 194.10916137695312, 203.48269653320312, 212.85626220703125, 222.2298126220703, 231.60336303710938, 240.97691345214844, 250.3504638671875, 259.7240295410156, 269.0975646972656, 278.47113037109375, 287.84466552734375, 297.2182312011719, 306.591796875, 315.9653625488281, 325.3388977050781, 334.71246337890625, 344.08599853515625, 353.4595642089844, 362.8330993652344, 372.2066650390625, 381.5802001953125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 7.0, 8.0, 4.0, 5.0, 9.0, 17.0, 17.0, 44.0, 62.0, 76.0, 91.0, 54.0, 28.0, 23.0, 4.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.83026123046875, -161.76821899414062, -156.7061767578125, -151.64413452148438, -146.58209228515625, -141.52005004882812, -136.4580078125, -131.39596557617188, -126.33393096923828, -121.27188873291016, -116.20984649658203, -111.1478042602539, -106.08576965332031, -101.02372741699219, -95.96168518066406, -90.89964294433594, -85.83760070800781, -80.77555847167969, -75.71351623535156, -70.65147399902344, -65.58943176269531, -60.52739334106445, -55.465354919433594, -50.40331268310547, -45.341270446777344, -40.27922821044922, -35.217185974121094, -30.155147552490234, -25.09310531616211, -20.031063079833984, -14.969022750854492, -9.906982421875, -4.844940185546875, 0.2171010971069336, 5.279142379760742, 10.34118366241455, 15.40322494506836, 20.465267181396484, 25.527307510375977, 30.58934783935547, 35.651390075683594, 40.71343231201172, 45.775474548339844, 50.8375129699707, 55.89955520629883, 60.96159744262695, 66.02363586425781, 71.08567810058594, 76.14772033691406, 81.20976257324219, 86.27180480957031, 91.33384704589844, 96.39588928222656, 101.45793151855469, 106.51996612548828, 111.5820083618164, 116.64405059814453, 121.70609283447266, 126.76813507080078, 131.83016967773438, 136.8922119140625, 141.95425415039062, 147.01629638671875, 152.07833862304688, 157.140380859375]}, "eval/loss": 2.4603452682495117, "eval/wer": 0.35762049328333034, "eval/runtime": 877.6671, "eval/samples_per_second": 3.01, "eval/steps_per_second": 0.377} \ No newline at end of file