diff --git "a/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" "b/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 6.3833, "train/learning_rate": 3e-05, "train/epoch": 0.14, "train/global_step": 500, "_runtime": 1399, "_timestamp": 1646215678, "_step": 500, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 9.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30388.0, 54.0, 18.0, 11.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1262.0, -1231.296875, -1200.59375, -1169.890625, -1139.1875, -1108.484375, -1077.78125, -1047.078125, -1016.375, -985.671875, -954.96875, -924.265625, -893.5625, -862.859375, -832.15625, -801.453125, -770.75, -740.046875, -709.34375, -678.640625, -647.9375, -617.234375, -586.53125, -555.828125, -525.125, -494.421875, -463.71875, -433.015625, -402.3125, -371.609375, -340.90625, -310.203125, -279.5, -248.796875, -218.09375, -187.390625, -156.6875, -125.984375, -95.28125, -64.578125, -33.875, -3.171875, 27.53125, 58.234375, 88.9375, 119.640625, 150.34375, 181.046875, 211.75, 242.453125, 273.15625, 303.859375, 334.5625, 365.265625, 395.96875, 426.671875, 457.375, 488.078125, 518.78125, 549.484375, 580.1875, 610.890625, 641.59375, 672.296875, 703.0]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 10.0, 7.0, 3.0, 11.0, 13.0, 16.0, 20.0, 23.0, 30.0, 44.0, 51.0, 71.0, 68.0, 61.0, 92.0, 83.0, 74.0, 69.0, 60.0, 44.0, 39.0, 31.0, 22.0, 19.0, 15.0, 9.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-473.05267333984375, -457.8367004394531, -442.6207275390625, -427.4047546386719, -412.18878173828125, -396.97283935546875, -381.7568664550781, -366.5408935546875, -351.3249206542969, -336.10894775390625, -320.8929748535156, -305.677001953125, -290.4610595703125, -275.24505615234375, -260.02911376953125, -244.81314086914062, -229.59716796875, -214.38119506835938, -199.16522216796875, -183.9492645263672, -168.73329162597656, -153.51731872558594, -138.30136108398438, -123.08538818359375, -107.86941528320312, -92.6534423828125, -77.4374771118164, -62.22150802612305, -47.00553894042969, -31.789566040039062, -16.57360076904297, -1.357635498046875, 13.85833740234375, 29.07430648803711, 44.29027557373047, 59.50624465942383, 74.72221374511719, 89.93818664550781, 105.1541519165039, 120.3701171875, 135.58609008789062, 150.80206298828125, 166.01803588867188, 181.23399353027344, 196.44996643066406, 211.6659393310547, 226.88189697265625, 242.09786987304688, 257.3138427734375, 272.5298156738281, 287.74578857421875, 302.9617614746094, 318.177734375, 333.3936767578125, 348.6096496582031, 363.82562255859375, 379.0415954589844, 394.257568359375, 409.4735412597656, 424.68951416015625, 439.90545654296875, 455.1214599609375, 470.33740234375, 485.5533752441406, 500.76934814453125]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 6.0, 14.0, 14.0, 15.0, 9.0, 17.0, 15.0, 31.0, 20.0, 32.0, 27.0, 27.0, 36.0, 30.0, 35.0, 36.0, 56.0, 44.0, 36.0, 57.0, 37.0, 39.0, 34.0, 41.0, 35.0, 29.0, 38.0, 25.0, 24.0, 23.0, 20.0, 13.0, 11.0, 14.0, 9.0, 9.0, 12.0, 3.0, 1.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-338.35546875, -328.3011779785156, -318.24688720703125, -308.1925964355469, -298.1383056640625, -288.0840148925781, -278.02972412109375, -267.9754333496094, -257.921142578125, -247.86685180664062, -237.81256103515625, -227.75827026367188, -217.7039794921875, -207.64968872070312, -197.59539794921875, -187.54110717773438, -177.48681640625, -167.43252563476562, -157.37823486328125, -147.32394409179688, -137.2696533203125, -127.21536254882812, -117.16107177734375, -107.10678100585938, -97.052490234375, -86.99819946289062, -76.94390869140625, -66.88961791992188, -56.8353271484375, -46.781036376953125, -36.72674560546875, -26.672454833984375, -16.6181640625, -6.563873291015625, 3.49041748046875, 13.544708251953125, 23.5989990234375, 33.653289794921875, 43.70758056640625, 53.761871337890625, 63.816162109375, 73.87045288085938, 83.92474365234375, 93.97903442382812, 104.0333251953125, 114.08761596679688, 124.14190673828125, 134.19619750976562, 144.25048828125, 154.30477905273438, 164.35906982421875, 174.41336059570312, 184.4676513671875, 194.52194213867188, 204.57623291015625, 214.63052368164062, 224.684814453125, 234.73910522460938, 244.79339599609375, 254.84768676757812, 264.9019775390625, 274.9562683105469, 285.01055908203125, 295.0648498535156, 305.119140625]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 6.0, 12.0, 14.0, 22.0, 33.0, 49.0, 73.0, 104.0, 137.0, 206.0, 298.0, 449.0, 721.0, 1108.0, 1903.0, 3033.0, 4976.0, 8318.0, 14027.0, 24659.0, 46469.0, 105621.0, 544571.0, 161140.0, 58321.0, 30100.0, 17168.0, 9767.0, 5733.0, 3532.0, 2132.0, 1282.0, 869.0, 562.0, 383.0, 253.0, 138.0, 108.0, 77.0, 56.0, 35.0, 28.0, 15.0, 10.0, 8.0, 8.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1738.0, -1683.109375, -1628.21875, -1573.328125, -1518.4375, -1463.546875, -1408.65625, -1353.765625, -1298.875, -1243.984375, -1189.09375, -1134.203125, -1079.3125, -1024.421875, -969.53125, -914.640625, -859.75, -804.859375, -749.96875, -695.078125, -640.1875, -585.296875, -530.40625, -475.515625, -420.625, -365.734375, -310.84375, -255.953125, -201.0625, -146.171875, -91.28125, -36.390625, 18.5, 73.390625, 128.28125, 183.171875, 238.0625, 292.953125, 347.84375, 402.734375, 457.625, 512.515625, 567.40625, 622.296875, 677.1875, 732.078125, 786.96875, 841.859375, 896.75, 951.640625, 1006.53125, 1061.421875, 1116.3125, 1171.203125, 1226.09375, 1280.984375, 1335.875, 1390.765625, 1445.65625, 1500.546875, 1555.4375, 1610.328125, 1665.21875, 1720.109375, 1775.0]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 3.0, 9.0, 6.0, 10.0, 8.0, 13.0, 16.0, 15.0, 22.0, 19.0, 24.0, 30.0, 35.0, 50.0, 149.0, 197.0, 112.0, 57.0, 41.0, 31.0, 25.0, 24.0, 25.0, 15.0, 14.0, 12.0, 12.0, 3.0, 7.0, 4.0, 0.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-529.0, -511.5703125, -494.140625, -476.7109375, -459.28125, -441.8515625, -424.421875, -406.9921875, -389.5625, -372.1328125, -354.703125, -337.2734375, -319.84375, -302.4140625, -284.984375, -267.5546875, -250.125, -232.6953125, -215.265625, -197.8359375, -180.40625, -162.9765625, -145.546875, -128.1171875, -110.6875, -93.2578125, -75.828125, -58.3984375, -40.96875, -23.5390625, -6.109375, 11.3203125, 28.75, 46.1796875, 63.609375, 81.0390625, 98.46875, 115.8984375, 133.328125, 150.7578125, 168.1875, 185.6171875, 203.046875, 220.4765625, 237.90625, 255.3359375, 272.765625, 290.1953125, 307.625, 325.0546875, 342.484375, 359.9140625, 377.34375, 394.7734375, 412.203125, 429.6328125, 447.0625, 464.4921875, 481.921875, 499.3515625, 516.78125, 534.2109375, 551.640625, 569.0703125, 586.5]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 7.0, 14.0, 11.0, 8.0, 18.0, 29.0, 26.0, 42.0, 62.0, 68.0, 82.0, 102.0, 110.0, 102.0, 65.0, 40.0, 45.0, 35.0, 35.0, 24.0, 16.0, 14.0, 6.0, 12.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-340.2661437988281, -329.0177917480469, -317.76947021484375, -306.5211181640625, -295.27276611328125, -284.0244140625, -272.77606201171875, -261.5277404785156, -250.27938842773438, -239.03103637695312, -227.78269958496094, -216.53436279296875, -205.2860107421875, -194.03765869140625, -182.78932189941406, -171.54098510742188, -160.29263305664062, -149.04428100585938, -137.7959442138672, -126.54759979248047, -115.29925537109375, -104.05091094970703, -92.80256652832031, -81.5542221069336, -70.30587768554688, -59.057533264160156, -47.80918884277344, -36.56084442138672, -25.3125, -14.064155578613281, -2.8158111572265625, 8.432533264160156, 19.680877685546875, 30.929222106933594, 42.17756652832031, 53.42591094970703, 64.67425537109375, 75.92259979248047, 87.17094421386719, 98.4192886352539, 109.66763305664062, 120.91597747802734, 132.16432189941406, 143.41265869140625, 154.6610107421875, 165.90936279296875, 177.15769958496094, 188.40603637695312, 199.65438842773438, 210.90274047851562, 222.1510772705078, 233.3994140625, 244.64776611328125, 255.8961181640625, 267.14447021484375, 278.3927917480469, 289.6411437988281, 300.8894958496094, 312.1378173828125, 323.38616943359375, 334.634521484375, 345.88287353515625, 357.1312255859375, 368.3795471191406, 379.6278991699219]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 9.0, 7.0, 7.0, 6.0, 13.0, 14.0, 18.0, 20.0, 19.0, 25.0, 27.0, 32.0, 26.0, 45.0, 45.0, 42.0, 37.0, 37.0, 39.0, 41.0, 30.0, 44.0, 34.0, 42.0, 43.0, 39.0, 33.0, 23.0, 38.0, 32.0, 23.0, 22.0, 11.0, 11.0, 11.0, 8.0, 12.0, 7.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-248.25732421875, -241.13363647460938, -234.00994873046875, -226.88626098632812, -219.7625732421875, -212.63888549804688, -205.51519775390625, -198.39151000976562, -191.267822265625, -184.14413452148438, -177.02044677734375, -169.89675903320312, -162.7730712890625, -155.64938354492188, -148.52569580078125, -141.40200805664062, -134.2783203125, -127.15463256835938, -120.03094482421875, -112.90725708007812, -105.7835693359375, -98.65988159179688, -91.53619384765625, -84.41250610351562, -77.288818359375, -70.16513061523438, -63.04144287109375, -55.917755126953125, -48.7940673828125, -41.670379638671875, -34.54669189453125, -27.423004150390625, -20.29931640625, -13.175628662109375, -6.05194091796875, 1.071746826171875, 8.1954345703125, 15.319122314453125, 22.44281005859375, 29.566497802734375, 36.690185546875, 43.813873291015625, 50.93756103515625, 58.061248779296875, 65.1849365234375, 72.30862426757812, 79.43231201171875, 86.55599975585938, 93.6796875, 100.80337524414062, 107.92706298828125, 115.05075073242188, 122.1744384765625, 129.29812622070312, 136.42181396484375, 143.54550170898438, 150.669189453125, 157.79287719726562, 164.91656494140625, 172.04025268554688, 179.1639404296875, 186.28762817382812, 193.41131591796875, 200.53500366210938, 207.65869140625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 12.0, 14.0, 22.0, 24.0, 29.0, 33.0, 61.0, 118.0, 122.0, 223.0, 286.0, 464.0, 629.0, 920.0, 1415.0, 2110.0, 3211.0, 4841.0, 7485.0, 11757.0, 18427.0, 30153.0, 52321.0, 98273.0, 287758.0, 1432900.0, 1639080.0, 345989.0, 108060.0, 57156.0, 33026.0, 19965.0, 12762.0, 8256.0, 5380.0, 3561.0, 2301.0, 1667.0, 1063.0, 779.0, 484.0, 378.0, 227.0, 174.0, 129.0, 86.0, 45.0, 38.0, 25.0, 17.0, 12.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0], "bins": [-326.75, -316.8671875, -306.984375, -297.1015625, -287.21875, -277.3359375, -267.453125, -257.5703125, -247.6875, -237.8046875, -227.921875, -218.0390625, -208.15625, -198.2734375, -188.390625, -178.5078125, -168.625, -158.7421875, -148.859375, -138.9765625, -129.09375, -119.2109375, -109.328125, -99.4453125, -89.5625, -79.6796875, -69.796875, -59.9140625, -50.03125, -40.1484375, -30.265625, -20.3828125, -10.5, -0.6171875, 9.265625, 19.1484375, 29.03125, 38.9140625, 48.796875, 58.6796875, 68.5625, 78.4453125, 88.328125, 98.2109375, 108.09375, 117.9765625, 127.859375, 137.7421875, 147.625, 157.5078125, 167.390625, 177.2734375, 187.15625, 197.0390625, 206.921875, 216.8046875, 226.6875, 236.5703125, 246.453125, 256.3359375, 266.21875, 276.1015625, 285.984375, 295.8671875, 305.75]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 10.0, 18.0, 15.0, 17.0, 19.0, 21.0, 22.0, 38.0, 31.0, 30.0, 40.0, 45.0, 38.0, 36.0, 40.0, 37.0, 45.0, 45.0, 38.0, 45.0, 36.0, 40.0, 34.0, 20.0, 33.0, 35.0, 32.0, 17.0, 18.0, 11.0, 8.0, 10.0, 9.0, 12.0, 6.0, 8.0, 1.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-146.0, -141.587890625, -137.17578125, -132.763671875, -128.3515625, -123.939453125, -119.52734375, -115.115234375, -110.703125, -106.291015625, -101.87890625, -97.466796875, -93.0546875, -88.642578125, -84.23046875, -79.818359375, -75.40625, -70.994140625, -66.58203125, -62.169921875, -57.7578125, -53.345703125, -48.93359375, -44.521484375, -40.109375, -35.697265625, -31.28515625, -26.873046875, -22.4609375, -18.048828125, -13.63671875, -9.224609375, -4.8125, -0.400390625, 4.01171875, 8.423828125, 12.8359375, 17.248046875, 21.66015625, 26.072265625, 30.484375, 34.896484375, 39.30859375, 43.720703125, 48.1328125, 52.544921875, 56.95703125, 61.369140625, 65.78125, 70.193359375, 74.60546875, 79.017578125, 83.4296875, 87.841796875, 92.25390625, 96.666015625, 101.078125, 105.490234375, 109.90234375, 114.314453125, 118.7265625, 123.138671875, 127.55078125, 131.962890625, 136.375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 4.0, 5.0, 15.0, 26.0, 41.0, 61.0, 74.0, 151.0, 225.0, 348.0, 577.0, 914.0, 1586.0, 2826.0, 4943.0, 8825.0, 16468.0, 31503.0, 65697.0, 146900.0, 389503.0, 1868831.0, 1129430.0, 295988.0, 117475.0, 53630.0, 26543.0, 13925.0, 7501.0, 4146.0, 2490.0, 1455.0, 846.0, 502.0, 319.0, 201.0, 111.0, 55.0, 42.0, 29.0, 14.0, 16.0, 11.0, 5.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-360.0, -349.37109375, -338.7421875, -328.11328125, -317.484375, -306.85546875, -296.2265625, -285.59765625, -274.96875, -264.33984375, -253.7109375, -243.08203125, -232.453125, -221.82421875, -211.1953125, -200.56640625, -189.9375, -179.30859375, -168.6796875, -158.05078125, -147.421875, -136.79296875, -126.1640625, -115.53515625, -104.90625, -94.27734375, -83.6484375, -73.01953125, -62.390625, -51.76171875, -41.1328125, -30.50390625, -19.875, -9.24609375, 1.3828125, 12.01171875, 22.640625, 33.26953125, 43.8984375, 54.52734375, 65.15625, 75.78515625, 86.4140625, 97.04296875, 107.671875, 118.30078125, 128.9296875, 139.55859375, 150.1875, 160.81640625, 171.4453125, 182.07421875, 192.703125, 203.33203125, 213.9609375, 224.58984375, 235.21875, 245.84765625, 256.4765625, 267.10546875, 277.734375, 288.36328125, 298.9921875, 309.62109375, 320.25]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 9.0, 14.0, 12.0, 18.0, 17.0, 19.0, 34.0, 46.0, 66.0, 75.0, 88.0, 146.0, 161.0, 210.0, 316.0, 521.0, 695.0, 444.0, 305.0, 201.0, 155.0, 105.0, 81.0, 86.0, 58.0, 51.0, 31.0, 31.0, 17.0, 15.0, 15.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-121.0625, -117.8193359375, -114.576171875, -111.3330078125, -108.08984375, -104.8466796875, -101.603515625, -98.3603515625, -95.1171875, -91.8740234375, -88.630859375, -85.3876953125, -82.14453125, -78.9013671875, -75.658203125, -72.4150390625, -69.171875, -65.9287109375, -62.685546875, -59.4423828125, -56.19921875, -52.9560546875, -49.712890625, -46.4697265625, -43.2265625, -39.9833984375, -36.740234375, -33.4970703125, -30.25390625, -27.0107421875, -23.767578125, -20.5244140625, -17.28125, -14.0380859375, -10.794921875, -7.5517578125, -4.30859375, -1.0654296875, 2.177734375, 5.4208984375, 8.6640625, 11.9072265625, 15.150390625, 18.3935546875, 21.63671875, 24.8798828125, 28.123046875, 31.3662109375, 34.609375, 37.8525390625, 41.095703125, 44.3388671875, 47.58203125, 50.8251953125, 54.068359375, 57.3115234375, 60.5546875, 63.7978515625, 67.041015625, 70.2841796875, 73.52734375, 76.7705078125, 80.013671875, 83.2568359375, 86.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 7.0, 15.0, 18.0, 27.0, 26.0, 43.0, 53.0, 58.0, 70.0, 102.0, 106.0, 98.0, 80.0, 60.0, 52.0, 26.0, 28.0, 22.0, 15.0, 15.0, 15.0, 12.0, 5.0, 8.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-255.88021850585938, -248.50372314453125, -241.1272430419922, -233.75074768066406, -226.374267578125, -218.99777221679688, -211.62127685546875, -204.2447967529297, -196.86831665039062, -189.4918212890625, -182.11534118652344, -174.7388458251953, -167.36236572265625, -159.98587036132812, -152.609375, -145.23289489746094, -137.8563995361328, -130.4799041748047, -123.10342407226562, -115.7269287109375, -108.35044860839844, -100.97395324707031, -93.59746551513672, -86.22097778320312, -78.84449005126953, -71.46800231933594, -64.09151458740234, -56.715023040771484, -49.33853530883789, -41.9620475769043, -34.58555603027344, -27.209068298339844, -19.832565307617188, -12.456076622009277, -5.079587936401367, 2.2969017028808594, 9.673389434814453, 17.049877166748047, 24.426368713378906, 31.8028564453125, 39.179344177246094, 46.55583190917969, 53.93231964111328, 61.30881118774414, 68.685302734375, 76.06178283691406, 83.43827819824219, 90.81476593017578, 98.19125366210938, 105.56774139404297, 112.94422912597656, 120.32072448730469, 127.69720458984375, 135.07369995117188, 142.4501953125, 149.82667541503906, 157.20315551757812, 164.57965087890625, 171.9561309814453, 179.33262634277344, 186.7091064453125, 194.08560180664062, 201.46209716796875, 208.8385772705078, 216.21507263183594]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 11.0, 5.0, 7.0, 7.0, 14.0, 9.0, 19.0, 15.0, 25.0, 29.0, 31.0, 29.0, 29.0, 47.0, 41.0, 46.0, 43.0, 56.0, 37.0, 42.0, 40.0, 42.0, 46.0, 32.0, 27.0, 30.0, 38.0, 26.0, 26.0, 24.0, 17.0, 20.0, 12.0, 18.0, 8.0, 10.0, 9.0, 5.0, 8.0, 4.0, 11.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.4295196533203, -134.66250610351562, -129.8955078125, -125.12849426269531, -120.36148834228516, -115.594482421875, -110.82746887207031, -106.06046295166016, -101.29345703125, -96.52645111083984, -91.75944519042969, -86.992431640625, -82.22542572021484, -77.45841979980469, -72.69140625, -67.92440032958984, -63.15739440917969, -58.39038848876953, -53.62337875366211, -48.85636901855469, -44.08936309814453, -39.322357177734375, -34.55534744262695, -29.78833770751953, -25.021331787109375, -20.254323959350586, -15.487316131591797, -10.720308303833008, -5.953300476074219, -1.1862926483154297, 3.5807151794433594, 8.347724914550781, 13.114730834960938, 17.881738662719727, 22.648746490478516, 27.415754318237305, 32.182762145996094, 36.94976806640625, 41.71677780151367, 46.483787536621094, 51.25079345703125, 56.017799377441406, 60.78480911254883, 65.55181884765625, 70.3188247680664, 75.08583068847656, 79.85284423828125, 84.6198501586914, 89.38685607910156, 94.15386199951172, 98.92086791992188, 103.68788146972656, 108.45488739013672, 113.22189331054688, 117.98890686035156, 122.75591278076172, 127.52291870117188, 132.28993225097656, 137.0569305419922, 141.82394409179688, 146.5909423828125, 151.3579559326172, 156.12496948242188, 160.8919677734375, 165.6589813232422]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [6.0, 3.0, 6.0, 6.0, 9.0, 15.0, 15.0, 28.0, 48.0, 63.0, 86.0, 126.0, 205.0, 249.0, 391.0, 545.0, 827.0, 1139.0, 1715.0, 2492.0, 3611.0, 5397.0, 8123.0, 11888.0, 17824.0, 26971.0, 41244.0, 64640.0, 102281.0, 159729.0, 203591.0, 140540.0, 88952.0, 56680.0, 36625.0, 23745.0, 15823.0, 10577.0, 7131.0, 4805.0, 3304.0, 2194.0, 1583.0, 1036.0, 718.0, 494.0, 345.0, 232.0, 166.0, 106.0, 83.0, 55.0, 28.0, 30.0, 16.0, 13.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-91.0, -88.001953125, -85.00390625, -82.005859375, -79.0078125, -76.009765625, -73.01171875, -70.013671875, -67.015625, -64.017578125, -61.01953125, -58.021484375, -55.0234375, -52.025390625, -49.02734375, -46.029296875, -43.03125, -40.033203125, -37.03515625, -34.037109375, -31.0390625, -28.041015625, -25.04296875, -22.044921875, -19.046875, -16.048828125, -13.05078125, -10.052734375, -7.0546875, -4.056640625, -1.05859375, 1.939453125, 4.9375, 7.935546875, 10.93359375, 13.931640625, 16.9296875, 19.927734375, 22.92578125, 25.923828125, 28.921875, 31.919921875, 34.91796875, 37.916015625, 40.9140625, 43.912109375, 46.91015625, 49.908203125, 52.90625, 55.904296875, 58.90234375, 61.900390625, 64.8984375, 67.896484375, 70.89453125, 73.892578125, 76.890625, 79.888671875, 82.88671875, 85.884765625, 88.8828125, 91.880859375, 94.87890625, 97.876953125, 100.875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 8.0, 10.0, 5.0, 10.0, 5.0, 12.0, 14.0, 10.0, 23.0, 17.0, 32.0, 25.0, 39.0, 41.0, 31.0, 39.0, 37.0, 47.0, 51.0, 36.0, 42.0, 41.0, 39.0, 38.0, 33.0, 31.0, 36.0, 35.0, 26.0, 29.0, 23.0, 21.0, 18.0, 23.0, 11.0, 12.0, 12.0, 10.0, 5.0, 9.0, 6.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-133.625, -129.263671875, -124.90234375, -120.541015625, -116.1796875, -111.818359375, -107.45703125, -103.095703125, -98.734375, -94.373046875, -90.01171875, -85.650390625, -81.2890625, -76.927734375, -72.56640625, -68.205078125, -63.84375, -59.482421875, -55.12109375, -50.759765625, -46.3984375, -42.037109375, -37.67578125, -33.314453125, -28.953125, -24.591796875, -20.23046875, -15.869140625, -11.5078125, -7.146484375, -2.78515625, 1.576171875, 5.9375, 10.298828125, 14.66015625, 19.021484375, 23.3828125, 27.744140625, 32.10546875, 36.466796875, 40.828125, 45.189453125, 49.55078125, 53.912109375, 58.2734375, 62.634765625, 66.99609375, 71.357421875, 75.71875, 80.080078125, 84.44140625, 88.802734375, 93.1640625, 97.525390625, 101.88671875, 106.248046875, 110.609375, 114.970703125, 119.33203125, 123.693359375, 128.0546875, 132.416015625, 136.77734375, 141.138671875, 145.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 12.0, 17.0, 10.0, 23.0, 38.0, 47.0, 96.0, 151.0, 235.0, 412.0, 665.0, 1078.0, 1676.0, 2872.0, 5115.0, 9083.0, 16768.0, 33538.0, 70591.0, 157225.0, 349228.0, 214622.0, 93475.0, 43508.0, 21569.0, 11312.0, 6143.0, 3646.0, 2128.0, 1234.0, 786.0, 488.0, 287.0, 172.0, 98.0, 76.0, 45.0, 25.0, 17.0, 13.0, 13.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.9375, -88.83984375, -85.7421875, -82.64453125, -79.546875, -76.44921875, -73.3515625, -70.25390625, -67.15625, -64.05859375, -60.9609375, -57.86328125, -54.765625, -51.66796875, -48.5703125, -45.47265625, -42.375, -39.27734375, -36.1796875, -33.08203125, -29.984375, -26.88671875, -23.7890625, -20.69140625, -17.59375, -14.49609375, -11.3984375, -8.30078125, -5.203125, -2.10546875, 0.9921875, 4.08984375, 7.1875, 10.28515625, 13.3828125, 16.48046875, 19.578125, 22.67578125, 25.7734375, 28.87109375, 31.96875, 35.06640625, 38.1640625, 41.26171875, 44.359375, 47.45703125, 50.5546875, 53.65234375, 56.75, 59.84765625, 62.9453125, 66.04296875, 69.140625, 72.23828125, 75.3359375, 78.43359375, 81.53125, 84.62890625, 87.7265625, 90.82421875, 93.921875, 97.01953125, 100.1171875, 103.21484375, 106.3125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 10.0, 6.0, 10.0, 25.0, 10.0, 23.0, 14.0, 31.0, 14.0, 20.0, 33.0, 32.0, 30.0, 35.0, 46.0, 39.0, 41.0, 40.0, 44.0, 35.0, 43.0, 43.0, 35.0, 37.0, 35.0, 39.0, 26.0, 34.0, 28.0, 25.0, 11.0, 16.0, 18.0, 13.0, 11.0, 5.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.0, -88.30078125, -85.6015625, -82.90234375, -80.203125, -77.50390625, -74.8046875, -72.10546875, -69.40625, -66.70703125, -64.0078125, -61.30859375, -58.609375, -55.91015625, -53.2109375, -50.51171875, -47.8125, -45.11328125, -42.4140625, -39.71484375, -37.015625, -34.31640625, -31.6171875, -28.91796875, -26.21875, -23.51953125, -20.8203125, -18.12109375, -15.421875, -12.72265625, -10.0234375, -7.32421875, -4.625, -1.92578125, 0.7734375, 3.47265625, 6.171875, 8.87109375, 11.5703125, 14.26953125, 16.96875, 19.66796875, 22.3671875, 25.06640625, 27.765625, 30.46484375, 33.1640625, 35.86328125, 38.5625, 41.26171875, 43.9609375, 46.66015625, 49.359375, 52.05859375, 54.7578125, 57.45703125, 60.15625, 62.85546875, 65.5546875, 68.25390625, 70.953125, 73.65234375, 76.3515625, 79.05078125, 81.75]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 7.0, 4.0, 10.0, 11.0, 19.0, 25.0, 41.0, 53.0, 96.0, 151.0, 216.0, 367.0, 776.0, 1238.0, 2215.0, 4077.0, 8294.0, 18361.0, 49441.0, 190089.0, 578168.0, 127771.0, 37230.0, 14901.0, 6905.0, 3567.0, 1893.0, 1096.0, 577.0, 339.0, 223.0, 145.0, 107.0, 52.0, 25.0, 24.0, 20.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7265625, -1.66571044921875, -1.6048583984375, -1.54400634765625, -1.483154296875, -1.42230224609375, -1.3614501953125, -1.30059814453125, -1.23974609375, -1.17889404296875, -1.1180419921875, -1.05718994140625, -0.996337890625, -0.93548583984375, -0.8746337890625, -0.81378173828125, -0.7529296875, -0.69207763671875, -0.6312255859375, -0.57037353515625, -0.509521484375, -0.44866943359375, -0.3878173828125, -0.32696533203125, -0.26611328125, -0.20526123046875, -0.1444091796875, -0.08355712890625, -0.022705078125, 0.03814697265625, 0.0989990234375, 0.15985107421875, 0.220703125, 0.28155517578125, 0.3424072265625, 0.40325927734375, 0.464111328125, 0.52496337890625, 0.5858154296875, 0.64666748046875, 0.70751953125, 0.76837158203125, 0.8292236328125, 0.89007568359375, 0.950927734375, 1.01177978515625, 1.0726318359375, 1.13348388671875, 1.1943359375, 1.25518798828125, 1.3160400390625, 1.37689208984375, 1.437744140625, 1.49859619140625, 1.5594482421875, 1.62030029296875, 1.68115234375, 1.74200439453125, 1.8028564453125, 1.86370849609375, 1.924560546875, 1.98541259765625, 2.0462646484375, 2.10711669921875, 2.16796875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 3.0, 4.0, 7.0, 6.0, 11.0, 12.0, 17.0, 22.0, 22.0, 24.0, 52.0, 58.0, 105.0, 149.0, 140.0, 102.0, 77.0, 40.0, 29.0, 30.0, 18.0, 21.0, 5.0, 4.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000732421875, -0.0007087439298629761, -0.0006850659847259521, -0.0006613880395889282, -0.0006377100944519043, -0.0006140321493148804, -0.0005903542041778564, -0.0005666762590408325, -0.0005429983139038086, -0.0005193203687667847, -0.0004956424236297607, -0.0004719644784927368, -0.0004482865333557129, -0.00042460858821868896, -0.00040093064308166504, -0.0003772526979446411, -0.0003535747528076172, -0.00032989680767059326, -0.00030621886253356934, -0.0002825409173965454, -0.0002588629722595215, -0.00023518502712249756, -0.00021150708198547363, -0.0001878291368484497, -0.00016415119171142578, -0.00014047324657440186, -0.00011679530143737793, -9.3117356300354e-05, -6.943941116333008e-05, -4.576146602630615e-05, -2.2083520889282227e-05, 1.5944242477416992e-06, 2.5272369384765625e-05, 4.895031452178955e-05, 7.262825965881348e-05, 9.63062047958374e-05, 0.00011998414993286133, 0.00014366209506988525, 0.00016734004020690918, 0.0001910179853439331, 0.00021469593048095703, 0.00023837387561798096, 0.0002620518207550049, 0.0002857297658920288, 0.00030940771102905273, 0.00033308565616607666, 0.0003567636013031006, 0.0003804415464401245, 0.00040411949157714844, 0.00042779743671417236, 0.0004514753818511963, 0.0004751533269882202, 0.0004988312721252441, 0.0005225092172622681, 0.000546187162399292, 0.0005698651075363159, 0.0005935430526733398, 0.0006172209978103638, 0.0006408989429473877, 0.0006645768880844116, 0.0006882548332214355, 0.0007119327783584595, 0.0007356107234954834, 0.0007592886686325073, 0.0007829666137695312]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 9.0, 9.0, 14.0, 16.0, 26.0, 28.0, 38.0, 57.0, 87.0, 121.0, 193.0, 261.0, 444.0, 705.0, 957.0, 1581.0, 2543.0, 4163.0, 6957.0, 12090.0, 21606.0, 43526.0, 101628.0, 311318.0, 333604.0, 107749.0, 44966.0, 22661.0, 12330.0, 7240.0, 4257.0, 2612.0, 1612.0, 1017.0, 672.0, 463.0, 310.0, 221.0, 144.0, 85.0, 63.0, 54.0, 33.0, 21.0, 15.0, 10.0, 10.0, 3.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.0908203125, -1.0567626953125, -1.022705078125, -0.9886474609375, -0.95458984375, -0.9205322265625, -0.886474609375, -0.8524169921875, -0.818359375, -0.7843017578125, -0.750244140625, -0.7161865234375, -0.68212890625, -0.6480712890625, -0.614013671875, -0.5799560546875, -0.5458984375, -0.5118408203125, -0.477783203125, -0.4437255859375, -0.40966796875, -0.3756103515625, -0.341552734375, -0.3074951171875, -0.2734375, -0.2393798828125, -0.205322265625, -0.1712646484375, -0.13720703125, -0.1031494140625, -0.069091796875, -0.0350341796875, -0.0009765625, 0.0330810546875, 0.067138671875, 0.1011962890625, 0.13525390625, 0.1693115234375, 0.203369140625, 0.2374267578125, 0.271484375, 0.3055419921875, 0.339599609375, 0.3736572265625, 0.40771484375, 0.4417724609375, 0.475830078125, 0.5098876953125, 0.5439453125, 0.5780029296875, 0.612060546875, 0.6461181640625, 0.68017578125, 0.7142333984375, 0.748291015625, 0.7823486328125, 0.81640625, 0.8504638671875, 0.884521484375, 0.9185791015625, 0.95263671875, 0.9866943359375, 1.020751953125, 1.0548095703125, 1.0888671875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 10.0, 9.0, 5.0, 8.0, 11.0, 13.0, 14.0, 20.0, 33.0, 26.0, 36.0, 46.0, 57.0, 68.0, 103.0, 91.0, 102.0, 64.0, 50.0, 47.0, 35.0, 30.0, 28.0, 12.0, 15.0, 12.0, 15.0, 15.0, 9.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3232421875, -0.3132591247558594, -0.30327606201171875, -0.2932929992675781, -0.2833099365234375, -0.2733268737792969, -0.26334381103515625, -0.2533607482910156, -0.243377685546875, -0.23339462280273438, -0.22341156005859375, -0.21342849731445312, -0.2034454345703125, -0.19346237182617188, -0.18347930908203125, -0.17349624633789062, -0.16351318359375, -0.15353012084960938, -0.14354705810546875, -0.13356399536132812, -0.1235809326171875, -0.11359786987304688, -0.10361480712890625, -0.09363174438476562, -0.083648681640625, -0.07366561889648438, -0.06368255615234375, -0.053699493408203125, -0.0437164306640625, -0.033733367919921875, -0.02375030517578125, -0.013767242431640625, -0.0037841796875, 0.006198883056640625, 0.01618194580078125, 0.026165008544921875, 0.0361480712890625, 0.046131134033203125, 0.05611419677734375, 0.06609725952148438, 0.076080322265625, 0.08606338500976562, 0.09604644775390625, 0.10602951049804688, 0.1160125732421875, 0.12599563598632812, 0.13597869873046875, 0.14596176147460938, 0.15594482421875, 0.16592788696289062, 0.17591094970703125, 0.18589401245117188, 0.1958770751953125, 0.20586013793945312, 0.21584320068359375, 0.22582626342773438, 0.235809326171875, 0.24579238891601562, 0.25577545166015625, 0.2657585144042969, 0.2757415771484375, 0.2857246398925781, 0.29570770263671875, 0.3056907653808594, 0.315673828125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 11.0, 9.0, 15.0, 14.0, 21.0, 41.0, 40.0, 58.0, 93.0, 87.0, 117.0, 93.0, 94.0, 68.0, 54.0, 46.0, 18.0, 25.0, 18.0, 10.0, 9.0, 16.0, 8.0, 5.0, 11.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.96934509277344, -211.36349487304688, -204.75762939453125, -198.1517791748047, -191.54592895507812, -184.9400634765625, -178.33421325683594, -171.72836303710938, -165.1225128173828, -158.51666259765625, -151.91079711914062, -145.30494689941406, -138.6990966796875, -132.09323120117188, -125.48738098144531, -118.88153076171875, -112.27567291259766, -105.66981506347656, -99.06396484375, -92.4581069946289, -85.85225677490234, -79.24639892578125, -72.64054870605469, -66.0346908569336, -59.428836822509766, -52.82298278808594, -46.21712875366211, -39.61127471923828, -33.00541687011719, -26.39956283569336, -19.79370880126953, -13.187854766845703, -6.582000732421875, 0.023853778839111328, 6.629708290100098, 13.235563278198242, 19.84141731262207, 26.44727325439453, 33.05312728881836, 39.65898132324219, 46.264835357666016, 52.870689392089844, 59.47654342651367, 66.0823974609375, 72.6882553100586, 79.29411315917969, 85.89996337890625, 92.50581359863281, 99.1116714477539, 105.717529296875, 112.32337951660156, 118.92923736572266, 125.53508758544922, 132.1409454345703, 138.74679565429688, 145.3526611328125, 151.95851135253906, 158.56436157226562, 165.17022705078125, 171.7760772705078, 178.38192749023438, 184.98779296875, 191.59364318847656, 198.19949340820312, 204.8053436279297]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 7.0, 4.0, 8.0, 6.0, 7.0, 8.0, 13.0, 15.0, 17.0, 21.0, 30.0, 29.0, 25.0, 33.0, 32.0, 48.0, 38.0, 54.0, 59.0, 30.0, 43.0, 41.0, 39.0, 50.0, 39.0, 28.0, 22.0, 33.0, 38.0, 29.0, 20.0, 25.0, 15.0, 12.0, 15.0, 13.0, 18.0, 7.0, 3.0, 11.0, 4.0, 12.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.84197998046875, -115.68860626220703, -111.53523254394531, -107.3818588256836, -103.22848510742188, -99.07511901855469, -94.92174530029297, -90.76837158203125, -86.61499786376953, -82.46162414550781, -78.3082504272461, -74.15487670898438, -70.00151062011719, -65.84812927246094, -61.69476318359375, -57.54138946533203, -53.38801574707031, -49.234642028808594, -45.081268310546875, -40.92789840698242, -36.7745246887207, -32.621150970458984, -28.4677791595459, -24.314407348632812, -20.161033630371094, -16.007659912109375, -11.854288101196289, -7.700915336608887, -3.5475425720214844, 0.6058311462402344, 4.75920295715332, 8.912574768066406, 13.065948486328125, 17.219322204589844, 21.37269401550293, 25.526065826416016, 29.679439544677734, 33.83281326293945, 37.986183166503906, 42.139556884765625, 46.292930603027344, 50.44630432128906, 54.59967803955078, 58.753047943115234, 62.90642166137695, 67.05979919433594, 71.21316528320312, 75.36653900146484, 79.51991271972656, 83.67328643798828, 87.82666015625, 91.98003387451172, 96.13340759277344, 100.28677368164062, 104.44014739990234, 108.59352111816406, 112.74689483642578, 116.9002685546875, 121.05364227294922, 125.20701599121094, 129.36038208007812, 133.51376342773438, 137.66712951660156, 141.82049560546875, 145.973876953125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 12.0, 11.0, 21.0, 32.0, 36.0, 65.0, 91.0, 131.0, 201.0, 275.0, 421.0, 648.0, 931.0, 1242.0, 1922.0, 2689.0, 4159.0, 6156.0, 9185.0, 14247.0, 22338.0, 36941.0, 63545.0, 113409.0, 196340.0, 224546.0, 144965.0, 80130.0, 45869.0, 27265.0, 17384.0, 11062.0, 7144.0, 4711.0, 3182.0, 2225.0, 1622.0, 1104.0, 721.0, 540.0, 354.0, 231.0, 144.0, 107.0, 67.0, 52.0, 27.0, 20.0, 12.0, 6.0, 6.0, 8.0, 0.0, 1.0, 2.0], "bins": [-222.875, -216.359375, -209.84375, -203.328125, -196.8125, -190.296875, -183.78125, -177.265625, -170.75, -164.234375, -157.71875, -151.203125, -144.6875, -138.171875, -131.65625, -125.140625, -118.625, -112.109375, -105.59375, -99.078125, -92.5625, -86.046875, -79.53125, -73.015625, -66.5, -59.984375, -53.46875, -46.953125, -40.4375, -33.921875, -27.40625, -20.890625, -14.375, -7.859375, -1.34375, 5.171875, 11.6875, 18.203125, 24.71875, 31.234375, 37.75, 44.265625, 50.78125, 57.296875, 63.8125, 70.328125, 76.84375, 83.359375, 89.875, 96.390625, 102.90625, 109.421875, 115.9375, 122.453125, 128.96875, 135.484375, 142.0, 148.515625, 155.03125, 161.546875, 168.0625, 174.578125, 181.09375, 187.609375, 194.125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 13.0, 7.0, 15.0, 15.0, 15.0, 13.0, 17.0, 19.0, 25.0, 20.0, 24.0, 32.0, 27.0, 28.0, 53.0, 43.0, 50.0, 44.0, 37.0, 35.0, 31.0, 52.0, 42.0, 36.0, 35.0, 25.0, 27.0, 30.0, 30.0, 23.0, 22.0, 11.0, 13.0, 12.0, 18.0, 6.0, 8.0, 7.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.0625, -84.0625, -81.0625, -78.0625, -75.0625, -72.0625, -69.0625, -66.0625, -63.0625, -60.0625, -57.0625, -54.0625, -51.0625, -48.0625, -45.0625, -42.0625, -39.0625, -36.0625, -33.0625, -30.0625, -27.0625, -24.0625, -21.0625, -18.0625, -15.0625, -12.0625, -9.0625, -6.0625, -3.0625, -0.0625, 2.9375, 5.9375, 8.9375, 11.9375, 14.9375, 17.9375, 20.9375, 23.9375, 26.9375, 29.9375, 32.9375, 35.9375, 38.9375, 41.9375, 44.9375, 47.9375, 50.9375, 53.9375, 56.9375, 59.9375, 62.9375, 65.9375, 68.9375, 71.9375, 74.9375, 77.9375, 80.9375, 83.9375, 86.9375, 89.9375, 92.9375, 95.9375, 98.9375, 101.9375, 104.9375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 20.0, 19.0, 36.0, 53.0, 59.0, 110.0, 145.0, 218.0, 317.0, 543.0, 738.0, 1182.0, 1693.0, 2311.0, 3649.0, 5213.0, 7949.0, 12114.0, 18668.0, 28837.0, 47611.0, 80492.0, 136186.0, 202593.0, 189978.0, 119293.0, 70967.0, 42007.0, 26084.0, 16472.0, 11015.0, 7155.0, 4796.0, 3248.0, 2266.0, 1485.0, 1015.0, 623.0, 470.0, 312.0, 202.0, 142.0, 85.0, 70.0, 41.0, 29.0, 8.0, 6.0, 7.0, 9.0, 4.0, 7.0, 3.0, 3.0], "bins": [-199.625, -193.732421875, -187.83984375, -181.947265625, -176.0546875, -170.162109375, -164.26953125, -158.376953125, -152.484375, -146.591796875, -140.69921875, -134.806640625, -128.9140625, -123.021484375, -117.12890625, -111.236328125, -105.34375, -99.451171875, -93.55859375, -87.666015625, -81.7734375, -75.880859375, -69.98828125, -64.095703125, -58.203125, -52.310546875, -46.41796875, -40.525390625, -34.6328125, -28.740234375, -22.84765625, -16.955078125, -11.0625, -5.169921875, 0.72265625, 6.615234375, 12.5078125, 18.400390625, 24.29296875, 30.185546875, 36.078125, 41.970703125, 47.86328125, 53.755859375, 59.6484375, 65.541015625, 71.43359375, 77.326171875, 83.21875, 89.111328125, 95.00390625, 100.896484375, 106.7890625, 112.681640625, 118.57421875, 124.466796875, 130.359375, 136.251953125, 142.14453125, 148.037109375, 153.9296875, 159.822265625, 165.71484375, 171.607421875, 177.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 6.0, 8.0, 14.0, 13.0, 10.0, 18.0, 15.0, 12.0, 27.0, 24.0, 22.0, 28.0, 33.0, 39.0, 37.0, 48.0, 40.0, 42.0, 37.0, 33.0, 35.0, 36.0, 43.0, 38.0, 32.0, 39.0, 36.0, 22.0, 35.0, 28.0, 16.0, 12.0, 16.0, 15.0, 22.0, 12.0, 5.0, 10.0, 7.0, 11.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-67.8125, -65.884765625, -63.95703125, -62.029296875, -60.1015625, -58.173828125, -56.24609375, -54.318359375, -52.390625, -50.462890625, -48.53515625, -46.607421875, -44.6796875, -42.751953125, -40.82421875, -38.896484375, -36.96875, -35.041015625, -33.11328125, -31.185546875, -29.2578125, -27.330078125, -25.40234375, -23.474609375, -21.546875, -19.619140625, -17.69140625, -15.763671875, -13.8359375, -11.908203125, -9.98046875, -8.052734375, -6.125, -4.197265625, -2.26953125, -0.341796875, 1.5859375, 3.513671875, 5.44140625, 7.369140625, 9.296875, 11.224609375, 13.15234375, 15.080078125, 17.0078125, 18.935546875, 20.86328125, 22.791015625, 24.71875, 26.646484375, 28.57421875, 30.501953125, 32.4296875, 34.357421875, 36.28515625, 38.212890625, 40.140625, 42.068359375, 43.99609375, 45.923828125, 47.8515625, 49.779296875, 51.70703125, 53.634765625, 55.5625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 13.0, 9.0, 17.0, 23.0, 30.0, 36.0, 35.0, 61.0, 84.0, 105.0, 167.0, 228.0, 284.0, 421.0, 548.0, 774.0, 1135.0, 1600.0, 2503.0, 3566.0, 5647.0, 9168.0, 15667.0, 29568.0, 67482.0, 222816.0, 456049.0, 127452.0, 46201.0, 22267.0, 12320.0, 7594.0, 4639.0, 3044.0, 2071.0, 1465.0, 949.0, 690.0, 484.0, 354.0, 249.0, 207.0, 143.0, 97.0, 74.0, 56.0, 40.0, 33.0, 25.0, 14.0, 16.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0], "bins": [-12.0703125, -11.707763671875, -11.34521484375, -10.982666015625, -10.6201171875, -10.257568359375, -9.89501953125, -9.532470703125, -9.169921875, -8.807373046875, -8.44482421875, -8.082275390625, -7.7197265625, -7.357177734375, -6.99462890625, -6.632080078125, -6.26953125, -5.906982421875, -5.54443359375, -5.181884765625, -4.8193359375, -4.456787109375, -4.09423828125, -3.731689453125, -3.369140625, -3.006591796875, -2.64404296875, -2.281494140625, -1.9189453125, -1.556396484375, -1.19384765625, -0.831298828125, -0.46875, -0.106201171875, 0.25634765625, 0.618896484375, 0.9814453125, 1.343994140625, 1.70654296875, 2.069091796875, 2.431640625, 2.794189453125, 3.15673828125, 3.519287109375, 3.8818359375, 4.244384765625, 4.60693359375, 4.969482421875, 5.33203125, 5.694580078125, 6.05712890625, 6.419677734375, 6.7822265625, 7.144775390625, 7.50732421875, 7.869873046875, 8.232421875, 8.594970703125, 8.95751953125, 9.320068359375, 9.6826171875, 10.045166015625, 10.40771484375, 10.770263671875, 11.1328125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 1.0, 10.0, 4.0, 13.0, 16.0, 15.0, 29.0, 30.0, 54.0, 72.0, 86.0, 151.0, 124.0, 99.0, 66.0, 57.0, 35.0, 26.0, 21.0, 17.0, 10.0, 11.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002166748046875, -0.002094268798828125, -0.00202178955078125, -0.001949310302734375, -0.0018768310546875, -0.001804351806640625, -0.00173187255859375, -0.001659393310546875, -0.0015869140625, -0.001514434814453125, -0.00144195556640625, -0.001369476318359375, -0.0012969970703125, -0.001224517822265625, -0.00115203857421875, -0.001079559326171875, -0.001007080078125, -0.000934600830078125, -0.00086212158203125, -0.000789642333984375, -0.0007171630859375, -0.000644683837890625, -0.00057220458984375, -0.000499725341796875, -0.00042724609375, -0.000354766845703125, -0.00028228759765625, -0.000209808349609375, -0.0001373291015625, -6.4849853515625e-05, 7.62939453125e-06, 8.0108642578125e-05, 0.000152587890625, 0.000225067138671875, 0.00029754638671875, 0.000370025634765625, 0.0004425048828125, 0.000514984130859375, 0.00058746337890625, 0.000659942626953125, 0.000732421875, 0.000804901123046875, 0.00087738037109375, 0.000949859619140625, 0.0010223388671875, 0.001094818115234375, 0.00116729736328125, 0.001239776611328125, 0.001312255859375, 0.001384735107421875, 0.00145721435546875, 0.001529693603515625, 0.0016021728515625, 0.001674652099609375, 0.00174713134765625, 0.001819610595703125, 0.00189208984375, 0.001964569091796875, 0.00203704833984375, 0.002109527587890625, 0.0021820068359375, 0.002254486083984375, 0.00232696533203125, 0.002399444580078125, 0.002471923828125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 17.0, 17.0, 22.0, 39.0, 48.0, 54.0, 93.0, 127.0, 182.0, 279.0, 434.0, 643.0, 1033.0, 1775.0, 3135.0, 6117.0, 12646.0, 29756.0, 93801.0, 516332.0, 279476.0, 59816.0, 21427.0, 9715.0, 4889.0, 2545.0, 1530.0, 916.0, 531.0, 354.0, 247.0, 159.0, 127.0, 73.0, 46.0, 44.0, 33.0, 19.0, 16.0, 11.0, 6.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.96875, -14.449462890625, -13.93017578125, -13.410888671875, -12.8916015625, -12.372314453125, -11.85302734375, -11.333740234375, -10.814453125, -10.295166015625, -9.77587890625, -9.256591796875, -8.7373046875, -8.218017578125, -7.69873046875, -7.179443359375, -6.66015625, -6.140869140625, -5.62158203125, -5.102294921875, -4.5830078125, -4.063720703125, -3.54443359375, -3.025146484375, -2.505859375, -1.986572265625, -1.46728515625, -0.947998046875, -0.4287109375, 0.090576171875, 0.60986328125, 1.129150390625, 1.6484375, 2.167724609375, 2.68701171875, 3.206298828125, 3.7255859375, 4.244873046875, 4.76416015625, 5.283447265625, 5.802734375, 6.322021484375, 6.84130859375, 7.360595703125, 7.8798828125, 8.399169921875, 8.91845703125, 9.437744140625, 9.95703125, 10.476318359375, 10.99560546875, 11.514892578125, 12.0341796875, 12.553466796875, 13.07275390625, 13.592041015625, 14.111328125, 14.630615234375, 15.14990234375, 15.669189453125, 16.1884765625, 16.707763671875, 17.22705078125, 17.746337890625, 18.265625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 8.0, 18.0, 11.0, 11.0, 21.0, 28.0, 42.0, 54.0, 99.0, 135.0, 131.0, 116.0, 78.0, 60.0, 46.0, 33.0, 17.0, 17.0, 13.0, 10.0, 8.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.82421875, -3.69378662109375, -3.5633544921875, -3.43292236328125, -3.302490234375, -3.17205810546875, -3.0416259765625, -2.91119384765625, -2.78076171875, -2.65032958984375, -2.5198974609375, -2.38946533203125, -2.259033203125, -2.12860107421875, -1.9981689453125, -1.86773681640625, -1.7373046875, -1.60687255859375, -1.4764404296875, -1.34600830078125, -1.215576171875, -1.08514404296875, -0.9547119140625, -0.82427978515625, -0.69384765625, -0.56341552734375, -0.4329833984375, -0.30255126953125, -0.172119140625, -0.04168701171875, 0.0887451171875, 0.21917724609375, 0.349609375, 0.48004150390625, 0.6104736328125, 0.74090576171875, 0.871337890625, 1.00177001953125, 1.1322021484375, 1.26263427734375, 1.39306640625, 1.52349853515625, 1.6539306640625, 1.78436279296875, 1.914794921875, 2.04522705078125, 2.1756591796875, 2.30609130859375, 2.4365234375, 2.56695556640625, 2.6973876953125, 2.82781982421875, 2.958251953125, 3.08868408203125, 3.2191162109375, 3.34954833984375, 3.47998046875, 3.61041259765625, 3.7408447265625, 3.87127685546875, 4.001708984375, 4.13214111328125, 4.2625732421875, 4.39300537109375, 4.5234375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 5.0, 13.0, 14.0, 13.0, 27.0, 29.0, 23.0, 42.0, 55.0, 67.0, 80.0, 96.0, 93.0, 75.0, 61.0, 72.0, 50.0, 32.0, 37.0, 16.0, 14.0, 13.0, 13.0, 11.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-144.6463623046875, -140.0290069580078, -135.4116668701172, -130.7943115234375, -126.17695617675781, -121.55960845947266, -116.9422607421875, -112.32490539550781, -107.70755004882812, -103.09020233154297, -98.47284698486328, -93.85549926757812, -89.23814392089844, -84.62079620361328, -80.00344848632812, -75.38609313964844, -70.76874542236328, -66.15139770507812, -61.53404235839844, -56.91669464111328, -52.299339294433594, -47.68199157714844, -43.064640045166016, -38.447288513183594, -33.82993698120117, -29.21258544921875, -24.595233917236328, -19.97788429260254, -15.360532760620117, -10.743181228637695, -6.125831604003906, -1.5084800720214844, 3.1088714599609375, 7.726222515106201, 12.343573570251465, 16.96092414855957, 21.578275680541992, 26.195627212524414, 30.812976837158203, 35.430328369140625, 40.04767990112305, 44.66503143310547, 49.28238296508789, 53.89973449707031, 58.51708221435547, 63.134437561035156, 67.75178527832031, 72.369140625, 76.98648834228516, 81.60383605957031, 86.22119140625, 90.83853912353516, 95.45589447021484, 100.0732421875, 104.69059753417969, 109.30794525146484, 113.92529296875, 118.54264068603516, 123.15999603271484, 127.77734375, 132.3946990966797, 137.01205444335938, 141.62939453125, 146.2467498779297, 150.86410522460938]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 10.0, 9.0, 18.0, 15.0, 12.0, 27.0, 15.0, 22.0, 16.0, 32.0, 42.0, 32.0, 34.0, 45.0, 38.0, 50.0, 30.0, 41.0, 33.0, 41.0, 45.0, 34.0, 37.0, 28.0, 23.0, 26.0, 29.0, 27.0, 21.0, 20.0, 26.0, 14.0, 17.0, 14.0, 12.0, 8.0, 12.0, 6.0, 6.0, 5.0, 7.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-94.72086334228516, -91.71656799316406, -88.71227264404297, -85.70797729492188, -82.70368957519531, -79.69939422607422, -76.69509887695312, -73.69080352783203, -70.68650817871094, -67.68221282958984, -64.67791748046875, -61.67362594604492, -58.66933059692383, -55.6650390625, -52.660743713378906, -49.65644836425781, -46.652156829833984, -43.64786148071289, -40.64356994628906, -37.63927459716797, -34.634979248046875, -31.630685806274414, -28.626392364501953, -25.62209701538086, -22.6178035736084, -19.613510131835938, -16.609214782714844, -13.604921340942383, -10.600626945495605, -7.596332550048828, -4.592039108276367, -1.5877437591552734, 1.4165496826171875, 4.420844078063965, 7.425137996673584, 10.429431915283203, 13.43372631072998, 16.438020706176758, 19.44231414794922, 22.446609497070312, 25.450902938842773, 28.455196380615234, 31.459491729736328, 34.463783264160156, 37.46807861328125, 40.472373962402344, 43.47666931152344, 46.48096466064453, 49.48525619506836, 52.48955154418945, 55.49384307861328, 58.498138427734375, 61.50243377685547, 64.50672912597656, 67.51101684570312, 70.51531982421875, 73.51960754394531, 76.5239028930664, 79.5281982421875, 82.53248596191406, 85.53678131103516, 88.54107666015625, 91.54537200927734, 94.54966735839844, 97.55396270751953]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 9.0, 10.0, 14.0, 19.0, 28.0, 48.0, 98.0, 141.0, 203.0, 280.0, 458.0, 629.0, 944.0, 1386.0, 2077.0, 3299.0, 5090.0, 7888.0, 12349.0, 20020.0, 33432.0, 59457.0, 114260.0, 311261.0, 1308822.0, 1609402.0, 399683.0, 131554.0, 67693.0, 38751.0, 23497.0, 14487.0, 9277.0, 5998.0, 3915.0, 2599.0, 1663.0, 1151.0, 833.0, 561.0, 295.0, 215.0, 162.0, 123.0, 70.0, 48.0, 24.0, 21.0, 6.0, 15.0, 16.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-130.75, -126.09765625, -121.4453125, -116.79296875, -112.140625, -107.48828125, -102.8359375, -98.18359375, -93.53125, -88.87890625, -84.2265625, -79.57421875, -74.921875, -70.26953125, -65.6171875, -60.96484375, -56.3125, -51.66015625, -47.0078125, -42.35546875, -37.703125, -33.05078125, -28.3984375, -23.74609375, -19.09375, -14.44140625, -9.7890625, -5.13671875, -0.484375, 4.16796875, 8.8203125, 13.47265625, 18.125, 22.77734375, 27.4296875, 32.08203125, 36.734375, 41.38671875, 46.0390625, 50.69140625, 55.34375, 59.99609375, 64.6484375, 69.30078125, 73.953125, 78.60546875, 83.2578125, 87.91015625, 92.5625, 97.21484375, 101.8671875, 106.51953125, 111.171875, 115.82421875, 120.4765625, 125.12890625, 129.78125, 134.43359375, 139.0859375, 143.73828125, 148.390625, 153.04296875, 157.6953125, 162.34765625, 167.0]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 4.0, 3.0, 10.0, 14.0, 11.0, 20.0, 14.0, 10.0, 23.0, 26.0, 23.0, 30.0, 41.0, 32.0, 31.0, 28.0, 51.0, 40.0, 58.0, 32.0, 34.0, 42.0, 41.0, 30.0, 40.0, 28.0, 24.0, 28.0, 17.0, 26.0, 26.0, 24.0, 22.0, 24.0, 15.0, 12.0, 12.0, 10.0, 8.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.25, -56.25, -54.25, -52.25, -50.25, -48.25, -46.25, -44.25, -42.25, -40.25, -38.25, -36.25, -34.25, -32.25, -30.25, -28.25, -26.25, -24.25, -22.25, -20.25, -18.25, -16.25, -14.25, -12.25, -10.25, -8.25, -6.25, -4.25, -2.25, -0.25, 1.75, 3.75, 5.75, 7.75, 9.75, 11.75, 13.75, 15.75, 17.75, 19.75, 21.75, 23.75, 25.75, 27.75, 29.75, 31.75, 33.75, 35.75, 37.75, 39.75, 41.75, 43.75, 45.75, 47.75, 49.75, 51.75, 53.75, 55.75, 57.75, 59.75, 61.75, 63.75, 65.75, 67.75, 69.75]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 10.0, 18.0, 35.0, 39.0, 69.0, 102.0, 157.0, 253.0, 380.0, 606.0, 1087.0, 1805.0, 2968.0, 5143.0, 9193.0, 16274.0, 30001.0, 57602.0, 118046.0, 265436.0, 726038.0, 1842544.0, 645126.0, 242892.0, 110075.0, 54069.0, 28530.0, 15232.0, 8542.0, 4917.0, 2822.0, 1651.0, 989.0, 605.0, 359.0, 220.0, 167.0, 93.0, 64.0, 38.0, 23.0, 17.0, 16.0, 12.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-148.5, -144.060546875, -139.62109375, -135.181640625, -130.7421875, -126.302734375, -121.86328125, -117.423828125, -112.984375, -108.544921875, -104.10546875, -99.666015625, -95.2265625, -90.787109375, -86.34765625, -81.908203125, -77.46875, -73.029296875, -68.58984375, -64.150390625, -59.7109375, -55.271484375, -50.83203125, -46.392578125, -41.953125, -37.513671875, -33.07421875, -28.634765625, -24.1953125, -19.755859375, -15.31640625, -10.876953125, -6.4375, -1.998046875, 2.44140625, 6.880859375, 11.3203125, 15.759765625, 20.19921875, 24.638671875, 29.078125, 33.517578125, 37.95703125, 42.396484375, 46.8359375, 51.275390625, 55.71484375, 60.154296875, 64.59375, 69.033203125, 73.47265625, 77.912109375, 82.3515625, 86.791015625, 91.23046875, 95.669921875, 100.109375, 104.548828125, 108.98828125, 113.427734375, 117.8671875, 122.306640625, 126.74609375, 131.185546875, 135.625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 4.0, 8.0, 9.0, 14.0, 16.0, 29.0, 25.0, 45.0, 46.0, 49.0, 90.0, 101.0, 108.0, 116.0, 197.0, 237.0, 275.0, 441.0, 524.0, 407.0, 307.0, 217.0, 169.0, 135.0, 106.0, 82.0, 62.0, 54.0, 42.0, 33.0, 29.0, 27.0, 16.0, 19.0, 11.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-46.03125, -44.6533203125, -43.275390625, -41.8974609375, -40.51953125, -39.1416015625, -37.763671875, -36.3857421875, -35.0078125, -33.6298828125, -32.251953125, -30.8740234375, -29.49609375, -28.1181640625, -26.740234375, -25.3623046875, -23.984375, -22.6064453125, -21.228515625, -19.8505859375, -18.47265625, -17.0947265625, -15.716796875, -14.3388671875, -12.9609375, -11.5830078125, -10.205078125, -8.8271484375, -7.44921875, -6.0712890625, -4.693359375, -3.3154296875, -1.9375, -0.5595703125, 0.818359375, 2.1962890625, 3.57421875, 4.9521484375, 6.330078125, 7.7080078125, 9.0859375, 10.4638671875, 11.841796875, 13.2197265625, 14.59765625, 15.9755859375, 17.353515625, 18.7314453125, 20.109375, 21.4873046875, 22.865234375, 24.2431640625, 25.62109375, 26.9990234375, 28.376953125, 29.7548828125, 31.1328125, 32.5107421875, 33.888671875, 35.2666015625, 36.64453125, 38.0224609375, 39.400390625, 40.7783203125, 42.15625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 12.0, 11.0, 13.0, 23.0, 19.0, 24.0, 40.0, 51.0, 52.0, 74.0, 71.0, 94.0, 99.0, 75.0, 59.0, 62.0, 41.0, 33.0, 29.0, 23.0, 22.0, 15.0, 6.0, 10.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.58313751220703, -93.12688446044922, -89.67062377929688, -86.21437072753906, -82.75811004638672, -79.3018569946289, -75.84559631347656, -72.38934326171875, -68.93309020996094, -65.47683715820312, -62.02057647705078, -58.56432342529297, -55.108062744140625, -51.65180969238281, -48.195552825927734, -44.739295959472656, -41.28303527832031, -37.826778411865234, -34.370521545410156, -30.91426658630371, -27.458009719848633, -24.001752853393555, -20.54549789428711, -17.08924102783203, -13.632984161376953, -10.176727294921875, -6.720471382141113, -3.2642154693603516, 0.19204139709472656, 3.6482982635498047, 7.10455322265625, 10.560810089111328, 14.017059326171875, 17.473316192626953, 20.92957305908203, 24.385828018188477, 27.842084884643555, 31.298341751098633, 34.75459671020508, 38.210853576660156, 41.667110443115234, 45.12336730957031, 48.57962417602539, 52.03588104248047, 55.49213409423828, 58.948394775390625, 62.40464782714844, 65.86090087890625, 69.3171615600586, 72.7734146118164, 76.22967529296875, 79.68592834472656, 83.1421890258789, 86.59844207763672, 90.05470275878906, 93.51095581054688, 96.96720886230469, 100.4234619140625, 103.87972259521484, 107.33597564697266, 110.792236328125, 114.24848937988281, 117.70474243164062, 121.16100311279297, 124.61726379394531]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 6.0, 10.0, 6.0, 4.0, 17.0, 5.0, 14.0, 22.0, 16.0, 15.0, 25.0, 31.0, 29.0, 30.0, 39.0, 40.0, 37.0, 31.0, 39.0, 41.0, 38.0, 38.0, 34.0, 35.0, 40.0, 40.0, 28.0, 30.0, 33.0, 27.0, 32.0, 22.0, 25.0, 19.0, 18.0, 19.0, 14.0, 11.0, 7.0, 8.0, 8.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.09126281738281, -61.96525192260742, -59.839237213134766, -57.713226318359375, -55.58721160888672, -53.46120071411133, -51.33518981933594, -49.20917510986328, -47.08316421508789, -44.9571533203125, -42.831138610839844, -40.70512771606445, -38.57911682128906, -36.453102111816406, -34.327091217041016, -32.201080322265625, -30.07506561279297, -27.949052810668945, -25.823040008544922, -23.69702911376953, -21.571016311645508, -19.445003509521484, -17.318992614746094, -15.19297981262207, -13.066967010498047, -10.940954208374023, -8.814942359924316, -6.688930034637451, -4.562917709350586, -2.4369049072265625, -0.31089305877685547, 1.8151187896728516, 3.941131591796875, 6.06714391708374, 8.193156242370605, 10.319168090820312, 12.445180892944336, 14.57119369506836, 16.69720458984375, 18.823217391967773, 20.949230194091797, 23.07524299621582, 25.201255798339844, 27.327266693115234, 29.453279495239258, 31.57929229736328, 33.70530319213867, 35.83131408691406, 37.95732879638672, 40.08333969116211, 42.209354400634766, 44.335365295410156, 46.46138000488281, 48.5873908996582, 50.713401794433594, 52.83941650390625, 54.96542739868164, 57.09143829345703, 59.21745300292969, 61.34346389770508, 63.46947479248047, 65.59548950195312, 67.72150421142578, 69.8475112915039, 71.97352600097656]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 7.0, 14.0, 17.0, 35.0, 41.0, 69.0, 92.0, 158.0, 218.0, 398.0, 577.0, 931.0, 1443.0, 2290.0, 3668.0, 6040.0, 9861.0, 16327.0, 27532.0, 46484.0, 79748.0, 137162.0, 232664.0, 201495.0, 115401.0, 66807.0, 39294.0, 23472.0, 14082.0, 8424.0, 5240.0, 3133.0, 1983.0, 1228.0, 790.0, 539.0, 307.0, 226.0, 127.0, 73.0, 53.0, 45.0, 21.0, 17.0, 10.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-52.21875, -50.67578125, -49.1328125, -47.58984375, -46.046875, -44.50390625, -42.9609375, -41.41796875, -39.875, -38.33203125, -36.7890625, -35.24609375, -33.703125, -32.16015625, -30.6171875, -29.07421875, -27.53125, -25.98828125, -24.4453125, -22.90234375, -21.359375, -19.81640625, -18.2734375, -16.73046875, -15.1875, -13.64453125, -12.1015625, -10.55859375, -9.015625, -7.47265625, -5.9296875, -4.38671875, -2.84375, -1.30078125, 0.2421875, 1.78515625, 3.328125, 4.87109375, 6.4140625, 7.95703125, 9.5, 11.04296875, 12.5859375, 14.12890625, 15.671875, 17.21484375, 18.7578125, 20.30078125, 21.84375, 23.38671875, 24.9296875, 26.47265625, 28.015625, 29.55859375, 31.1015625, 32.64453125, 34.1875, 35.73046875, 37.2734375, 38.81640625, 40.359375, 41.90234375, 43.4453125, 44.98828125, 46.53125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 5.0, 6.0, 8.0, 12.0, 10.0, 11.0, 12.0, 21.0, 27.0, 18.0, 17.0, 37.0, 24.0, 27.0, 25.0, 27.0, 48.0, 33.0, 41.0, 34.0, 49.0, 31.0, 36.0, 30.0, 43.0, 32.0, 31.0, 30.0, 32.0, 26.0, 27.0, 24.0, 27.0, 21.0, 21.0, 18.0, 13.0, 8.0, 11.0, 6.0, 7.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-64.0, -62.01171875, -60.0234375, -58.03515625, -56.046875, -54.05859375, -52.0703125, -50.08203125, -48.09375, -46.10546875, -44.1171875, -42.12890625, -40.140625, -38.15234375, -36.1640625, -34.17578125, -32.1875, -30.19921875, -28.2109375, -26.22265625, -24.234375, -22.24609375, -20.2578125, -18.26953125, -16.28125, -14.29296875, -12.3046875, -10.31640625, -8.328125, -6.33984375, -4.3515625, -2.36328125, -0.375, 1.61328125, 3.6015625, 5.58984375, 7.578125, 9.56640625, 11.5546875, 13.54296875, 15.53125, 17.51953125, 19.5078125, 21.49609375, 23.484375, 25.47265625, 27.4609375, 29.44921875, 31.4375, 33.42578125, 35.4140625, 37.40234375, 39.390625, 41.37890625, 43.3671875, 45.35546875, 47.34375, 49.33203125, 51.3203125, 53.30859375, 55.296875, 57.28515625, 59.2734375, 61.26171875, 63.25]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 9.0, 9.0, 19.0, 27.0, 49.0, 81.0, 101.0, 134.0, 217.0, 362.0, 565.0, 912.0, 1481.0, 2370.0, 3927.0, 6785.0, 11897.0, 21819.0, 41028.0, 81662.0, 175641.0, 344394.0, 179146.0, 83250.0, 41451.0, 21806.0, 12074.0, 6800.0, 4072.0, 2411.0, 1435.0, 978.0, 584.0, 372.0, 222.0, 146.0, 88.0, 75.0, 47.0, 37.0, 20.0, 15.0, 12.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.71875, -46.2509765625, -44.783203125, -43.3154296875, -41.84765625, -40.3798828125, -38.912109375, -37.4443359375, -35.9765625, -34.5087890625, -33.041015625, -31.5732421875, -30.10546875, -28.6376953125, -27.169921875, -25.7021484375, -24.234375, -22.7666015625, -21.298828125, -19.8310546875, -18.36328125, -16.8955078125, -15.427734375, -13.9599609375, -12.4921875, -11.0244140625, -9.556640625, -8.0888671875, -6.62109375, -5.1533203125, -3.685546875, -2.2177734375, -0.75, 0.7177734375, 2.185546875, 3.6533203125, 5.12109375, 6.5888671875, 8.056640625, 9.5244140625, 10.9921875, 12.4599609375, 13.927734375, 15.3955078125, 16.86328125, 18.3310546875, 19.798828125, 21.2666015625, 22.734375, 24.2021484375, 25.669921875, 27.1376953125, 28.60546875, 30.0732421875, 31.541015625, 33.0087890625, 34.4765625, 35.9443359375, 37.412109375, 38.8798828125, 40.34765625, 41.8154296875, 43.283203125, 44.7509765625, 46.21875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 3.0, 10.0, 4.0, 7.0, 6.0, 8.0, 10.0, 8.0, 9.0, 28.0, 17.0, 20.0, 18.0, 27.0, 32.0, 29.0, 34.0, 26.0, 38.0, 44.0, 33.0, 24.0, 45.0, 35.0, 29.0, 38.0, 47.0, 40.0, 45.0, 40.0, 33.0, 19.0, 28.0, 21.0, 19.0, 25.0, 16.0, 18.0, 17.0, 14.0, 7.0, 5.0, 5.0, 5.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.25, -37.93994140625, -36.6298828125, -35.31982421875, -34.009765625, -32.69970703125, -31.3896484375, -30.07958984375, -28.76953125, -27.45947265625, -26.1494140625, -24.83935546875, -23.529296875, -22.21923828125, -20.9091796875, -19.59912109375, -18.2890625, -16.97900390625, -15.6689453125, -14.35888671875, -13.048828125, -11.73876953125, -10.4287109375, -9.11865234375, -7.80859375, -6.49853515625, -5.1884765625, -3.87841796875, -2.568359375, -1.25830078125, 0.0517578125, 1.36181640625, 2.671875, 3.98193359375, 5.2919921875, 6.60205078125, 7.912109375, 9.22216796875, 10.5322265625, 11.84228515625, 13.15234375, 14.46240234375, 15.7724609375, 17.08251953125, 18.392578125, 19.70263671875, 21.0126953125, 22.32275390625, 23.6328125, 24.94287109375, 26.2529296875, 27.56298828125, 28.873046875, 30.18310546875, 31.4931640625, 32.80322265625, 34.11328125, 35.42333984375, 36.7333984375, 38.04345703125, 39.353515625, 40.66357421875, 41.9736328125, 43.28369140625, 44.59375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 9.0, 23.0, 27.0, 28.0, 60.0, 73.0, 134.0, 190.0, 308.0, 510.0, 862.0, 1415.0, 2771.0, 5283.0, 11417.0, 27429.0, 81079.0, 329339.0, 428331.0, 100115.0, 32638.0, 13309.0, 6051.0, 3027.0, 1686.0, 967.0, 526.0, 340.0, 207.0, 140.0, 75.0, 54.0, 37.0, 28.0, 15.0, 10.0, 10.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54150390625, -0.52288818359375, -0.5042724609375, -0.48565673828125, -0.467041015625, -0.44842529296875, -0.4298095703125, -0.41119384765625, -0.392578125, -0.37396240234375, -0.3553466796875, -0.33673095703125, -0.318115234375, -0.29949951171875, -0.2808837890625, -0.26226806640625, -0.24365234375, -0.22503662109375, -0.2064208984375, -0.18780517578125, -0.169189453125, -0.15057373046875, -0.1319580078125, -0.11334228515625, -0.0947265625, -0.07611083984375, -0.0574951171875, -0.03887939453125, -0.020263671875, -0.00164794921875, 0.0169677734375, 0.03558349609375, 0.05419921875, 0.07281494140625, 0.0914306640625, 0.11004638671875, 0.128662109375, 0.14727783203125, 0.1658935546875, 0.18450927734375, 0.203125, 0.22174072265625, 0.2403564453125, 0.25897216796875, 0.277587890625, 0.29620361328125, 0.3148193359375, 0.33343505859375, 0.35205078125, 0.37066650390625, 0.3892822265625, 0.40789794921875, 0.426513671875, 0.44512939453125, 0.4637451171875, 0.48236083984375, 0.5009765625, 0.51959228515625, 0.5382080078125, 0.55682373046875, 0.575439453125, 0.59405517578125, 0.6126708984375, 0.63128662109375, 0.64990234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 3.0, 2.0, 5.0, 6.0, 6.0, 6.0, 16.0, 9.0, 16.0, 21.0, 33.0, 52.0, 61.0, 70.0, 82.0, 104.0, 97.0, 92.0, 76.0, 65.0, 28.0, 36.0, 22.0, 21.0, 17.0, 16.0, 9.0, 7.0, 6.0, 7.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00022995471954345703, -0.00022314675152301788, -0.00021633878350257874, -0.0002095308154821396, -0.00020272284746170044, -0.0001959148794412613, -0.00018910691142082214, -0.000182298943400383, -0.00017549097537994385, -0.0001686830073595047, -0.00016187503933906555, -0.0001550670713186264, -0.00014825910329818726, -0.0001414511352777481, -0.00013464316725730896, -0.0001278351992368698, -0.00012102723121643066, -0.00011421926319599152, -0.00010741129517555237, -0.00010060332715511322, -9.379535913467407e-05, -8.698739111423492e-05, -8.017942309379578e-05, -7.337145507335663e-05, -6.656348705291748e-05, -5.975551903247833e-05, -5.2947551012039185e-05, -4.613958299160004e-05, -3.933161497116089e-05, -3.252364695072174e-05, -2.5715678930282593e-05, -1.8907710909843445e-05, -1.2099742889404297e-05, -5.291774868965149e-06, 1.516193151473999e-06, 8.324161171913147e-06, 1.5132129192352295e-05, 2.1940097212791443e-05, 2.874806523323059e-05, 3.555603325366974e-05, 4.236400127410889e-05, 4.9171969294548035e-05, 5.597993731498718e-05, 6.278790533542633e-05, 6.959587335586548e-05, 7.640384137630463e-05, 8.321180939674377e-05, 9.001977741718292e-05, 9.682774543762207e-05, 0.00010363571345806122, 0.00011044368147850037, 0.00011725164949893951, 0.00012405961751937866, 0.0001308675855398178, 0.00013767555356025696, 0.0001444835215806961, 0.00015129148960113525, 0.0001580994576215744, 0.00016490742564201355, 0.0001717153936624527, 0.00017852336168289185, 0.000185331329703331, 0.00019213929772377014, 0.0001989472657442093, 0.00020575523376464844]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 7.0, 8.0, 21.0, 17.0, 30.0, 62.0, 57.0, 83.0, 157.0, 235.0, 313.0, 500.0, 714.0, 1150.0, 1835.0, 3087.0, 4885.0, 8402.0, 14834.0, 28159.0, 57521.0, 130495.0, 325689.0, 262221.0, 105214.0, 47312.0, 23740.0, 12883.0, 7352.0, 4204.0, 2635.0, 1616.0, 1037.0, 668.0, 448.0, 306.0, 219.0, 126.0, 81.0, 68.0, 40.0, 30.0, 25.0, 23.0, 11.0, 12.0, 8.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.4443359375, -0.4319496154785156, -0.41956329345703125, -0.4071769714355469, -0.3947906494140625, -0.3824043273925781, -0.37001800537109375, -0.3576316833496094, -0.345245361328125, -0.3328590393066406, -0.32047271728515625, -0.3080863952636719, -0.2957000732421875, -0.2833137512207031, -0.27092742919921875, -0.2585411071777344, -0.24615478515625, -0.23376846313476562, -0.22138214111328125, -0.20899581909179688, -0.1966094970703125, -0.18422317504882812, -0.17183685302734375, -0.15945053100585938, -0.147064208984375, -0.13467788696289062, -0.12229156494140625, -0.10990524291992188, -0.0975189208984375, -0.08513259887695312, -0.07274627685546875, -0.060359954833984375, -0.0479736328125, -0.035587310791015625, -0.02320098876953125, -0.010814666748046875, 0.0015716552734375, 0.013957977294921875, 0.02634429931640625, 0.038730621337890625, 0.051116943359375, 0.06350326538085938, 0.07588958740234375, 0.08827590942382812, 0.1006622314453125, 0.11304855346679688, 0.12543487548828125, 0.13782119750976562, 0.15020751953125, 0.16259384155273438, 0.17498016357421875, 0.18736648559570312, 0.1997528076171875, 0.21213912963867188, 0.22452545166015625, 0.23691177368164062, 0.249298095703125, 0.2616844177246094, 0.27407073974609375, 0.2864570617675781, 0.2988433837890625, 0.3112297058105469, 0.32361602783203125, 0.3360023498535156, 0.348388671875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 6.0, 6.0, 9.0, 11.0, 17.0, 25.0, 28.0, 36.0, 49.0, 43.0, 90.0, 60.0, 89.0, 85.0, 88.0, 53.0, 67.0, 48.0, 37.0, 27.0, 23.0, 25.0, 13.0, 10.0, 9.0, 6.0, 10.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.142333984375, -0.1385974884033203, -0.13486099243164062, -0.13112449645996094, -0.12738800048828125, -0.12365150451660156, -0.11991500854492188, -0.11617851257324219, -0.1124420166015625, -0.10870552062988281, -0.10496902465820312, -0.10123252868652344, -0.09749603271484375, -0.09375953674316406, -0.09002304077148438, -0.08628654479980469, -0.082550048828125, -0.07881355285644531, -0.07507705688476562, -0.07134056091308594, -0.06760406494140625, -0.06386756896972656, -0.060131072998046875, -0.05639457702636719, -0.0526580810546875, -0.04892158508300781, -0.045185089111328125, -0.04144859313964844, -0.03771209716796875, -0.03397560119628906, -0.030239105224609375, -0.026502609252929688, -0.02276611328125, -0.019029617309570312, -0.015293121337890625, -0.011556625366210938, -0.00782012939453125, -0.0040836334228515625, -0.000347137451171875, 0.0033893585205078125, 0.0071258544921875, 0.010862350463867188, 0.014598846435546875, 0.018335342407226562, 0.02207183837890625, 0.025808334350585938, 0.029544830322265625, 0.03328132629394531, 0.037017822265625, 0.04075431823730469, 0.044490814208984375, 0.04822731018066406, 0.05196380615234375, 0.05570030212402344, 0.059436798095703125, 0.06317329406738281, 0.0669097900390625, 0.07064628601074219, 0.07438278198242188, 0.07811927795410156, 0.08185577392578125, 0.08559226989746094, 0.08932876586914062, 0.09306526184082031, 0.0968017578125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 7.0, 12.0, 8.0, 21.0, 29.0, 27.0, 38.0, 49.0, 67.0, 69.0, 88.0, 95.0, 90.0, 89.0, 63.0, 42.0, 44.0, 26.0, 27.0, 27.0, 14.0, 11.0, 10.0, 5.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.76143646240234, -93.48902893066406, -90.21661376953125, -86.94419860839844, -83.67179107666016, -80.39938354492188, -77.12696838378906, -73.85455322265625, -70.58214569091797, -67.30973815917969, -64.03732299804688, -60.76491165161133, -57.49250030517578, -54.220088958740234, -50.94767761230469, -47.67526626586914, -44.402854919433594, -41.13044357299805, -37.8580322265625, -34.58562088012695, -31.313209533691406, -28.04079818725586, -24.768386840820312, -21.495975494384766, -18.22356414794922, -14.951152801513672, -11.678741455078125, -8.406330108642578, -5.133918762207031, -1.8615074157714844, 1.4109039306640625, 4.683315277099609, 7.955726623535156, 11.228137969970703, 14.50054931640625, 17.772960662841797, 21.045372009277344, 24.31778335571289, 27.590194702148438, 30.862606048583984, 34.13501739501953, 37.40742874145508, 40.679840087890625, 43.95225143432617, 47.22466278076172, 50.497074127197266, 53.76948547363281, 57.04189682006836, 60.314308166503906, 63.58671951293945, 66.859130859375, 70.13154602050781, 73.4039535522461, 76.67636108398438, 79.94877624511719, 83.22119140625, 86.49359893798828, 89.76600646972656, 93.03842163085938, 96.31083679199219, 99.58324432373047, 102.85565185546875, 106.12806701660156, 109.40048217773438, 112.67288970947266]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 12.0, 6.0, 6.0, 13.0, 8.0, 17.0, 17.0, 19.0, 14.0, 23.0, 32.0, 30.0, 28.0, 41.0, 42.0, 33.0, 38.0, 31.0, 43.0, 42.0, 38.0, 30.0, 34.0, 41.0, 36.0, 37.0, 23.0, 34.0, 29.0, 30.0, 22.0, 22.0, 21.0, 21.0, 19.0, 12.0, 12.0, 8.0, 7.0, 8.0, 2.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.92499923706055, -56.97076416015625, -55.01652526855469, -53.06229019165039, -51.10805130004883, -49.15381622314453, -47.19957733154297, -45.24534225463867, -43.291107177734375, -41.33687210083008, -39.382633209228516, -37.42839813232422, -35.474159240722656, -33.51992416381836, -31.56568717956543, -29.6114501953125, -27.657211303710938, -25.702974319458008, -23.748737335205078, -21.79450225830078, -19.84026336669922, -17.886028289794922, -15.931791305541992, -13.977554321289062, -12.023317337036133, -10.069080352783203, -8.114843368530273, -6.16060733795166, -4.2063703536987305, -2.252133369445801, -0.2978973388671875, 1.6563396453857422, 3.6105804443359375, 5.564817428588867, 7.519053936004639, 9.47329044342041, 11.42752742767334, 13.38176441192627, 15.336000442504883, 17.290237426757812, 19.244474411010742, 21.198711395263672, 23.1529483795166, 25.10718536376953, 27.061420440673828, 29.01565933227539, 30.969894409179688, 32.92413330078125, 34.87836837768555, 36.832603454589844, 38.786842346191406, 40.7410774230957, 42.695316314697266, 44.64955139160156, 46.603790283203125, 48.55802536010742, 50.51226043701172, 52.466495513916016, 54.42073440551758, 56.374969482421875, 58.32920837402344, 60.283443450927734, 62.23767852783203, 64.1919174194336, 66.14615631103516]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 6.0, 14.0, 30.0, 32.0, 40.0, 66.0, 99.0, 168.0, 201.0, 344.0, 488.0, 753.0, 1246.0, 1854.0, 2760.0, 4306.0, 6638.0, 10408.0, 15956.0, 25865.0, 41598.0, 67986.0, 113152.0, 172687.0, 196149.0, 147593.0, 91088.0, 54793.0, 33441.0, 21053.0, 13236.0, 8588.0, 5602.0, 3509.0, 2366.0, 1537.0, 968.0, 626.0, 445.0, 297.0, 201.0, 129.0, 75.0, 54.0, 37.0, 27.0, 14.0, 6.0, 11.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-109.9375, -106.5322265625, -103.126953125, -99.7216796875, -96.31640625, -92.9111328125, -89.505859375, -86.1005859375, -82.6953125, -79.2900390625, -75.884765625, -72.4794921875, -69.07421875, -65.6689453125, -62.263671875, -58.8583984375, -55.453125, -52.0478515625, -48.642578125, -45.2373046875, -41.83203125, -38.4267578125, -35.021484375, -31.6162109375, -28.2109375, -24.8056640625, -21.400390625, -17.9951171875, -14.58984375, -11.1845703125, -7.779296875, -4.3740234375, -0.96875, 2.4365234375, 5.841796875, 9.2470703125, 12.65234375, 16.0576171875, 19.462890625, 22.8681640625, 26.2734375, 29.6787109375, 33.083984375, 36.4892578125, 39.89453125, 43.2998046875, 46.705078125, 50.1103515625, 53.515625, 56.9208984375, 60.326171875, 63.7314453125, 67.13671875, 70.5419921875, 73.947265625, 77.3525390625, 80.7578125, 84.1630859375, 87.568359375, 90.9736328125, 94.37890625, 97.7841796875, 101.189453125, 104.5947265625, 108.0]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 9.0, 7.0, 8.0, 20.0, 13.0, 23.0, 14.0, 20.0, 24.0, 18.0, 33.0, 33.0, 38.0, 31.0, 47.0, 45.0, 34.0, 43.0, 42.0, 33.0, 44.0, 30.0, 39.0, 32.0, 39.0, 37.0, 35.0, 19.0, 24.0, 27.0, 24.0, 21.0, 16.0, 15.0, 10.0, 10.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-56.53125, -54.86181640625, -53.1923828125, -51.52294921875, -49.853515625, -48.18408203125, -46.5146484375, -44.84521484375, -43.17578125, -41.50634765625, -39.8369140625, -38.16748046875, -36.498046875, -34.82861328125, -33.1591796875, -31.48974609375, -29.8203125, -28.15087890625, -26.4814453125, -24.81201171875, -23.142578125, -21.47314453125, -19.8037109375, -18.13427734375, -16.46484375, -14.79541015625, -13.1259765625, -11.45654296875, -9.787109375, -8.11767578125, -6.4482421875, -4.77880859375, -3.109375, -1.43994140625, 0.2294921875, 1.89892578125, 3.568359375, 5.23779296875, 6.9072265625, 8.57666015625, 10.24609375, 11.91552734375, 13.5849609375, 15.25439453125, 16.923828125, 18.59326171875, 20.2626953125, 21.93212890625, 23.6015625, 25.27099609375, 26.9404296875, 28.60986328125, 30.279296875, 31.94873046875, 33.6181640625, 35.28759765625, 36.95703125, 38.62646484375, 40.2958984375, 41.96533203125, 43.634765625, 45.30419921875, 46.9736328125, 48.64306640625, 50.3125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 26.0, 23.0, 56.0, 72.0, 105.0, 193.0, 285.0, 435.0, 645.0, 915.0, 1368.0, 2087.0, 3037.0, 4579.0, 7004.0, 10512.0, 16050.0, 24587.0, 38182.0, 60302.0, 94376.0, 144219.0, 183440.0, 157343.0, 106264.0, 68175.0, 43254.0, 27863.0, 17833.0, 12040.0, 7834.0, 5164.0, 3309.0, 2310.0, 1574.0, 1040.0, 692.0, 449.0, 327.0, 206.0, 123.0, 89.0, 71.0, 29.0, 24.0, 7.0, 7.0, 5.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-87.0, -84.16015625, -81.3203125, -78.48046875, -75.640625, -72.80078125, -69.9609375, -67.12109375, -64.28125, -61.44140625, -58.6015625, -55.76171875, -52.921875, -50.08203125, -47.2421875, -44.40234375, -41.5625, -38.72265625, -35.8828125, -33.04296875, -30.203125, -27.36328125, -24.5234375, -21.68359375, -18.84375, -16.00390625, -13.1640625, -10.32421875, -7.484375, -4.64453125, -1.8046875, 1.03515625, 3.875, 6.71484375, 9.5546875, 12.39453125, 15.234375, 18.07421875, 20.9140625, 23.75390625, 26.59375, 29.43359375, 32.2734375, 35.11328125, 37.953125, 40.79296875, 43.6328125, 46.47265625, 49.3125, 52.15234375, 54.9921875, 57.83203125, 60.671875, 63.51171875, 66.3515625, 69.19140625, 72.03125, 74.87109375, 77.7109375, 80.55078125, 83.390625, 86.23046875, 89.0703125, 91.91015625, 94.75]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 6.0, 11.0, 20.0, 10.0, 20.0, 20.0, 24.0, 24.0, 26.0, 38.0, 23.0, 34.0, 36.0, 34.0, 34.0, 40.0, 35.0, 45.0, 38.0, 33.0, 31.0, 26.0, 39.0, 37.0, 29.0, 25.0, 27.0, 27.0, 25.0, 23.0, 24.0, 19.0, 13.0, 5.0, 11.0, 15.0, 14.0, 7.0, 8.0, 12.0, 4.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.90625, -28.955322265625, -28.00439453125, -27.053466796875, -26.1025390625, -25.151611328125, -24.20068359375, -23.249755859375, -22.298828125, -21.347900390625, -20.39697265625, -19.446044921875, -18.4951171875, -17.544189453125, -16.59326171875, -15.642333984375, -14.69140625, -13.740478515625, -12.78955078125, -11.838623046875, -10.8876953125, -9.936767578125, -8.98583984375, -8.034912109375, -7.083984375, -6.133056640625, -5.18212890625, -4.231201171875, -3.2802734375, -2.329345703125, -1.37841796875, -0.427490234375, 0.5234375, 1.474365234375, 2.42529296875, 3.376220703125, 4.3271484375, 5.278076171875, 6.22900390625, 7.179931640625, 8.130859375, 9.081787109375, 10.03271484375, 10.983642578125, 11.9345703125, 12.885498046875, 13.83642578125, 14.787353515625, 15.73828125, 16.689208984375, 17.64013671875, 18.591064453125, 19.5419921875, 20.492919921875, 21.44384765625, 22.394775390625, 23.345703125, 24.296630859375, 25.24755859375, 26.198486328125, 27.1494140625, 28.100341796875, 29.05126953125, 30.002197265625, 30.953125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 5.0, 10.0, 20.0, 17.0, 29.0, 42.0, 57.0, 70.0, 104.0, 158.0, 228.0, 286.0, 403.0, 629.0, 936.0, 1366.0, 2147.0, 3280.0, 5324.0, 8831.0, 15940.0, 32653.0, 79113.0, 278852.0, 416548.0, 112000.0, 41673.0, 19793.0, 10656.0, 6217.0, 3785.0, 2405.0, 1591.0, 1063.0, 728.0, 448.0, 344.0, 231.0, 175.0, 105.0, 82.0, 58.0, 50.0, 25.0, 17.0, 20.0, 14.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-11.9921875, -11.6072998046875, -11.222412109375, -10.8375244140625, -10.45263671875, -10.0677490234375, -9.682861328125, -9.2979736328125, -8.9130859375, -8.5281982421875, -8.143310546875, -7.7584228515625, -7.37353515625, -6.9886474609375, -6.603759765625, -6.2188720703125, -5.833984375, -5.4490966796875, -5.064208984375, -4.6793212890625, -4.29443359375, -3.9095458984375, -3.524658203125, -3.1397705078125, -2.7548828125, -2.3699951171875, -1.985107421875, -1.6002197265625, -1.21533203125, -0.8304443359375, -0.445556640625, -0.0606689453125, 0.32421875, 0.7091064453125, 1.093994140625, 1.4788818359375, 1.86376953125, 2.2486572265625, 2.633544921875, 3.0184326171875, 3.4033203125, 3.7882080078125, 4.173095703125, 4.5579833984375, 4.94287109375, 5.3277587890625, 5.712646484375, 6.0975341796875, 6.482421875, 6.8673095703125, 7.252197265625, 7.6370849609375, 8.02197265625, 8.4068603515625, 8.791748046875, 9.1766357421875, 9.5615234375, 9.9464111328125, 10.331298828125, 10.7161865234375, 11.10107421875, 11.4859619140625, 11.870849609375, 12.2557373046875, 12.640625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 11.0, 7.0, 12.0, 11.0, 16.0, 19.0, 23.0, 41.0, 43.0, 66.0, 79.0, 91.0, 116.0, 93.0, 68.0, 67.0, 42.0, 41.0, 33.0, 36.0, 12.0, 13.0, 8.0, 9.0, 11.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00107574462890625, -0.001040816307067871, -0.0010058879852294922, -0.0009709596633911133, -0.0009360313415527344, -0.0009011030197143555, -0.0008661746978759766, -0.0008312463760375977, -0.0007963180541992188, -0.0007613897323608398, -0.0007264614105224609, -0.000691533088684082, -0.0006566047668457031, -0.0006216764450073242, -0.0005867481231689453, -0.0005518198013305664, -0.0005168914794921875, -0.0004819631576538086, -0.0004470348358154297, -0.0004121065139770508, -0.0003771781921386719, -0.00034224987030029297, -0.00030732154846191406, -0.00027239322662353516, -0.00023746490478515625, -0.00020253658294677734, -0.00016760826110839844, -0.00013267993927001953, -9.775161743164062e-05, -6.282329559326172e-05, -2.7894973754882812e-05, 7.033348083496094e-06, 4.1961669921875e-05, 7.68899917602539e-05, 0.00011181831359863281, 0.00014674663543701172, 0.00018167495727539062, 0.00021660327911376953, 0.00025153160095214844, 0.00028645992279052734, 0.00032138824462890625, 0.00035631656646728516, 0.00039124488830566406, 0.00042617321014404297, 0.0004611015319824219, 0.0004960298538208008, 0.0005309581756591797, 0.0005658864974975586, 0.0006008148193359375, 0.0006357431411743164, 0.0006706714630126953, 0.0007055997848510742, 0.0007405281066894531, 0.000775456428527832, 0.0008103847503662109, 0.0008453130722045898, 0.0008802413940429688, 0.0009151697158813477, 0.0009500980377197266, 0.0009850263595581055, 0.0010199546813964844, 0.0010548830032348633, 0.0010898113250732422, 0.001124739646911621, 0.00115966796875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 20.0, 19.0, 27.0, 27.0, 65.0, 85.0, 131.0, 189.0, 310.0, 440.0, 678.0, 1118.0, 1691.0, 2649.0, 4315.0, 6734.0, 11107.0, 19370.0, 36896.0, 82690.0, 254430.0, 389104.0, 125427.0, 49807.0, 24699.0, 14025.0, 8239.0, 5163.0, 3298.0, 2053.0, 1318.0, 812.0, 547.0, 332.0, 217.0, 166.0, 91.0, 77.0, 60.0, 30.0, 22.0, 19.0, 13.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.296875, -10.9566650390625, -10.616455078125, -10.2762451171875, -9.93603515625, -9.5958251953125, -9.255615234375, -8.9154052734375, -8.5751953125, -8.2349853515625, -7.894775390625, -7.5545654296875, -7.21435546875, -6.8741455078125, -6.533935546875, -6.1937255859375, -5.853515625, -5.5133056640625, -5.173095703125, -4.8328857421875, -4.49267578125, -4.1524658203125, -3.812255859375, -3.4720458984375, -3.1318359375, -2.7916259765625, -2.451416015625, -2.1112060546875, -1.77099609375, -1.4307861328125, -1.090576171875, -0.7503662109375, -0.41015625, -0.0699462890625, 0.270263671875, 0.6104736328125, 0.95068359375, 1.2908935546875, 1.631103515625, 1.9713134765625, 2.3115234375, 2.6517333984375, 2.991943359375, 3.3321533203125, 3.67236328125, 4.0125732421875, 4.352783203125, 4.6929931640625, 5.033203125, 5.3734130859375, 5.713623046875, 6.0538330078125, 6.39404296875, 6.7342529296875, 7.074462890625, 7.4146728515625, 7.7548828125, 8.0950927734375, 8.435302734375, 8.7755126953125, 9.11572265625, 9.4559326171875, 9.796142578125, 10.1363525390625, 10.4765625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 2.0, 9.0, 4.0, 13.0, 10.0, 9.0, 14.0, 17.0, 21.0, 23.0, 31.0, 38.0, 49.0, 68.0, 100.0, 86.0, 93.0, 97.0, 90.0, 45.0, 29.0, 30.0, 22.0, 15.0, 13.0, 17.0, 9.0, 10.0, 3.0, 6.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.658203125, -3.553741455078125, -3.44927978515625, -3.344818115234375, -3.2403564453125, -3.135894775390625, -3.03143310546875, -2.926971435546875, -2.822509765625, -2.718048095703125, -2.61358642578125, -2.509124755859375, -2.4046630859375, -2.300201416015625, -2.19573974609375, -2.091278076171875, -1.98681640625, -1.882354736328125, -1.77789306640625, -1.673431396484375, -1.5689697265625, -1.464508056640625, -1.36004638671875, -1.255584716796875, -1.151123046875, -1.046661376953125, -0.94219970703125, -0.837738037109375, -0.7332763671875, -0.628814697265625, -0.52435302734375, -0.419891357421875, -0.3154296875, -0.210968017578125, -0.10650634765625, -0.002044677734375, 0.1024169921875, 0.206878662109375, 0.31134033203125, 0.415802001953125, 0.520263671875, 0.624725341796875, 0.72918701171875, 0.833648681640625, 0.9381103515625, 1.042572021484375, 1.14703369140625, 1.251495361328125, 1.35595703125, 1.460418701171875, 1.56488037109375, 1.669342041015625, 1.7738037109375, 1.878265380859375, 1.98272705078125, 2.087188720703125, 2.191650390625, 2.296112060546875, 2.40057373046875, 2.505035400390625, 2.6094970703125, 2.713958740234375, 2.81842041015625, 2.922882080078125, 3.02734375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 6.0, 4.0, 9.0, 8.0, 18.0, 11.0, 25.0, 30.0, 30.0, 57.0, 70.0, 58.0, 88.0, 91.0, 97.0, 84.0, 71.0, 49.0, 43.0, 34.0, 22.0, 14.0, 24.0, 16.0, 6.0, 6.0, 7.0, 6.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.1474609375, -83.43801879882812, -80.72857666015625, -78.01913452148438, -75.30970001220703, -72.60025787353516, -69.89081573486328, -67.1813735961914, -64.47193908691406, -61.76249694824219, -59.05305862426758, -56.3436164855957, -53.634178161621094, -50.92473602294922, -48.215293884277344, -45.50585174560547, -42.796409606933594, -40.08696746826172, -37.37752914428711, -34.668087005615234, -31.958646774291992, -29.24920654296875, -26.539764404296875, -23.830324172973633, -21.12088394165039, -18.41144371032715, -15.70200252532959, -12.992561340332031, -10.283121109008789, -7.573680877685547, -4.864238739013672, -2.1547985076904297, 0.5546493530273438, 3.264090061187744, 5.9735307693481445, 8.682971954345703, 11.392412185668945, 14.101852416992188, 16.811294555664062, 19.520734786987305, 22.230175018310547, 24.93961524963379, 27.64905548095703, 30.358497619628906, 33.06793975830078, 35.77737808227539, 38.486820220947266, 41.196258544921875, 43.90570068359375, 46.615142822265625, 49.324581146240234, 52.03402328491211, 54.74346160888672, 57.452903747558594, 60.16234588623047, 62.871788024902344, 65.58122253417969, 68.29066467285156, 71.00010681152344, 73.70954895019531, 76.41898345947266, 79.12842559814453, 81.8378677368164, 84.54730987548828, 87.25675201416016]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 9.0, 8.0, 10.0, 10.0, 18.0, 9.0, 19.0, 27.0, 23.0, 35.0, 32.0, 30.0, 30.0, 43.0, 30.0, 48.0, 35.0, 45.0, 50.0, 49.0, 43.0, 50.0, 32.0, 35.0, 35.0, 31.0, 32.0, 23.0, 31.0, 13.0, 23.0, 20.0, 8.0, 15.0, 10.0, 8.0, 4.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.24112319946289, -52.443058013916016, -50.644996643066406, -48.84693145751953, -47.048866271972656, -45.25080108642578, -43.45273971557617, -41.6546745300293, -39.85661315917969, -38.05854797363281, -36.2604866027832, -34.46242141723633, -32.66435623168945, -30.86629295349121, -29.06822967529297, -27.270164489746094, -25.47209930419922, -23.674036026000977, -21.8759708404541, -20.07790756225586, -18.279842376708984, -16.481779098510742, -14.6837158203125, -12.885651588439941, -11.087587356567383, -9.289523124694824, -7.491459369659424, -5.693395614624023, -3.895331382751465, -2.0972671508789062, -0.29920387268066406, 1.4988603591918945, 3.2969284057617188, 5.094992637634277, 6.893056392669678, 8.691120147705078, 10.489184379577637, 12.287248611450195, 14.085311889648438, 15.883376121520996, 17.681440353393555, 19.479503631591797, 21.277568817138672, 23.075632095336914, 24.873695373535156, 26.67176055908203, 28.469823837280273, 30.267887115478516, 32.06595230102539, 33.864017486572266, 35.662078857421875, 37.46014404296875, 39.258209228515625, 41.0562744140625, 42.85433578491211, 44.652400970458984, 46.450462341308594, 48.24852752685547, 50.04658889770508, 51.84465408325195, 53.64271926879883, 55.44078063964844, 57.23884582519531, 59.03691101074219, 60.83497619628906]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 5.0, 12.0, 26.0, 26.0, 55.0, 96.0, 110.0, 200.0, 327.0, 508.0, 804.0, 1285.0, 2095.0, 3256.0, 5450.0, 8834.0, 14588.0, 24776.0, 44250.0, 83584.0, 176882.0, 597726.0, 1758730.0, 992509.0, 253894.0, 102708.0, 52348.0, 28415.0, 16041.0, 9629.0, 5763.0, 3457.0, 2237.0, 1345.0, 850.0, 560.0, 325.0, 210.0, 117.0, 76.0, 66.0, 37.0, 18.0, 17.0, 10.0, 14.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-79.5, -76.7275390625, -73.955078125, -71.1826171875, -68.41015625, -65.6376953125, -62.865234375, -60.0927734375, -57.3203125, -54.5478515625, -51.775390625, -49.0029296875, -46.23046875, -43.4580078125, -40.685546875, -37.9130859375, -35.140625, -32.3681640625, -29.595703125, -26.8232421875, -24.05078125, -21.2783203125, -18.505859375, -15.7333984375, -12.9609375, -10.1884765625, -7.416015625, -4.6435546875, -1.87109375, 0.9013671875, 3.673828125, 6.4462890625, 9.21875, 11.9912109375, 14.763671875, 17.5361328125, 20.30859375, 23.0810546875, 25.853515625, 28.6259765625, 31.3984375, 34.1708984375, 36.943359375, 39.7158203125, 42.48828125, 45.2607421875, 48.033203125, 50.8056640625, 53.578125, 56.3505859375, 59.123046875, 61.8955078125, 64.66796875, 67.4404296875, 70.212890625, 72.9853515625, 75.7578125, 78.5302734375, 81.302734375, 84.0751953125, 86.84765625, 89.6201171875, 92.392578125, 95.1650390625, 97.9375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 11.0, 2.0, 5.0, 7.0, 14.0, 15.0, 11.0, 18.0, 16.0, 26.0, 22.0, 19.0, 26.0, 24.0, 41.0, 40.0, 46.0, 51.0, 44.0, 37.0, 41.0, 54.0, 51.0, 44.0, 37.0, 31.0, 40.0, 28.0, 41.0, 20.0, 22.0, 17.0, 16.0, 18.0, 16.0, 14.0, 8.0, 7.0, 7.0, 7.0, 5.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.34375, -37.00390625, -35.6640625, -34.32421875, -32.984375, -31.64453125, -30.3046875, -28.96484375, -27.625, -26.28515625, -24.9453125, -23.60546875, -22.265625, -20.92578125, -19.5859375, -18.24609375, -16.90625, -15.56640625, -14.2265625, -12.88671875, -11.546875, -10.20703125, -8.8671875, -7.52734375, -6.1875, -4.84765625, -3.5078125, -2.16796875, -0.828125, 0.51171875, 1.8515625, 3.19140625, 4.53125, 5.87109375, 7.2109375, 8.55078125, 9.890625, 11.23046875, 12.5703125, 13.91015625, 15.25, 16.58984375, 17.9296875, 19.26953125, 20.609375, 21.94921875, 23.2890625, 24.62890625, 25.96875, 27.30859375, 28.6484375, 29.98828125, 31.328125, 32.66796875, 34.0078125, 35.34765625, 36.6875, 38.02734375, 39.3671875, 40.70703125, 42.046875, 43.38671875, 44.7265625, 46.06640625, 47.40625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 8.0, 16.0, 22.0, 27.0, 45.0, 91.0, 102.0, 187.0, 301.0, 419.0, 751.0, 1210.0, 1982.0, 3120.0, 5259.0, 8829.0, 15261.0, 27069.0, 48933.0, 92789.0, 185190.0, 396113.0, 1025190.0, 1391748.0, 511512.0, 228505.0, 113274.0, 59776.0, 32138.0, 18244.0, 10436.0, 6187.0, 3572.0, 2271.0, 1355.0, 851.0, 546.0, 328.0, 232.0, 137.0, 94.0, 52.0, 42.0, 20.0, 18.0, 9.0, 7.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-73.6875, -71.3955078125, -69.103515625, -66.8115234375, -64.51953125, -62.2275390625, -59.935546875, -57.6435546875, -55.3515625, -53.0595703125, -50.767578125, -48.4755859375, -46.18359375, -43.8916015625, -41.599609375, -39.3076171875, -37.015625, -34.7236328125, -32.431640625, -30.1396484375, -27.84765625, -25.5556640625, -23.263671875, -20.9716796875, -18.6796875, -16.3876953125, -14.095703125, -11.8037109375, -9.51171875, -7.2197265625, -4.927734375, -2.6357421875, -0.34375, 1.9482421875, 4.240234375, 6.5322265625, 8.82421875, 11.1162109375, 13.408203125, 15.7001953125, 17.9921875, 20.2841796875, 22.576171875, 24.8681640625, 27.16015625, 29.4521484375, 31.744140625, 34.0361328125, 36.328125, 38.6201171875, 40.912109375, 43.2041015625, 45.49609375, 47.7880859375, 50.080078125, 52.3720703125, 54.6640625, 56.9560546875, 59.248046875, 61.5400390625, 63.83203125, 66.1240234375, 68.416015625, 70.7080078125, 73.0]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 3.0, 6.0, 12.0, 10.0, 15.0, 19.0, 29.0, 27.0, 39.0, 41.0, 62.0, 85.0, 83.0, 113.0, 143.0, 151.0, 186.0, 232.0, 285.0, 372.0, 413.0, 346.0, 258.0, 197.0, 175.0, 126.0, 123.0, 121.0, 77.0, 67.0, 46.0, 39.0, 40.0, 25.0, 18.0, 19.0, 13.0, 11.0, 8.0, 4.0, 10.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.84375, -22.13671875, -21.4296875, -20.72265625, -20.015625, -19.30859375, -18.6015625, -17.89453125, -17.1875, -16.48046875, -15.7734375, -15.06640625, -14.359375, -13.65234375, -12.9453125, -12.23828125, -11.53125, -10.82421875, -10.1171875, -9.41015625, -8.703125, -7.99609375, -7.2890625, -6.58203125, -5.875, -5.16796875, -4.4609375, -3.75390625, -3.046875, -2.33984375, -1.6328125, -0.92578125, -0.21875, 0.48828125, 1.1953125, 1.90234375, 2.609375, 3.31640625, 4.0234375, 4.73046875, 5.4375, 6.14453125, 6.8515625, 7.55859375, 8.265625, 8.97265625, 9.6796875, 10.38671875, 11.09375, 11.80078125, 12.5078125, 13.21484375, 13.921875, 14.62890625, 15.3359375, 16.04296875, 16.75, 17.45703125, 18.1640625, 18.87109375, 19.578125, 20.28515625, 20.9921875, 21.69921875, 22.40625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 8.0, 8.0, 10.0, 6.0, 11.0, 16.0, 15.0, 26.0, 41.0, 58.0, 69.0, 85.0, 93.0, 119.0, 82.0, 74.0, 76.0, 43.0, 37.0, 27.0, 21.0, 22.0, 12.0, 11.0, 15.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-80.85498046875, -78.57862854003906, -76.30227661132812, -74.02593231201172, -71.74958038330078, -69.47322845458984, -67.19688415527344, -64.9205322265625, -62.64418029785156, -60.367828369140625, -58.09148025512695, -55.81513214111328, -53.538780212402344, -51.262428283691406, -48.986080169677734, -46.70973205566406, -44.433380126953125, -42.15702819824219, -39.880680084228516, -37.604331970214844, -35.327980041503906, -33.05162811279297, -30.775279998779297, -28.498929977416992, -26.222579956054688, -23.946229934692383, -21.669879913330078, -19.393529891967773, -17.11717987060547, -14.840829849243164, -12.56447982788086, -10.288129806518555, -8.011772155761719, -5.735422134399414, -3.4590721130371094, -1.1827220916748047, 1.0936279296875, 3.3699779510498047, 5.646327972412109, 7.922677993774414, 10.199028015136719, 12.475378036499023, 14.751728057861328, 17.028078079223633, 19.304428100585938, 21.580778121948242, 23.857128143310547, 26.13347816467285, 28.409828186035156, 30.68617820739746, 32.962528228759766, 35.23887634277344, 37.515228271484375, 39.79158020019531, 42.067928314208984, 44.344276428222656, 46.620628356933594, 48.89698028564453, 51.1733283996582, 53.449676513671875, 55.72602844238281, 58.00238037109375, 60.27872848510742, 62.555076599121094, 64.83142852783203]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 9.0, 6.0, 3.0, 2.0, 9.0, 11.0, 13.0, 12.0, 13.0, 12.0, 10.0, 23.0, 9.0, 30.0, 23.0, 22.0, 25.0, 29.0, 30.0, 41.0, 30.0, 34.0, 43.0, 40.0, 36.0, 37.0, 33.0, 30.0, 34.0, 37.0, 34.0, 39.0, 31.0, 32.0, 24.0, 22.0, 11.0, 25.0, 18.0, 11.0, 12.0, 10.0, 7.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-37.225006103515625, -36.0454216003418, -34.865840911865234, -33.686256408691406, -32.506675720214844, -31.327091217041016, -30.147506713867188, -28.967924118041992, -27.788341522216797, -26.6087589263916, -25.429176330566406, -24.249591827392578, -23.070009231567383, -21.890426635742188, -20.71084213256836, -19.531259536743164, -18.35167694091797, -17.172094345092773, -15.992510795593262, -14.81292724609375, -13.633344650268555, -12.45376205444336, -11.274178504943848, -10.094594955444336, -8.91501235961914, -7.735429286956787, -6.555846214294434, -5.37626314163208, -4.196680068969727, -3.017096996307373, -1.8375139236450195, -0.6579303741455078, 0.5216522216796875, 1.701235294342041, 2.8808183670043945, 4.060401439666748, 5.239984512329102, 6.419567584991455, 7.599150657653809, 8.77873420715332, 9.958316802978516, 11.137899398803711, 12.317482948303223, 13.497066497802734, 14.67664909362793, 15.856231689453125, 17.035816192626953, 18.21539878845215, 19.394981384277344, 20.57456398010254, 21.754146575927734, 22.933731079101562, 24.113313674926758, 25.292896270751953, 26.47248077392578, 27.652063369750977, 28.831645965576172, 30.011228561401367, 31.190811157226562, 32.37039566040039, 33.54998016357422, 34.72956085205078, 35.90914535522461, 37.08872985839844, 38.268310546875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 11.0, 20.0, 34.0, 45.0, 57.0, 87.0, 141.0, 192.0, 298.0, 443.0, 676.0, 1004.0, 1424.0, 2213.0, 3230.0, 4834.0, 7273.0, 10740.0, 16503.0, 25029.0, 38064.0, 59356.0, 92274.0, 147360.0, 207873.0, 153279.0, 97322.0, 62026.0, 39488.0, 26109.0, 17175.0, 11365.0, 7432.0, 5035.0, 3315.0, 2173.0, 1537.0, 989.0, 740.0, 420.0, 321.0, 192.0, 156.0, 110.0, 59.0, 43.0, 25.0, 22.0, 10.0, 10.0, 9.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.78125, -21.0908203125, -20.400390625, -19.7099609375, -19.01953125, -18.3291015625, -17.638671875, -16.9482421875, -16.2578125, -15.5673828125, -14.876953125, -14.1865234375, -13.49609375, -12.8056640625, -12.115234375, -11.4248046875, -10.734375, -10.0439453125, -9.353515625, -8.6630859375, -7.97265625, -7.2822265625, -6.591796875, -5.9013671875, -5.2109375, -4.5205078125, -3.830078125, -3.1396484375, -2.44921875, -1.7587890625, -1.068359375, -0.3779296875, 0.3125, 1.0029296875, 1.693359375, 2.3837890625, 3.07421875, 3.7646484375, 4.455078125, 5.1455078125, 5.8359375, 6.5263671875, 7.216796875, 7.9072265625, 8.59765625, 9.2880859375, 9.978515625, 10.6689453125, 11.359375, 12.0498046875, 12.740234375, 13.4306640625, 14.12109375, 14.8115234375, 15.501953125, 16.1923828125, 16.8828125, 17.5732421875, 18.263671875, 18.9541015625, 19.64453125, 20.3349609375, 21.025390625, 21.7158203125, 22.40625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 10.0, 4.0, 6.0, 17.0, 9.0, 15.0, 21.0, 20.0, 20.0, 20.0, 26.0, 22.0, 32.0, 34.0, 34.0, 31.0, 40.0, 31.0, 43.0, 30.0, 34.0, 31.0, 32.0, 39.0, 33.0, 39.0, 29.0, 39.0, 26.0, 28.0, 22.0, 20.0, 24.0, 16.0, 19.0, 14.0, 11.0, 11.0, 7.0, 4.0, 8.0, 7.0, 4.0, 4.0, 1.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-37.75, -36.5732421875, -35.396484375, -34.2197265625, -33.04296875, -31.8662109375, -30.689453125, -29.5126953125, -28.3359375, -27.1591796875, -25.982421875, -24.8056640625, -23.62890625, -22.4521484375, -21.275390625, -20.0986328125, -18.921875, -17.7451171875, -16.568359375, -15.3916015625, -14.21484375, -13.0380859375, -11.861328125, -10.6845703125, -9.5078125, -8.3310546875, -7.154296875, -5.9775390625, -4.80078125, -3.6240234375, -2.447265625, -1.2705078125, -0.09375, 1.0830078125, 2.259765625, 3.4365234375, 4.61328125, 5.7900390625, 6.966796875, 8.1435546875, 9.3203125, 10.4970703125, 11.673828125, 12.8505859375, 14.02734375, 15.2041015625, 16.380859375, 17.5576171875, 18.734375, 19.9111328125, 21.087890625, 22.2646484375, 23.44140625, 24.6181640625, 25.794921875, 26.9716796875, 28.1484375, 29.3251953125, 30.501953125, 31.6787109375, 32.85546875, 34.0322265625, 35.208984375, 36.3857421875, 37.5625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 6.0, 4.0, 5.0, 5.0, 7.0, 12.0, 16.0, 36.0, 48.0, 62.0, 115.0, 166.0, 230.0, 369.0, 554.0, 918.0, 1471.0, 2426.0, 4052.0, 6910.0, 12325.0, 22254.0, 41994.0, 83399.0, 171159.0, 322721.0, 186866.0, 89703.0, 45240.0, 23858.0, 13116.0, 7344.0, 4326.0, 2568.0, 1547.0, 1022.0, 613.0, 382.0, 242.0, 142.0, 106.0, 67.0, 59.0, 31.0, 25.0, 11.0, 10.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-29.484375, -28.631103515625, -27.77783203125, -26.924560546875, -26.0712890625, -25.218017578125, -24.36474609375, -23.511474609375, -22.658203125, -21.804931640625, -20.95166015625, -20.098388671875, -19.2451171875, -18.391845703125, -17.53857421875, -16.685302734375, -15.83203125, -14.978759765625, -14.12548828125, -13.272216796875, -12.4189453125, -11.565673828125, -10.71240234375, -9.859130859375, -9.005859375, -8.152587890625, -7.29931640625, -6.446044921875, -5.5927734375, -4.739501953125, -3.88623046875, -3.032958984375, -2.1796875, -1.326416015625, -0.47314453125, 0.380126953125, 1.2333984375, 2.086669921875, 2.93994140625, 3.793212890625, 4.646484375, 5.499755859375, 6.35302734375, 7.206298828125, 8.0595703125, 8.912841796875, 9.76611328125, 10.619384765625, 11.47265625, 12.325927734375, 13.17919921875, 14.032470703125, 14.8857421875, 15.739013671875, 16.59228515625, 17.445556640625, 18.298828125, 19.152099609375, 20.00537109375, 20.858642578125, 21.7119140625, 22.565185546875, 23.41845703125, 24.271728515625, 25.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 7.0, 6.0, 3.0, 2.0, 4.0, 6.0, 13.0, 11.0, 15.0, 18.0, 27.0, 25.0, 25.0, 27.0, 39.0, 38.0, 35.0, 30.0, 44.0, 42.0, 40.0, 35.0, 53.0, 39.0, 48.0, 42.0, 34.0, 46.0, 35.0, 38.0, 25.0, 19.0, 25.0, 22.0, 17.0, 13.0, 7.0, 9.0, 7.0, 3.0, 10.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.390625, -28.491455078125, -27.59228515625, -26.693115234375, -25.7939453125, -24.894775390625, -23.99560546875, -23.096435546875, -22.197265625, -21.298095703125, -20.39892578125, -19.499755859375, -18.6005859375, -17.701416015625, -16.80224609375, -15.903076171875, -15.00390625, -14.104736328125, -13.20556640625, -12.306396484375, -11.4072265625, -10.508056640625, -9.60888671875, -8.709716796875, -7.810546875, -6.911376953125, -6.01220703125, -5.113037109375, -4.2138671875, -3.314697265625, -2.41552734375, -1.516357421875, -0.6171875, 0.281982421875, 1.18115234375, 2.080322265625, 2.9794921875, 3.878662109375, 4.77783203125, 5.677001953125, 6.576171875, 7.475341796875, 8.37451171875, 9.273681640625, 10.1728515625, 11.072021484375, 11.97119140625, 12.870361328125, 13.76953125, 14.668701171875, 15.56787109375, 16.467041015625, 17.3662109375, 18.265380859375, 19.16455078125, 20.063720703125, 20.962890625, 21.862060546875, 22.76123046875, 23.660400390625, 24.5595703125, 25.458740234375, 26.35791015625, 27.257080078125, 28.15625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 4.0, 9.0, 13.0, 17.0, 32.0, 53.0, 51.0, 102.0, 146.0, 258.0, 437.0, 740.0, 1439.0, 3203.0, 7562.0, 22857.0, 92121.0, 623199.0, 232297.0, 41847.0, 12728.0, 4729.0, 2182.0, 1072.0, 604.0, 293.0, 210.0, 128.0, 72.0, 51.0, 34.0, 21.0, 11.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7001953125, -0.6811370849609375, -0.662078857421875, -0.6430206298828125, -0.62396240234375, -0.6049041748046875, -0.585845947265625, -0.5667877197265625, -0.5477294921875, -0.5286712646484375, -0.509613037109375, -0.4905548095703125, -0.47149658203125, -0.4524383544921875, -0.433380126953125, -0.4143218994140625, -0.395263671875, -0.3762054443359375, -0.357147216796875, -0.3380889892578125, -0.31903076171875, -0.2999725341796875, -0.280914306640625, -0.2618560791015625, -0.2427978515625, -0.2237396240234375, -0.204681396484375, -0.1856231689453125, -0.16656494140625, -0.1475067138671875, -0.128448486328125, -0.1093902587890625, -0.09033203125, -0.0712738037109375, -0.052215576171875, -0.0331573486328125, -0.01409912109375, 0.0049591064453125, 0.024017333984375, 0.0430755615234375, 0.0621337890625, 0.0811920166015625, 0.100250244140625, 0.1193084716796875, 0.13836669921875, 0.1574249267578125, 0.176483154296875, 0.1955413818359375, 0.214599609375, 0.2336578369140625, 0.252716064453125, 0.2717742919921875, 0.29083251953125, 0.3098907470703125, 0.328948974609375, 0.3480072021484375, 0.3670654296875, 0.3861236572265625, 0.405181884765625, 0.4242401123046875, 0.44329833984375, 0.4623565673828125, 0.481414794921875, 0.5004730224609375, 0.51953125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 4.0, 7.0, 5.0, 9.0, 10.0, 16.0, 25.0, 23.0, 40.0, 42.0, 50.0, 66.0, 86.0, 88.0, 94.0, 79.0, 79.0, 59.0, 52.0, 34.0, 29.0, 22.0, 18.0, 13.0, 9.0, 3.0, 3.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0001323223114013672, -0.00012877583503723145, -0.0001252293586730957, -0.00012168288230895996, -0.00011813640594482422, -0.00011458992958068848, -0.00011104345321655273, -0.00010749697685241699, -0.00010395050048828125, -0.00010040402412414551, -9.685754776000977e-05, -9.331107139587402e-05, -8.976459503173828e-05, -8.621811866760254e-05, -8.26716423034668e-05, -7.912516593933105e-05, -7.557868957519531e-05, -7.203221321105957e-05, -6.848573684692383e-05, -6.493926048278809e-05, -6.139278411865234e-05, -5.78463077545166e-05, -5.429983139038086e-05, -5.075335502624512e-05, -4.7206878662109375e-05, -4.366040229797363e-05, -4.011392593383789e-05, -3.656744956970215e-05, -3.3020973205566406e-05, -2.9474496841430664e-05, -2.5928020477294922e-05, -2.238154411315918e-05, -1.8835067749023438e-05, -1.5288591384887695e-05, -1.1742115020751953e-05, -8.195638656616211e-06, -4.649162292480469e-06, -1.1026859283447266e-06, 2.4437904357910156e-06, 5.990266799926758e-06, 9.5367431640625e-06, 1.3083219528198242e-05, 1.6629695892333984e-05, 2.0176172256469727e-05, 2.372264862060547e-05, 2.726912498474121e-05, 3.081560134887695e-05, 3.4362077713012695e-05, 3.790855407714844e-05, 4.145503044128418e-05, 4.500150680541992e-05, 4.8547983169555664e-05, 5.2094459533691406e-05, 5.564093589782715e-05, 5.918741226196289e-05, 6.273388862609863e-05, 6.628036499023438e-05, 6.982684135437012e-05, 7.337331771850586e-05, 7.69197940826416e-05, 8.046627044677734e-05, 8.401274681091309e-05, 8.755922317504883e-05, 9.110569953918457e-05, 9.465217590332031e-05]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 3.0, 6.0, 9.0, 13.0, 21.0, 27.0, 30.0, 50.0, 70.0, 108.0, 140.0, 216.0, 288.0, 395.0, 547.0, 852.0, 1264.0, 1823.0, 2899.0, 4740.0, 8081.0, 14165.0, 26670.0, 55586.0, 135887.0, 394784.0, 232718.0, 83274.0, 37547.0, 18950.0, 10487.0, 5961.0, 3750.0, 2340.0, 1513.0, 958.0, 712.0, 477.0, 328.0, 271.0, 185.0, 115.0, 96.0, 76.0, 57.0, 26.0, 11.0, 16.0, 4.0, 5.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.289306640625, -0.27957916259765625, -0.2698516845703125, -0.26012420654296875, -0.250396728515625, -0.24066925048828125, -0.2309417724609375, -0.22121429443359375, -0.21148681640625, -0.20175933837890625, -0.1920318603515625, -0.18230438232421875, -0.172576904296875, -0.16284942626953125, -0.1531219482421875, -0.14339447021484375, -0.1336669921875, -0.12393951416015625, -0.1142120361328125, -0.10448455810546875, -0.094757080078125, -0.08502960205078125, -0.0753021240234375, -0.06557464599609375, -0.05584716796875, -0.04611968994140625, -0.0363922119140625, -0.02666473388671875, -0.016937255859375, -0.00720977783203125, 0.0025177001953125, 0.01224517822265625, 0.02197265625, 0.03170013427734375, 0.0414276123046875, 0.05115509033203125, 0.060882568359375, 0.07061004638671875, 0.0803375244140625, 0.09006500244140625, 0.09979248046875, 0.10951995849609375, 0.1192474365234375, 0.12897491455078125, 0.138702392578125, 0.14842987060546875, 0.1581573486328125, 0.16788482666015625, 0.1776123046875, 0.18733978271484375, 0.1970672607421875, 0.20679473876953125, 0.216522216796875, 0.22624969482421875, 0.2359771728515625, 0.24570465087890625, 0.25543212890625, 0.26515960693359375, 0.2748870849609375, 0.28461456298828125, 0.294342041015625, 0.30406951904296875, 0.3137969970703125, 0.32352447509765625, 0.333251953125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 7.0, 10.0, 7.0, 10.0, 17.0, 23.0, 15.0, 30.0, 24.0, 40.0, 39.0, 57.0, 76.0, 76.0, 77.0, 79.0, 74.0, 56.0, 57.0, 40.0, 32.0, 33.0, 22.0, 22.0, 14.0, 8.0, 8.0, 9.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09307861328125, -0.09016036987304688, -0.08724212646484375, -0.08432388305664062, -0.0814056396484375, -0.07848739624023438, -0.07556915283203125, -0.07265090942382812, -0.069732666015625, -0.06681442260742188, -0.06389617919921875, -0.060977935791015625, -0.0580596923828125, -0.055141448974609375, -0.05222320556640625, -0.049304962158203125, -0.04638671875, -0.043468475341796875, -0.04055023193359375, -0.037631988525390625, -0.0347137451171875, -0.031795501708984375, -0.02887725830078125, -0.025959014892578125, -0.023040771484375, -0.020122528076171875, -0.01720428466796875, -0.014286041259765625, -0.0113677978515625, -0.008449554443359375, -0.00553131103515625, -0.002613067626953125, 0.00030517578125, 0.003223419189453125, 0.00614166259765625, 0.009059906005859375, 0.0119781494140625, 0.014896392822265625, 0.01781463623046875, 0.020732879638671875, 0.023651123046875, 0.026569366455078125, 0.02948760986328125, 0.032405853271484375, 0.0353240966796875, 0.038242340087890625, 0.04116058349609375, 0.044078826904296875, 0.0469970703125, 0.049915313720703125, 0.05283355712890625, 0.055751800537109375, 0.0586700439453125, 0.061588287353515625, 0.06450653076171875, 0.06742477416992188, 0.070343017578125, 0.07326126098632812, 0.07617950439453125, 0.07909774780273438, 0.0820159912109375, 0.08493423461914062, 0.08785247802734375, 0.09077072143554688, 0.09368896484375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 11.0, 9.0, 9.0, 9.0, 13.0, 13.0, 27.0, 46.0, 43.0, 77.0, 81.0, 106.0, 109.0, 107.0, 78.0, 61.0, 52.0, 27.0, 37.0, 18.0, 15.0, 14.0, 12.0, 9.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.83135223388672, -77.58602905273438, -75.34070587158203, -73.09538269042969, -70.85005950927734, -68.604736328125, -66.35941314697266, -64.11408996582031, -61.86876678466797, -59.623443603515625, -57.37812042236328, -55.13279724121094, -52.887474060058594, -50.64215087890625, -48.396827697753906, -46.15150451660156, -43.90618133544922, -41.660858154296875, -39.41553497314453, -37.17021179199219, -34.924888610839844, -32.6795654296875, -30.434242248535156, -28.188919067382812, -25.94359588623047, -23.698272705078125, -21.45294952392578, -19.207626342773438, -16.962303161621094, -14.71697998046875, -12.471656799316406, -10.226333618164062, -7.981006622314453, -5.735683441162109, -3.4903602600097656, -1.2450370788574219, 1.0002861022949219, 3.2456092834472656, 5.490932464599609, 7.736255645751953, 9.981578826904297, 12.22690200805664, 14.472225189208984, 16.717548370361328, 18.962871551513672, 21.208194732666016, 23.45351791381836, 25.698841094970703, 27.944164276123047, 30.18948745727539, 32.434810638427734, 34.68013381958008, 36.92545700073242, 39.170780181884766, 41.41610336303711, 43.66142654418945, 45.9067497253418, 48.15207290649414, 50.397396087646484, 52.64271926879883, 54.88804244995117, 57.133365631103516, 59.37868881225586, 61.6240119934082, 63.86933517456055]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 3.0, 5.0, 7.0, 10.0, 13.0, 11.0, 17.0, 9.0, 9.0, 22.0, 12.0, 28.0, 24.0, 21.0, 23.0, 30.0, 29.0, 40.0, 30.0, 36.0, 44.0, 36.0, 39.0, 35.0, 37.0, 31.0, 29.0, 38.0, 35.0, 46.0, 26.0, 31.0, 25.0, 21.0, 12.0, 26.0, 21.0, 12.0, 9.0, 10.0, 7.0, 10.0, 7.0, 4.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-35.50832748413086, -34.384117126464844, -33.259910583496094, -32.13570022583008, -31.011489868164062, -29.887279510498047, -28.763071060180664, -27.63886260986328, -26.514652252197266, -25.39044189453125, -24.266233444213867, -23.142024993896484, -22.01781463623047, -20.893604278564453, -19.76939582824707, -18.645187377929688, -17.520977020263672, -16.396766662597656, -15.272558212280273, -14.148348808288574, -13.024139404296875, -11.899930000305176, -10.775720596313477, -9.651511192321777, -8.527301788330078, -7.403092384338379, -6.27888298034668, -5.1546735763549805, -4.030464172363281, -2.906254768371582, -1.7820453643798828, -0.6578359603881836, 0.46636962890625, 1.5905790328979492, 2.7147884368896484, 3.8389978408813477, 4.963207244873047, 6.087416648864746, 7.211626052856445, 8.335835456848145, 9.460044860839844, 10.584254264831543, 11.708463668823242, 12.832673072814941, 13.95688247680664, 15.08109188079834, 16.20530128479004, 17.329509735107422, 18.453720092773438, 19.577930450439453, 20.702138900756836, 21.82634735107422, 22.950557708740234, 24.07476806640625, 25.198976516723633, 26.323184967041016, 27.44739532470703, 28.571605682373047, 29.69581413269043, 30.820022583007812, 31.944232940673828, 33.068443298339844, 34.192649841308594, 35.31686019897461, 36.441070556640625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 11.0, 8.0, 13.0, 22.0, 48.0, 84.0, 113.0, 158.0, 202.0, 363.0, 493.0, 702.0, 1123.0, 1734.0, 2484.0, 3730.0, 5714.0, 8893.0, 13401.0, 20837.0, 31751.0, 49683.0, 76359.0, 114011.0, 153388.0, 164557.0, 133353.0, 91533.0, 61252.0, 39528.0, 25595.0, 16205.0, 10476.0, 7000.0, 4452.0, 3028.0, 2048.0, 1365.0, 967.0, 618.0, 413.0, 312.0, 182.0, 107.0, 91.0, 54.0, 32.0, 25.0, 15.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-60.8125, -58.92578125, -57.0390625, -55.15234375, -53.265625, -51.37890625, -49.4921875, -47.60546875, -45.71875, -43.83203125, -41.9453125, -40.05859375, -38.171875, -36.28515625, -34.3984375, -32.51171875, -30.625, -28.73828125, -26.8515625, -24.96484375, -23.078125, -21.19140625, -19.3046875, -17.41796875, -15.53125, -13.64453125, -11.7578125, -9.87109375, -7.984375, -6.09765625, -4.2109375, -2.32421875, -0.4375, 1.44921875, 3.3359375, 5.22265625, 7.109375, 8.99609375, 10.8828125, 12.76953125, 14.65625, 16.54296875, 18.4296875, 20.31640625, 22.203125, 24.08984375, 25.9765625, 27.86328125, 29.75, 31.63671875, 33.5234375, 35.41015625, 37.296875, 39.18359375, 41.0703125, 42.95703125, 44.84375, 46.73046875, 48.6171875, 50.50390625, 52.390625, 54.27734375, 56.1640625, 58.05078125, 59.9375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 4.0, 5.0, 6.0, 12.0, 6.0, 8.0, 8.0, 10.0, 13.0, 21.0, 15.0, 21.0, 28.0, 24.0, 19.0, 33.0, 37.0, 24.0, 28.0, 42.0, 44.0, 38.0, 46.0, 35.0, 31.0, 35.0, 45.0, 29.0, 36.0, 30.0, 33.0, 37.0, 37.0, 29.0, 24.0, 14.0, 16.0, 11.0, 11.0, 13.0, 7.0, 5.0, 5.0, 2.0, 10.0, 3.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-30.40625, -29.39990234375, -28.3935546875, -27.38720703125, -26.380859375, -25.37451171875, -24.3681640625, -23.36181640625, -22.35546875, -21.34912109375, -20.3427734375, -19.33642578125, -18.330078125, -17.32373046875, -16.3173828125, -15.31103515625, -14.3046875, -13.29833984375, -12.2919921875, -11.28564453125, -10.279296875, -9.27294921875, -8.2666015625, -7.26025390625, -6.25390625, -5.24755859375, -4.2412109375, -3.23486328125, -2.228515625, -1.22216796875, -0.2158203125, 0.79052734375, 1.796875, 2.80322265625, 3.8095703125, 4.81591796875, 5.822265625, 6.82861328125, 7.8349609375, 8.84130859375, 9.84765625, 10.85400390625, 11.8603515625, 12.86669921875, 13.873046875, 14.87939453125, 15.8857421875, 16.89208984375, 17.8984375, 18.90478515625, 19.9111328125, 20.91748046875, 21.923828125, 22.93017578125, 23.9365234375, 24.94287109375, 25.94921875, 26.95556640625, 27.9619140625, 28.96826171875, 29.974609375, 30.98095703125, 31.9873046875, 32.99365234375, 34.0]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 15.0, 23.0, 25.0, 32.0, 61.0, 75.0, 137.0, 185.0, 288.0, 474.0, 729.0, 1233.0, 1778.0, 2617.0, 4025.0, 6034.0, 9572.0, 14898.0, 23136.0, 36822.0, 58594.0, 92316.0, 141398.0, 180690.0, 163151.0, 112983.0, 72206.0, 45440.0, 28325.0, 18116.0, 11628.0, 7465.0, 4866.0, 3141.0, 2046.0, 1386.0, 922.0, 581.0, 424.0, 235.0, 159.0, 110.0, 78.0, 53.0, 32.0, 20.0, 14.0, 4.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-62.625, -60.76806640625, -58.9111328125, -57.05419921875, -55.197265625, -53.34033203125, -51.4833984375, -49.62646484375, -47.76953125, -45.91259765625, -44.0556640625, -42.19873046875, -40.341796875, -38.48486328125, -36.6279296875, -34.77099609375, -32.9140625, -31.05712890625, -29.2001953125, -27.34326171875, -25.486328125, -23.62939453125, -21.7724609375, -19.91552734375, -18.05859375, -16.20166015625, -14.3447265625, -12.48779296875, -10.630859375, -8.77392578125, -6.9169921875, -5.06005859375, -3.203125, -1.34619140625, 0.5107421875, 2.36767578125, 4.224609375, 6.08154296875, 7.9384765625, 9.79541015625, 11.65234375, 13.50927734375, 15.3662109375, 17.22314453125, 19.080078125, 20.93701171875, 22.7939453125, 24.65087890625, 26.5078125, 28.36474609375, 30.2216796875, 32.07861328125, 33.935546875, 35.79248046875, 37.6494140625, 39.50634765625, 41.36328125, 43.22021484375, 45.0771484375, 46.93408203125, 48.791015625, 50.64794921875, 52.5048828125, 54.36181640625, 56.21875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 3.0, 3.0, 9.0, 5.0, 5.0, 15.0, 8.0, 15.0, 12.0, 13.0, 21.0, 27.0, 16.0, 32.0, 23.0, 24.0, 38.0, 37.0, 39.0, 53.0, 56.0, 48.0, 43.0, 36.0, 34.0, 37.0, 29.0, 26.0, 31.0, 33.0, 26.0, 28.0, 33.0, 19.0, 25.0, 14.0, 18.0, 15.0, 10.0, 8.0, 9.0, 4.0, 3.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-23.75, -23.08935546875, -22.4287109375, -21.76806640625, -21.107421875, -20.44677734375, -19.7861328125, -19.12548828125, -18.46484375, -17.80419921875, -17.1435546875, -16.48291015625, -15.822265625, -15.16162109375, -14.5009765625, -13.84033203125, -13.1796875, -12.51904296875, -11.8583984375, -11.19775390625, -10.537109375, -9.87646484375, -9.2158203125, -8.55517578125, -7.89453125, -7.23388671875, -6.5732421875, -5.91259765625, -5.251953125, -4.59130859375, -3.9306640625, -3.27001953125, -2.609375, -1.94873046875, -1.2880859375, -0.62744140625, 0.033203125, 0.69384765625, 1.3544921875, 2.01513671875, 2.67578125, 3.33642578125, 3.9970703125, 4.65771484375, 5.318359375, 5.97900390625, 6.6396484375, 7.30029296875, 7.9609375, 8.62158203125, 9.2822265625, 9.94287109375, 10.603515625, 11.26416015625, 11.9248046875, 12.58544921875, 13.24609375, 13.90673828125, 14.5673828125, 15.22802734375, 15.888671875, 16.54931640625, 17.2099609375, 17.87060546875, 18.53125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 14.0, 10.0, 27.0, 29.0, 37.0, 61.0, 86.0, 152.0, 219.0, 295.0, 511.0, 840.0, 1348.0, 2318.0, 3862.0, 7049.0, 13166.0, 25913.0, 55629.0, 137654.0, 402417.0, 237902.0, 82375.0, 36678.0, 18090.0, 9280.0, 5133.0, 2845.0, 1781.0, 1016.0, 644.0, 407.0, 266.0, 155.0, 112.0, 76.0, 51.0, 39.0, 21.0, 20.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.11907958984375, -5.9061279296875, -5.69317626953125, -5.480224609375, -5.26727294921875, -5.0543212890625, -4.84136962890625, -4.62841796875, -4.41546630859375, -4.2025146484375, -3.98956298828125, -3.776611328125, -3.56365966796875, -3.3507080078125, -3.13775634765625, -2.9248046875, -2.71185302734375, -2.4989013671875, -2.28594970703125, -2.072998046875, -1.86004638671875, -1.6470947265625, -1.43414306640625, -1.22119140625, -1.00823974609375, -0.7952880859375, -0.58233642578125, -0.369384765625, -0.15643310546875, 0.0565185546875, 0.26947021484375, 0.482421875, 0.69537353515625, 0.9083251953125, 1.12127685546875, 1.334228515625, 1.54718017578125, 1.7601318359375, 1.97308349609375, 2.18603515625, 2.39898681640625, 2.6119384765625, 2.82489013671875, 3.037841796875, 3.25079345703125, 3.4637451171875, 3.67669677734375, 3.8896484375, 4.10260009765625, 4.3155517578125, 4.52850341796875, 4.741455078125, 4.95440673828125, 5.1673583984375, 5.38031005859375, 5.59326171875, 5.80621337890625, 6.0191650390625, 6.23211669921875, 6.445068359375, 6.65802001953125, 6.8709716796875, 7.08392333984375, 7.296875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 10.0, 6.0, 13.0, 20.0, 21.0, 33.0, 43.0, 57.0, 98.0, 131.0, 149.0, 121.0, 88.0, 43.0, 48.0, 26.0, 30.0, 19.0, 13.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.001041412353515625, -0.0010112226009368896, -0.0009810328483581543, -0.0009508430957794189, -0.0009206533432006836, -0.0008904635906219482, -0.0008602738380432129, -0.0008300840854644775, -0.0007998943328857422, -0.0007697045803070068, -0.0007395148277282715, -0.0007093250751495361, -0.0006791353225708008, -0.0006489455699920654, -0.0006187558174133301, -0.0005885660648345947, -0.0005583763122558594, -0.000528186559677124, -0.0004979968070983887, -0.0004678070545196533, -0.00043761730194091797, -0.0004074275493621826, -0.00037723779678344727, -0.0003470480442047119, -0.00031685829162597656, -0.0002866685390472412, -0.00025647878646850586, -0.0002262890338897705, -0.00019609928131103516, -0.0001659095287322998, -0.00013571977615356445, -0.0001055300235748291, -7.534027099609375e-05, -4.51505184173584e-05, -1.4960765838623047e-05, 1.5228986740112305e-05, 4.5418739318847656e-05, 7.560849189758301e-05, 0.00010579824447631836, 0.0001359879970550537, 0.00016617774963378906, 0.00019636750221252441, 0.00022655725479125977, 0.0002567470073699951, 0.00028693675994873047, 0.0003171265125274658, 0.00034731626510620117, 0.0003775060176849365, 0.0004076957702636719, 0.0004378855228424072, 0.0004680752754211426, 0.0004982650279998779, 0.0005284547805786133, 0.0005586445331573486, 0.000588834285736084, 0.0006190240383148193, 0.0006492137908935547, 0.00067940354347229, 0.0007095932960510254, 0.0007397830486297607, 0.0007699728012084961, 0.0008001625537872314, 0.0008303523063659668, 0.0008605420589447021, 0.0008907318115234375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 6.0, 10.0, 19.0, 23.0, 47.0, 45.0, 83.0, 152.0, 169.0, 252.0, 363.0, 511.0, 810.0, 1085.0, 1686.0, 2469.0, 3788.0, 6247.0, 10202.0, 17270.0, 30841.0, 58190.0, 125740.0, 314026.0, 255818.0, 102467.0, 49352.0, 26408.0, 15137.0, 9178.0, 5642.0, 3426.0, 2288.0, 1493.0, 1030.0, 693.0, 452.0, 326.0, 262.0, 164.0, 116.0, 76.0, 60.0, 33.0, 32.0, 15.0, 16.0, 7.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.78515625, -4.625, -4.46484375, -4.3046875, -4.14453125, -3.984375, -3.82421875, -3.6640625, -3.50390625, -3.34375, -3.18359375, -3.0234375, -2.86328125, -2.703125, -2.54296875, -2.3828125, -2.22265625, -2.0625, -1.90234375, -1.7421875, -1.58203125, -1.421875, -1.26171875, -1.1015625, -0.94140625, -0.78125, -0.62109375, -0.4609375, -0.30078125, -0.140625, 0.01953125, 0.1796875, 0.33984375, 0.5, 0.66015625, 0.8203125, 0.98046875, 1.140625, 1.30078125, 1.4609375, 1.62109375, 1.78125, 1.94140625, 2.1015625, 2.26171875, 2.421875, 2.58203125, 2.7421875, 2.90234375, 3.0625, 3.22265625, 3.3828125, 3.54296875, 3.703125, 3.86328125, 4.0234375, 4.18359375, 4.34375, 4.50390625, 4.6640625, 4.82421875, 4.984375, 5.14453125, 5.3046875, 5.46484375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 6.0, 7.0, 6.0, 6.0, 8.0, 7.0, 15.0, 10.0, 19.0, 26.0, 23.0, 26.0, 22.0, 37.0, 28.0, 46.0, 42.0, 72.0, 60.0, 66.0, 62.0, 54.0, 61.0, 52.0, 30.0, 31.0, 20.0, 28.0, 27.0, 23.0, 19.0, 8.0, 7.0, 7.0, 10.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0], "bins": [-1.5302734375, -1.490203857421875, -1.45013427734375, -1.410064697265625, -1.3699951171875, -1.329925537109375, -1.28985595703125, -1.249786376953125, -1.209716796875, -1.169647216796875, -1.12957763671875, -1.089508056640625, -1.0494384765625, -1.009368896484375, -0.96929931640625, -0.929229736328125, -0.88916015625, -0.849090576171875, -0.80902099609375, -0.768951416015625, -0.7288818359375, -0.688812255859375, -0.64874267578125, -0.608673095703125, -0.568603515625, -0.528533935546875, -0.48846435546875, -0.448394775390625, -0.4083251953125, -0.368255615234375, -0.32818603515625, -0.288116455078125, -0.248046875, -0.207977294921875, -0.16790771484375, -0.127838134765625, -0.0877685546875, -0.047698974609375, -0.00762939453125, 0.032440185546875, 0.072509765625, 0.112579345703125, 0.15264892578125, 0.192718505859375, 0.2327880859375, 0.272857666015625, 0.31292724609375, 0.352996826171875, 0.39306640625, 0.433135986328125, 0.47320556640625, 0.513275146484375, 0.5533447265625, 0.593414306640625, 0.63348388671875, 0.673553466796875, 0.713623046875, 0.753692626953125, 0.79376220703125, 0.833831787109375, 0.8739013671875, 0.913970947265625, 0.95404052734375, 0.994110107421875, 1.0341796875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 9.0, 8.0, 16.0, 14.0, 10.0, 21.0, 27.0, 40.0, 54.0, 63.0, 60.0, 85.0, 89.0, 101.0, 73.0, 63.0, 57.0, 38.0, 49.0, 23.0, 19.0, 13.0, 11.0, 13.0, 12.0, 4.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0], "bins": [-69.36333465576172, -67.66860961914062, -65.973876953125, -64.2791519165039, -62.58441925048828, -60.88969039916992, -59.19496154785156, -57.50023651123047, -55.805503845214844, -54.110774993896484, -52.416046142578125, -50.721317291259766, -49.026588439941406, -47.33185958862305, -45.63713073730469, -43.942405700683594, -42.247676849365234, -40.552947998046875, -38.858219146728516, -37.163490295410156, -35.4687614440918, -33.77403259277344, -32.079307556152344, -30.38457679748535, -28.689847946166992, -26.995119094848633, -25.300390243530273, -23.605663299560547, -21.910934448242188, -20.216205596923828, -18.52147674560547, -16.82674789428711, -15.132022857666016, -13.437294006347656, -11.742565155029297, -10.047837257385254, -8.353108406066895, -6.658379554748535, -4.963651657104492, -3.268922805786133, -1.5741939544677734, 0.12053465843200684, 1.815263271331787, 3.5099916458129883, 5.204720497131348, 6.899449348449707, 8.59417724609375, 10.28890609741211, 11.983634948730469, 13.678363800048828, 15.373092651367188, 17.067821502685547, 18.762550354003906, 20.457279205322266, 22.152006149291992, 23.84673500061035, 25.54146385192871, 27.23619270324707, 28.93092155456543, 30.625648498535156, 32.320377349853516, 34.015106201171875, 35.709835052490234, 37.404563903808594, 39.09929275512695]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 6.0, 9.0, 9.0, 7.0, 16.0, 10.0, 21.0, 14.0, 25.0, 28.0, 27.0, 28.0, 30.0, 31.0, 29.0, 30.0, 38.0, 39.0, 38.0, 35.0, 38.0, 40.0, 39.0, 31.0, 35.0, 36.0, 30.0, 41.0, 32.0, 27.0, 21.0, 22.0, 14.0, 20.0, 22.0, 7.0, 10.0, 10.0, 9.0, 4.0, 5.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.142690658569336, -28.109111785888672, -27.075532913208008, -26.041954040527344, -25.008373260498047, -23.974796295166016, -22.94121551513672, -21.907636642456055, -20.87405776977539, -19.840478897094727, -18.806900024414062, -17.7733211517334, -16.739742279052734, -15.706162452697754, -14.672582626342773, -13.63900375366211, -12.605424880981445, -11.571846008300781, -10.538267135620117, -9.504687309265137, -8.471108436584473, -7.437529563903809, -6.403950214385986, -5.370370864868164, -4.3367919921875, -3.303212881088257, -2.2696337699890137, -1.2360546588897705, -0.20247554779052734, 0.8311033248901367, 1.864682674407959, 2.8982620239257812, 3.9318389892578125, 4.965417861938477, 5.998997211456299, 7.032576560974121, 8.066155433654785, 9.09973430633545, 10.13331413269043, 11.166893005371094, 12.200471878051758, 13.234050750732422, 14.267629623413086, 15.301209449768066, 16.334789276123047, 17.368366241455078, 18.401947021484375, 19.43552589416504, 20.469104766845703, 21.502683639526367, 22.53626251220703, 23.569841384887695, 24.60342025756836, 25.637001037597656, 26.67057991027832, 27.704158782958984, 28.73773765563965, 29.771316528320312, 30.804895401000977, 31.83847427368164, 32.87205505371094, 33.90563201904297, 34.939212799072266, 35.97279357910156, 37.006370544433594]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 16.0, 13.0, 27.0, 34.0, 50.0, 87.0, 128.0, 166.0, 304.0, 428.0, 698.0, 1123.0, 1688.0, 2581.0, 4002.0, 6166.0, 9802.0, 15540.0, 25132.0, 40750.0, 67654.0, 117542.0, 231785.0, 617734.0, 1318228.0, 990900.0, 360362.0, 157571.0, 87566.0, 51468.0, 30841.0, 19178.0, 12116.0, 7869.0, 5154.0, 3251.0, 2076.0, 1431.0, 880.0, 649.0, 442.0, 299.0, 193.0, 105.0, 73.0, 65.0, 36.0, 33.0, 21.0, 12.0, 8.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.4375, -42.99169921875, -41.5458984375, -40.10009765625, -38.654296875, -37.20849609375, -35.7626953125, -34.31689453125, -32.87109375, -31.42529296875, -29.9794921875, -28.53369140625, -27.087890625, -25.64208984375, -24.1962890625, -22.75048828125, -21.3046875, -19.85888671875, -18.4130859375, -16.96728515625, -15.521484375, -14.07568359375, -12.6298828125, -11.18408203125, -9.73828125, -8.29248046875, -6.8466796875, -5.40087890625, -3.955078125, -2.50927734375, -1.0634765625, 0.38232421875, 1.828125, 3.27392578125, 4.7197265625, 6.16552734375, 7.611328125, 9.05712890625, 10.5029296875, 11.94873046875, 13.39453125, 14.84033203125, 16.2861328125, 17.73193359375, 19.177734375, 20.62353515625, 22.0693359375, 23.51513671875, 24.9609375, 26.40673828125, 27.8525390625, 29.29833984375, 30.744140625, 32.18994140625, 33.6357421875, 35.08154296875, 36.52734375, 37.97314453125, 39.4189453125, 40.86474609375, 42.310546875, 43.75634765625, 45.2021484375, 46.64794921875, 48.09375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 3.0, 3.0, 3.0, 5.0, 7.0, 3.0, 5.0, 11.0, 9.0, 14.0, 9.0, 19.0, 14.0, 18.0, 16.0, 31.0, 22.0, 24.0, 31.0, 25.0, 36.0, 31.0, 40.0, 31.0, 28.0, 35.0, 35.0, 30.0, 31.0, 31.0, 27.0, 39.0, 29.0, 35.0, 30.0, 28.0, 17.0, 27.0, 20.0, 25.0, 16.0, 13.0, 15.0, 14.0, 17.0, 10.0, 4.0, 8.0, 7.0, 5.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-21.125, -20.416748046875, -19.70849609375, -19.000244140625, -18.2919921875, -17.583740234375, -16.87548828125, -16.167236328125, -15.458984375, -14.750732421875, -14.04248046875, -13.334228515625, -12.6259765625, -11.917724609375, -11.20947265625, -10.501220703125, -9.79296875, -9.084716796875, -8.37646484375, -7.668212890625, -6.9599609375, -6.251708984375, -5.54345703125, -4.835205078125, -4.126953125, -3.418701171875, -2.71044921875, -2.002197265625, -1.2939453125, -0.585693359375, 0.12255859375, 0.830810546875, 1.5390625, 2.247314453125, 2.95556640625, 3.663818359375, 4.3720703125, 5.080322265625, 5.78857421875, 6.496826171875, 7.205078125, 7.913330078125, 8.62158203125, 9.329833984375, 10.0380859375, 10.746337890625, 11.45458984375, 12.162841796875, 12.87109375, 13.579345703125, 14.28759765625, 14.995849609375, 15.7041015625, 16.412353515625, 17.12060546875, 17.828857421875, 18.537109375, 19.245361328125, 19.95361328125, 20.661865234375, 21.3701171875, 22.078369140625, 22.78662109375, 23.494873046875, 24.203125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 9.0, 7.0, 27.0, 25.0, 45.0, 62.0, 111.0, 175.0, 249.0, 424.0, 659.0, 1031.0, 1725.0, 2614.0, 4151.0, 6657.0, 10535.0, 17375.0, 29072.0, 49718.0, 88380.0, 161577.0, 313095.0, 655174.0, 1302478.0, 770142.0, 358368.0, 182427.0, 98916.0, 55792.0, 32639.0, 19449.0, 11873.0, 7259.0, 4518.0, 2802.0, 1706.0, 1069.0, 696.0, 446.0, 291.0, 181.0, 130.0, 64.0, 58.0, 36.0, 15.0, 15.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-41.59375, -40.234375, -38.875, -37.515625, -36.15625, -34.796875, -33.4375, -32.078125, -30.71875, -29.359375, -28.0, -26.640625, -25.28125, -23.921875, -22.5625, -21.203125, -19.84375, -18.484375, -17.125, -15.765625, -14.40625, -13.046875, -11.6875, -10.328125, -8.96875, -7.609375, -6.25, -4.890625, -3.53125, -2.171875, -0.8125, 0.546875, 1.90625, 3.265625, 4.625, 5.984375, 7.34375, 8.703125, 10.0625, 11.421875, 12.78125, 14.140625, 15.5, 16.859375, 18.21875, 19.578125, 20.9375, 22.296875, 23.65625, 25.015625, 26.375, 27.734375, 29.09375, 30.453125, 31.8125, 33.171875, 34.53125, 35.890625, 37.25, 38.609375, 39.96875, 41.328125, 42.6875, 44.046875, 45.40625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 11.0, 19.0, 12.0, 27.0, 25.0, 34.0, 47.0, 43.0, 69.0, 72.0, 103.0, 103.0, 113.0, 163.0, 183.0, 196.0, 225.0, 287.0, 341.0, 328.0, 263.0, 228.0, 199.0, 162.0, 119.0, 115.0, 91.0, 80.0, 56.0, 62.0, 59.0, 37.0, 36.0, 30.0, 21.0, 17.0, 16.0, 16.0, 15.0, 10.0, 11.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-12.703125, -12.2608642578125, -11.818603515625, -11.3763427734375, -10.93408203125, -10.4918212890625, -10.049560546875, -9.6072998046875, -9.1650390625, -8.7227783203125, -8.280517578125, -7.8382568359375, -7.39599609375, -6.9537353515625, -6.511474609375, -6.0692138671875, -5.626953125, -5.1846923828125, -4.742431640625, -4.3001708984375, -3.85791015625, -3.4156494140625, -2.973388671875, -2.5311279296875, -2.0888671875, -1.6466064453125, -1.204345703125, -0.7620849609375, -0.31982421875, 0.1224365234375, 0.564697265625, 1.0069580078125, 1.44921875, 1.8914794921875, 2.333740234375, 2.7760009765625, 3.21826171875, 3.6605224609375, 4.102783203125, 4.5450439453125, 4.9873046875, 5.4295654296875, 5.871826171875, 6.3140869140625, 6.75634765625, 7.1986083984375, 7.640869140625, 8.0831298828125, 8.525390625, 8.9676513671875, 9.409912109375, 9.8521728515625, 10.29443359375, 10.7366943359375, 11.178955078125, 11.6212158203125, 12.0634765625, 12.5057373046875, 12.947998046875, 13.3902587890625, 13.83251953125, 14.2747802734375, 14.717041015625, 15.1593017578125, 15.6015625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 5.0, 8.0, 6.0, 3.0, 10.0, 10.0, 16.0, 23.0, 27.0, 31.0, 27.0, 39.0, 56.0, 67.0, 61.0, 74.0, 92.0, 66.0, 71.0, 47.0, 39.0, 46.0, 29.0, 28.0, 24.0, 25.0, 15.0, 14.0, 10.0, 3.0, 3.0, 6.0, 6.0, 3.0, 4.0, 0.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.743953704833984, -42.50876998901367, -41.27358627319336, -40.03840255737305, -38.80321502685547, -37.568031311035156, -36.332847595214844, -35.09766387939453, -33.86248016357422, -32.627296447753906, -31.392112731933594, -30.15692710876465, -28.921743392944336, -27.686559677124023, -26.451374053955078, -25.216190338134766, -23.981006622314453, -22.74582290649414, -21.510639190673828, -20.275453567504883, -19.04026985168457, -17.805086135864258, -16.569900512695312, -15.334716796875, -14.099533081054688, -12.864349365234375, -11.629164695739746, -10.393980026245117, -9.158796310424805, -7.923612117767334, -6.688427925109863, -5.453243255615234, -4.2180633544921875, -2.982879161834717, -1.747694969177246, -0.5125107765197754, 0.7226734161376953, 1.957857608795166, 3.1930418014526367, 4.428226470947266, 5.663410186767578, 6.898594379425049, 8.13377857208252, 9.368963241577148, 10.604146957397461, 11.839330673217773, 13.074515342712402, 14.309700012207031, 15.544883728027344, 16.780067443847656, 18.01525115966797, 19.250436782836914, 20.485620498657227, 21.72080421447754, 22.955989837646484, 24.191173553466797, 25.42635726928711, 26.661540985107422, 27.896724700927734, 29.13191032409668, 30.367094039916992, 31.602277755737305, 32.83746337890625, 34.07264709472656, 35.307830810546875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 5.0, 6.0, 9.0, 13.0, 11.0, 18.0, 6.0, 16.0, 6.0, 15.0, 25.0, 25.0, 20.0, 28.0, 23.0, 24.0, 19.0, 31.0, 38.0, 34.0, 27.0, 33.0, 44.0, 35.0, 31.0, 34.0, 32.0, 30.0, 29.0, 29.0, 33.0, 29.0, 13.0, 29.0, 25.0, 23.0, 18.0, 16.0, 27.0, 18.0, 12.0, 11.0, 10.0, 5.0, 4.0, 7.0, 1.0, 3.0, 4.0, 8.0, 4.0, 3.0, 0.0, 2.0, 4.0], "bins": [-25.17343521118164, -24.404706954956055, -23.63597869873047, -22.867250442504883, -22.098522186279297, -21.32979393005371, -20.561065673828125, -19.792339324951172, -19.023609161376953, -18.254880905151367, -17.48615264892578, -16.717424392700195, -15.94869613647461, -15.179967880249023, -14.411240577697754, -13.642512321472168, -12.873785018920898, -12.105056762695312, -11.336328506469727, -10.56760025024414, -9.798871994018555, -9.030143737792969, -8.2614164352417, -7.492688179016113, -6.723959922790527, -5.955231666564941, -5.1865034103393555, -4.417775630950928, -3.649047374725342, -2.880319118499756, -2.111591339111328, -1.3428630828857422, -0.5741329193115234, 0.19459521770477295, 0.9633233547210693, 1.7320513725280762, 2.500779628753662, 3.269507884979248, 4.038235664367676, 4.806963920593262, 5.575692176818848, 6.344420433044434, 7.1131486892700195, 7.881876468658447, 8.650604248046875, 9.419332504272461, 10.188060760498047, 10.956789016723633, 11.725517272949219, 12.494245529174805, 13.26297378540039, 14.031702041625977, 14.800430297851562, 15.569158554077148, 16.337886810302734, 17.106613159179688, 17.875343322753906, 18.644071578979492, 19.412799835205078, 20.181528091430664, 20.95025634765625, 21.718984603881836, 22.487712860107422, 23.256439208984375, 24.02516746520996]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 9.0, 6.0, 29.0, 40.0, 38.0, 63.0, 96.0, 124.0, 197.0, 285.0, 466.0, 661.0, 987.0, 1568.0, 2177.0, 3177.0, 4867.0, 7203.0, 10921.0, 16583.0, 25337.0, 39978.0, 62421.0, 98881.0, 160276.0, 216200.0, 143674.0, 90224.0, 56925.0, 36410.0, 23231.0, 15191.0, 10038.0, 6616.0, 4520.0, 2961.0, 2022.0, 1414.0, 969.0, 641.0, 406.0, 223.0, 169.0, 114.0, 73.0, 51.0, 40.0, 20.0, 14.0, 6.0, 8.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-12.625, -12.180419921875, -11.73583984375, -11.291259765625, -10.8466796875, -10.402099609375, -9.95751953125, -9.512939453125, -9.068359375, -8.623779296875, -8.17919921875, -7.734619140625, -7.2900390625, -6.845458984375, -6.40087890625, -5.956298828125, -5.51171875, -5.067138671875, -4.62255859375, -4.177978515625, -3.7333984375, -3.288818359375, -2.84423828125, -2.399658203125, -1.955078125, -1.510498046875, -1.06591796875, -0.621337890625, -0.1767578125, 0.267822265625, 0.71240234375, 1.156982421875, 1.6015625, 2.046142578125, 2.49072265625, 2.935302734375, 3.3798828125, 3.824462890625, 4.26904296875, 4.713623046875, 5.158203125, 5.602783203125, 6.04736328125, 6.491943359375, 6.9365234375, 7.381103515625, 7.82568359375, 8.270263671875, 8.71484375, 9.159423828125, 9.60400390625, 10.048583984375, 10.4931640625, 10.937744140625, 11.38232421875, 11.826904296875, 12.271484375, 12.716064453125, 13.16064453125, 13.605224609375, 14.0498046875, 14.494384765625, 14.93896484375, 15.383544921875, 15.828125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 9.0, 10.0, 10.0, 11.0, 14.0, 14.0, 14.0, 13.0, 17.0, 18.0, 17.0, 22.0, 37.0, 31.0, 26.0, 34.0, 25.0, 21.0, 38.0, 47.0, 42.0, 46.0, 38.0, 26.0, 20.0, 31.0, 21.0, 36.0, 31.0, 25.0, 31.0, 20.0, 28.0, 26.0, 23.0, 19.0, 15.0, 14.0, 13.0, 15.0, 5.0, 5.0, 11.0, 3.0, 4.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0], "bins": [-26.640625, -25.825927734375, -25.01123046875, -24.196533203125, -23.3818359375, -22.567138671875, -21.75244140625, -20.937744140625, -20.123046875, -19.308349609375, -18.49365234375, -17.678955078125, -16.8642578125, -16.049560546875, -15.23486328125, -14.420166015625, -13.60546875, -12.790771484375, -11.97607421875, -11.161376953125, -10.3466796875, -9.531982421875, -8.71728515625, -7.902587890625, -7.087890625, -6.273193359375, -5.45849609375, -4.643798828125, -3.8291015625, -3.014404296875, -2.19970703125, -1.385009765625, -0.5703125, 0.244384765625, 1.05908203125, 1.873779296875, 2.6884765625, 3.503173828125, 4.31787109375, 5.132568359375, 5.947265625, 6.761962890625, 7.57666015625, 8.391357421875, 9.2060546875, 10.020751953125, 10.83544921875, 11.650146484375, 12.46484375, 13.279541015625, 14.09423828125, 14.908935546875, 15.7236328125, 16.538330078125, 17.35302734375, 18.167724609375, 18.982421875, 19.797119140625, 20.61181640625, 21.426513671875, 22.2412109375, 23.055908203125, 23.87060546875, 24.685302734375, 25.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 12.0, 9.0, 24.0, 28.0, 36.0, 69.0, 113.0, 195.0, 312.0, 489.0, 840.0, 1475.0, 2573.0, 4464.0, 8361.0, 15911.0, 31395.0, 64279.0, 136360.0, 314868.0, 248592.0, 110472.0, 52347.0, 25835.0, 13167.0, 7112.0, 3900.0, 2170.0, 1232.0, 735.0, 465.0, 270.0, 172.0, 76.0, 58.0, 39.0, 33.0, 20.0, 14.0, 6.0, 11.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.254638671875, -16.58740234375, -15.920166015625, -15.2529296875, -14.585693359375, -13.91845703125, -13.251220703125, -12.583984375, -11.916748046875, -11.24951171875, -10.582275390625, -9.9150390625, -9.247802734375, -8.58056640625, -7.913330078125, -7.24609375, -6.578857421875, -5.91162109375, -5.244384765625, -4.5771484375, -3.909912109375, -3.24267578125, -2.575439453125, -1.908203125, -1.240966796875, -0.57373046875, 0.093505859375, 0.7607421875, 1.427978515625, 2.09521484375, 2.762451171875, 3.4296875, 4.096923828125, 4.76416015625, 5.431396484375, 6.0986328125, 6.765869140625, 7.43310546875, 8.100341796875, 8.767578125, 9.434814453125, 10.10205078125, 10.769287109375, 11.4365234375, 12.103759765625, 12.77099609375, 13.438232421875, 14.10546875, 14.772705078125, 15.43994140625, 16.107177734375, 16.7744140625, 17.441650390625, 18.10888671875, 18.776123046875, 19.443359375, 20.110595703125, 20.77783203125, 21.445068359375, 22.1123046875, 22.779541015625, 23.44677734375, 24.114013671875, 24.78125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 10.0, 8.0, 8.0, 11.0, 13.0, 13.0, 14.0, 21.0, 24.0, 27.0, 19.0, 18.0, 30.0, 23.0, 34.0, 33.0, 33.0, 39.0, 34.0, 36.0, 38.0, 55.0, 44.0, 36.0, 32.0, 31.0, 31.0, 22.0, 33.0, 18.0, 28.0, 20.0, 18.0, 32.0, 15.0, 12.0, 15.0, 14.0, 9.0, 6.0, 6.0, 3.0, 6.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0], "bins": [-19.890625, -19.33984375, -18.7890625, -18.23828125, -17.6875, -17.13671875, -16.5859375, -16.03515625, -15.484375, -14.93359375, -14.3828125, -13.83203125, -13.28125, -12.73046875, -12.1796875, -11.62890625, -11.078125, -10.52734375, -9.9765625, -9.42578125, -8.875, -8.32421875, -7.7734375, -7.22265625, -6.671875, -6.12109375, -5.5703125, -5.01953125, -4.46875, -3.91796875, -3.3671875, -2.81640625, -2.265625, -1.71484375, -1.1640625, -0.61328125, -0.0625, 0.48828125, 1.0390625, 1.58984375, 2.140625, 2.69140625, 3.2421875, 3.79296875, 4.34375, 4.89453125, 5.4453125, 5.99609375, 6.546875, 7.09765625, 7.6484375, 8.19921875, 8.75, 9.30078125, 9.8515625, 10.40234375, 10.953125, 11.50390625, 12.0546875, 12.60546875, 13.15625, 13.70703125, 14.2578125, 14.80859375, 15.359375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 3.0, 11.0, 12.0, 11.0, 26.0, 49.0, 62.0, 74.0, 126.0, 217.0, 350.0, 549.0, 1022.0, 1800.0, 3256.0, 6366.0, 12786.0, 28607.0, 73489.0, 236398.0, 452532.0, 141393.0, 48812.0, 20380.0, 9447.0, 4777.0, 2483.0, 1462.0, 806.0, 446.0, 291.0, 180.0, 115.0, 57.0, 45.0, 38.0, 22.0, 18.0, 10.0, 9.0, 2.0, 6.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25439453125, -0.2469768524169922, -0.23955917358398438, -0.23214149475097656, -0.22472381591796875, -0.21730613708496094, -0.20988845825195312, -0.2024707794189453, -0.1950531005859375, -0.1876354217529297, -0.18021774291992188, -0.17280006408691406, -0.16538238525390625, -0.15796470642089844, -0.15054702758789062, -0.1431293487548828, -0.135711669921875, -0.1282939910888672, -0.12087631225585938, -0.11345863342285156, -0.10604095458984375, -0.09862327575683594, -0.09120559692382812, -0.08378791809082031, -0.0763702392578125, -0.06895256042480469, -0.061534881591796875, -0.05411720275878906, -0.04669952392578125, -0.03928184509277344, -0.031864166259765625, -0.024446487426757812, -0.01702880859375, -0.009611129760742188, -0.002193450927734375, 0.0052242279052734375, 0.01264190673828125, 0.020059585571289062, 0.027477264404296875, 0.03489494323730469, 0.0423126220703125, 0.04973030090332031, 0.057147979736328125, 0.06456565856933594, 0.07198333740234375, 0.07940101623535156, 0.08681869506835938, 0.09423637390136719, 0.101654052734375, 0.10907173156738281, 0.11648941040039062, 0.12390708923339844, 0.13132476806640625, 0.13874244689941406, 0.14616012573242188, 0.1535778045654297, 0.1609954833984375, 0.1684131622314453, 0.17583084106445312, 0.18324851989746094, 0.19066619873046875, 0.19808387756347656, 0.20550155639648438, 0.2129192352294922, 0.2203369140625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 6.0, 7.0, 9.0, 11.0, 8.0, 22.0, 21.0, 30.0, 40.0, 46.0, 70.0, 72.0, 110.0, 106.0, 81.0, 70.0, 60.0, 51.0, 40.0, 33.0, 23.0, 21.0, 10.0, 12.0, 6.0, 7.0, 8.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.64863395690918e-05, -8.402671664953232e-05, -8.156709372997284e-05, -7.910747081041336e-05, -7.664784789085388e-05, -7.41882249712944e-05, -7.172860205173492e-05, -6.926897913217545e-05, -6.680935621261597e-05, -6.434973329305649e-05, -6.189011037349701e-05, -5.943048745393753e-05, -5.697086453437805e-05, -5.451124161481857e-05, -5.2051618695259094e-05, -4.9591995775699615e-05, -4.713237285614014e-05, -4.467274993658066e-05, -4.221312701702118e-05, -3.97535040974617e-05, -3.729388117790222e-05, -3.483425825834274e-05, -3.2374635338783264e-05, -2.9915012419223785e-05, -2.7455389499664307e-05, -2.4995766580104828e-05, -2.253614366054535e-05, -2.007652074098587e-05, -1.761689782142639e-05, -1.5157274901866913e-05, -1.2697651982307434e-05, -1.0238029062747955e-05, -7.778406143188477e-06, -5.318783223628998e-06, -2.859160304069519e-06, -3.995373845100403e-07, 2.0600855350494385e-06, 4.519708454608917e-06, 6.979331374168396e-06, 9.438954293727875e-06, 1.1898577213287354e-05, 1.4358200132846832e-05, 1.681782305240631e-05, 1.927744597196579e-05, 2.173706889152527e-05, 2.4196691811084747e-05, 2.6656314730644226e-05, 2.9115937650203705e-05, 3.1575560569763184e-05, 3.403518348932266e-05, 3.649480640888214e-05, 3.895442932844162e-05, 4.14140522480011e-05, 4.387367516756058e-05, 4.6333298087120056e-05, 4.8792921006679535e-05, 5.1252543926239014e-05, 5.371216684579849e-05, 5.617178976535797e-05, 5.863141268491745e-05, 6.109103560447693e-05, 6.355065852403641e-05, 6.601028144359589e-05, 6.846990436315536e-05, 7.092952728271484e-05]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 7.0, 5.0, 4.0, 8.0, 13.0, 13.0, 24.0, 24.0, 42.0, 49.0, 82.0, 139.0, 231.0, 422.0, 805.0, 1492.0, 2990.0, 6046.0, 12183.0, 26646.0, 62038.0, 170939.0, 430650.0, 203736.0, 72423.0, 30031.0, 13878.0, 6626.0, 3370.0, 1631.0, 865.0, 477.0, 253.0, 144.0, 74.0, 60.0, 35.0, 26.0, 19.0, 16.0, 13.0, 10.0, 7.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.2548828125, -0.24771881103515625, -0.2405548095703125, -0.23339080810546875, -0.226226806640625, -0.21906280517578125, -0.2118988037109375, -0.20473480224609375, -0.19757080078125, -0.19040679931640625, -0.1832427978515625, -0.17607879638671875, -0.168914794921875, -0.16175079345703125, -0.1545867919921875, -0.14742279052734375, -0.1402587890625, -0.13309478759765625, -0.1259307861328125, -0.11876678466796875, -0.111602783203125, -0.10443878173828125, -0.0972747802734375, -0.09011077880859375, -0.08294677734375, -0.07578277587890625, -0.0686187744140625, -0.06145477294921875, -0.054290771484375, -0.04712677001953125, -0.0399627685546875, -0.03279876708984375, -0.025634765625, -0.01847076416015625, -0.0113067626953125, -0.00414276123046875, 0.003021240234375, 0.01018524169921875, 0.0173492431640625, 0.02451324462890625, 0.03167724609375, 0.03884124755859375, 0.0460052490234375, 0.05316925048828125, 0.060333251953125, 0.06749725341796875, 0.0746612548828125, 0.08182525634765625, 0.0889892578125, 0.09615325927734375, 0.1033172607421875, 0.11048126220703125, 0.117645263671875, 0.12480926513671875, 0.1319732666015625, 0.13913726806640625, 0.14630126953125, 0.15346527099609375, 0.1606292724609375, 0.16779327392578125, 0.174957275390625, 0.18212127685546875, 0.1892852783203125, 0.19644927978515625, 0.20361328125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 7.0, 11.0, 14.0, 24.0, 18.0, 32.0, 42.0, 45.0, 50.0, 55.0, 75.0, 119.0, 87.0, 71.0, 53.0, 50.0, 41.0, 42.0, 32.0, 20.0, 23.0, 20.0, 15.0, 8.0, 9.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08099365234375, -0.07905435562133789, -0.07711505889892578, -0.07517576217651367, -0.07323646545410156, -0.07129716873168945, -0.06935787200927734, -0.06741857528686523, -0.06547927856445312, -0.06353998184204102, -0.061600685119628906, -0.0596613883972168, -0.05772209167480469, -0.05578279495239258, -0.05384349822998047, -0.05190420150756836, -0.04996490478515625, -0.04802560806274414, -0.04608631134033203, -0.04414701461791992, -0.04220771789550781, -0.0402684211730957, -0.038329124450683594, -0.036389827728271484, -0.034450531005859375, -0.032511234283447266, -0.030571937561035156, -0.028632640838623047, -0.026693344116210938, -0.024754047393798828, -0.02281475067138672, -0.02087545394897461, -0.0189361572265625, -0.01699686050415039, -0.015057563781738281, -0.013118267059326172, -0.011178970336914062, -0.009239673614501953, -0.007300376892089844, -0.005361080169677734, -0.003421783447265625, -0.0014824867248535156, 0.00045680999755859375, 0.002396106719970703, 0.0043354034423828125, 0.006274700164794922, 0.008213996887207031, 0.01015329360961914, 0.01209259033203125, 0.01403188705444336, 0.01597118377685547, 0.017910480499267578, 0.019849777221679688, 0.021789073944091797, 0.023728370666503906, 0.025667667388916016, 0.027606964111328125, 0.029546260833740234, 0.031485557556152344, 0.03342485427856445, 0.03536415100097656, 0.03730344772338867, 0.03924274444580078, 0.04118204116821289, 0.043121337890625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 2.0, 1.0, 6.0, 3.0, 8.0, 5.0, 6.0, 16.0, 17.0, 18.0, 33.0, 22.0, 31.0, 46.0, 54.0, 59.0, 71.0, 74.0, 84.0, 78.0, 61.0, 50.0, 47.0, 38.0, 38.0, 27.0, 24.0, 18.0, 19.0, 9.0, 5.0, 4.0, 6.0, 4.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-44.175907135009766, -42.959068298339844, -41.742225646972656, -40.525386810302734, -39.30854797363281, -38.091705322265625, -36.8748664855957, -35.65802764892578, -34.441184997558594, -33.22434616088867, -32.007503509521484, -30.790664672851562, -29.573823928833008, -28.356983184814453, -27.14014434814453, -25.923303604125977, -24.706462860107422, -23.489622116088867, -22.272781372070312, -21.05594253540039, -19.839101791381836, -18.62226104736328, -17.40542221069336, -16.188581466674805, -14.97174072265625, -13.754899978637695, -12.538060188293457, -11.321220397949219, -10.104379653930664, -8.88753890991211, -7.670699119567871, -6.453859329223633, -5.237022399902344, -4.020182132720947, -2.803341865539551, -1.5865015983581543, -0.3696613311767578, 0.8471789360046387, 2.064019203186035, 3.2808589935302734, 4.497699737548828, 5.714540004730225, 6.931380271911621, 8.14822006225586, 9.365060806274414, 10.581901550292969, 11.798741340637207, 13.015581130981445, 14.232421875, 15.449262619018555, 16.66610336303711, 17.88294219970703, 19.099782943725586, 20.31662368774414, 21.533462524414062, 22.750303268432617, 23.967144012451172, 25.183984756469727, 26.40082550048828, 27.617664337158203, 28.834505081176758, 30.051345825195312, 31.268184661865234, 32.485023498535156, 33.701866149902344]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 7.0, 7.0, 8.0, 15.0, 8.0, 18.0, 9.0, 12.0, 9.0, 21.0, 19.0, 23.0, 24.0, 24.0, 23.0, 27.0, 19.0, 31.0, 37.0, 31.0, 31.0, 30.0, 45.0, 32.0, 31.0, 36.0, 28.0, 31.0, 31.0, 27.0, 31.0, 31.0, 15.0, 28.0, 25.0, 22.0, 17.0, 17.0, 25.0, 20.0, 9.0, 14.0, 8.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 7.0, 4.0, 4.0, 1.0, 0.0, 6.0], "bins": [-24.003742218017578, -23.267955780029297, -22.53217124938965, -21.796384811401367, -21.060598373413086, -20.324813842773438, -19.589027404785156, -18.853240966796875, -18.117454528808594, -17.381668090820312, -16.645883560180664, -15.910097122192383, -15.174310684204102, -14.438525199890137, -13.702739715576172, -12.96695327758789, -12.231168746948242, -11.495383262634277, -10.759596824645996, -10.023811340332031, -9.28802490234375, -8.552239418029785, -7.81645393371582, -7.080667972564697, -6.344882011413574, -5.609096050262451, -4.873310089111328, -4.137524604797363, -3.4017386436462402, -2.665952682495117, -1.9301671981811523, -1.1943812370300293, -0.45859718322753906, 0.27718865871429443, 1.012974500656128, 1.7487602233886719, 2.484546184539795, 3.220332145690918, 3.956117630004883, 4.691903591156006, 5.427689552307129, 6.163475513458252, 6.899261474609375, 7.63504695892334, 8.370832443237305, 9.106618881225586, 9.84240436553955, 10.578189849853516, 11.313976287841797, 12.049761772155762, 12.785548210144043, 13.521333694458008, 14.257120132446289, 14.992905616760254, 15.728691101074219, 16.4644775390625, 17.20026397705078, 17.936050415039062, 18.67183494567871, 19.407621383666992, 20.143407821655273, 20.879192352294922, 21.614978790283203, 22.350765228271484, 23.086549758911133]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 5.0, 6.0, 11.0, 14.0, 26.0, 31.0, 44.0, 72.0, 95.0, 161.0, 228.0, 315.0, 499.0, 734.0, 970.0, 1401.0, 2255.0, 2967.0, 4391.0, 6277.0, 9150.0, 13672.0, 20203.0, 30069.0, 44607.0, 65831.0, 93834.0, 126083.0, 149204.0, 136889.0, 105266.0, 74791.0, 51080.0, 34587.0, 23176.0, 15766.0, 10649.0, 7286.0, 4881.0, 3392.0, 2300.0, 1685.0, 1156.0, 786.0, 545.0, 394.0, 252.0, 177.0, 122.0, 71.0, 61.0, 29.0, 23.0, 16.0, 11.0, 7.0, 5.0, 7.0, 3.0, 2.0], "bins": [-39.4375, -38.23046875, -37.0234375, -35.81640625, -34.609375, -33.40234375, -32.1953125, -30.98828125, -29.78125, -28.57421875, -27.3671875, -26.16015625, -24.953125, -23.74609375, -22.5390625, -21.33203125, -20.125, -18.91796875, -17.7109375, -16.50390625, -15.296875, -14.08984375, -12.8828125, -11.67578125, -10.46875, -9.26171875, -8.0546875, -6.84765625, -5.640625, -4.43359375, -3.2265625, -2.01953125, -0.8125, 0.39453125, 1.6015625, 2.80859375, 4.015625, 5.22265625, 6.4296875, 7.63671875, 8.84375, 10.05078125, 11.2578125, 12.46484375, 13.671875, 14.87890625, 16.0859375, 17.29296875, 18.5, 19.70703125, 20.9140625, 22.12109375, 23.328125, 24.53515625, 25.7421875, 26.94921875, 28.15625, 29.36328125, 30.5703125, 31.77734375, 32.984375, 34.19140625, 35.3984375, 36.60546875, 37.8125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 3.0, 4.0, 7.0, 12.0, 17.0, 17.0, 12.0, 19.0, 11.0, 19.0, 17.0, 19.0, 29.0, 25.0, 29.0, 33.0, 27.0, 30.0, 39.0, 30.0, 38.0, 30.0, 30.0, 37.0, 39.0, 36.0, 35.0, 33.0, 30.0, 27.0, 32.0, 28.0, 20.0, 31.0, 22.0, 21.0, 18.0, 28.0, 5.0, 10.0, 7.0, 5.0, 6.0, 7.0, 6.0, 5.0, 0.0, 4.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0], "bins": [-21.9375, -21.259521484375, -20.58154296875, -19.903564453125, -19.2255859375, -18.547607421875, -17.86962890625, -17.191650390625, -16.513671875, -15.835693359375, -15.15771484375, -14.479736328125, -13.8017578125, -13.123779296875, -12.44580078125, -11.767822265625, -11.08984375, -10.411865234375, -9.73388671875, -9.055908203125, -8.3779296875, -7.699951171875, -7.02197265625, -6.343994140625, -5.666015625, -4.988037109375, -4.31005859375, -3.632080078125, -2.9541015625, -2.276123046875, -1.59814453125, -0.920166015625, -0.2421875, 0.435791015625, 1.11376953125, 1.791748046875, 2.4697265625, 3.147705078125, 3.82568359375, 4.503662109375, 5.181640625, 5.859619140625, 6.53759765625, 7.215576171875, 7.8935546875, 8.571533203125, 9.24951171875, 9.927490234375, 10.60546875, 11.283447265625, 11.96142578125, 12.639404296875, 13.3173828125, 13.995361328125, 14.67333984375, 15.351318359375, 16.029296875, 16.707275390625, 17.38525390625, 18.063232421875, 18.7412109375, 19.419189453125, 20.09716796875, 20.775146484375, 21.453125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 4.0, 14.0, 17.0, 42.0, 36.0, 60.0, 97.0, 135.0, 199.0, 305.0, 462.0, 728.0, 1064.0, 1672.0, 2724.0, 4390.0, 6874.0, 11175.0, 17956.0, 29193.0, 48172.0, 78375.0, 125358.0, 179145.0, 186770.0, 133830.0, 84297.0, 51882.0, 31841.0, 19428.0, 12240.0, 7363.0, 4636.0, 2908.0, 1796.0, 1152.0, 719.0, 509.0, 316.0, 223.0, 139.0, 86.0, 62.0, 55.0, 29.0, 22.0, 13.0, 11.0, 11.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0], "bins": [-44.5625, -43.17333984375, -41.7841796875, -40.39501953125, -39.005859375, -37.61669921875, -36.2275390625, -34.83837890625, -33.44921875, -32.06005859375, -30.6708984375, -29.28173828125, -27.892578125, -26.50341796875, -25.1142578125, -23.72509765625, -22.3359375, -20.94677734375, -19.5576171875, -18.16845703125, -16.779296875, -15.39013671875, -14.0009765625, -12.61181640625, -11.22265625, -9.83349609375, -8.4443359375, -7.05517578125, -5.666015625, -4.27685546875, -2.8876953125, -1.49853515625, -0.109375, 1.27978515625, 2.6689453125, 4.05810546875, 5.447265625, 6.83642578125, 8.2255859375, 9.61474609375, 11.00390625, 12.39306640625, 13.7822265625, 15.17138671875, 16.560546875, 17.94970703125, 19.3388671875, 20.72802734375, 22.1171875, 23.50634765625, 24.8955078125, 26.28466796875, 27.673828125, 29.06298828125, 30.4521484375, 31.84130859375, 33.23046875, 34.61962890625, 36.0087890625, 37.39794921875, 38.787109375, 40.17626953125, 41.5654296875, 42.95458984375, 44.34375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 11.0, 6.0, 8.0, 9.0, 21.0, 13.0, 19.0, 15.0, 25.0, 43.0, 31.0, 36.0, 32.0, 33.0, 34.0, 46.0, 46.0, 41.0, 49.0, 51.0, 33.0, 40.0, 37.0, 39.0, 29.0, 37.0, 24.0, 25.0, 26.0, 23.0, 25.0, 20.0, 11.0, 12.0, 11.0, 15.0, 6.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.46875, -14.96435546875, -14.4599609375, -13.95556640625, -13.451171875, -12.94677734375, -12.4423828125, -11.93798828125, -11.43359375, -10.92919921875, -10.4248046875, -9.92041015625, -9.416015625, -8.91162109375, -8.4072265625, -7.90283203125, -7.3984375, -6.89404296875, -6.3896484375, -5.88525390625, -5.380859375, -4.87646484375, -4.3720703125, -3.86767578125, -3.36328125, -2.85888671875, -2.3544921875, -1.85009765625, -1.345703125, -0.84130859375, -0.3369140625, 0.16748046875, 0.671875, 1.17626953125, 1.6806640625, 2.18505859375, 2.689453125, 3.19384765625, 3.6982421875, 4.20263671875, 4.70703125, 5.21142578125, 5.7158203125, 6.22021484375, 6.724609375, 7.22900390625, 7.7333984375, 8.23779296875, 8.7421875, 9.24658203125, 9.7509765625, 10.25537109375, 10.759765625, 11.26416015625, 11.7685546875, 12.27294921875, 12.77734375, 13.28173828125, 13.7861328125, 14.29052734375, 14.794921875, 15.29931640625, 15.8037109375, 16.30810546875, 16.8125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 4.0, 11.0, 12.0, 13.0, 28.0, 39.0, 61.0, 90.0, 131.0, 251.0, 421.0, 794.0, 1396.0, 2892.0, 5869.0, 12946.0, 33290.0, 109708.0, 547816.0, 239157.0, 56666.0, 19979.0, 8604.0, 3945.0, 2003.0, 1017.0, 576.0, 331.0, 183.0, 106.0, 59.0, 42.0, 31.0, 25.0, 20.0, 12.0, 9.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.109375, -13.7032470703125, -13.297119140625, -12.8909912109375, -12.48486328125, -12.0787353515625, -11.672607421875, -11.2664794921875, -10.8603515625, -10.4542236328125, -10.048095703125, -9.6419677734375, -9.23583984375, -8.8297119140625, -8.423583984375, -8.0174560546875, -7.611328125, -7.2052001953125, -6.799072265625, -6.3929443359375, -5.98681640625, -5.5806884765625, -5.174560546875, -4.7684326171875, -4.3623046875, -3.9561767578125, -3.550048828125, -3.1439208984375, -2.73779296875, -2.3316650390625, -1.925537109375, -1.5194091796875, -1.11328125, -0.7071533203125, -0.301025390625, 0.1051025390625, 0.51123046875, 0.9173583984375, 1.323486328125, 1.7296142578125, 2.1357421875, 2.5418701171875, 2.947998046875, 3.3541259765625, 3.76025390625, 4.1663818359375, 4.572509765625, 4.9786376953125, 5.384765625, 5.7908935546875, 6.197021484375, 6.6031494140625, 7.00927734375, 7.4154052734375, 7.821533203125, 8.2276611328125, 8.6337890625, 9.0399169921875, 9.446044921875, 9.8521728515625, 10.25830078125, 10.6644287109375, 11.070556640625, 11.4766845703125, 11.8828125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 11.0, 24.0, 38.0, 72.0, 151.0, 328.0, 184.0, 103.0, 46.0, 19.0, 12.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002414703369140625, -0.002357989549636841, -0.0023012757301330566, -0.0022445619106292725, -0.0021878480911254883, -0.002131134271621704, -0.00207442045211792, -0.0020177066326141357, -0.0019609928131103516, -0.0019042789936065674, -0.0018475651741027832, -0.001790851354598999, -0.0017341375350952148, -0.0016774237155914307, -0.0016207098960876465, -0.0015639960765838623, -0.0015072822570800781, -0.001450568437576294, -0.0013938546180725098, -0.0013371407985687256, -0.0012804269790649414, -0.0012237131595611572, -0.001166999340057373, -0.0011102855205535889, -0.0010535717010498047, -0.0009968578815460205, -0.0009401440620422363, -0.0008834302425384521, -0.000826716423034668, -0.0007700026035308838, -0.0007132887840270996, -0.0006565749645233154, -0.0005998611450195312, -0.0005431473255157471, -0.0004864335060119629, -0.0004297196865081787, -0.00037300586700439453, -0.00031629204750061035, -0.00025957822799682617, -0.000202864408493042, -0.0001461505889892578, -8.943676948547363e-05, -3.272294998168945e-05, 2.3990869522094727e-05, 8.07046890258789e-05, 0.00013741850852966309, 0.00019413232803344727, 0.00025084614753723145, 0.0003075599670410156, 0.0003642737865447998, 0.000420987606048584, 0.00047770142555236816, 0.0005344152450561523, 0.0005911290645599365, 0.0006478428840637207, 0.0007045567035675049, 0.0007612705230712891, 0.0008179843425750732, 0.0008746981620788574, 0.0009314119815826416, 0.0009881258010864258, 0.00104483962059021, 0.0011015534400939941, 0.0011582672595977783, 0.0012149810791015625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 8.0, 9.0, 7.0, 16.0, 29.0, 29.0, 65.0, 71.0, 103.0, 164.0, 255.0, 311.0, 493.0, 761.0, 1150.0, 1913.0, 2944.0, 4938.0, 8698.0, 17133.0, 36089.0, 85743.0, 255403.0, 401009.0, 128820.0, 51457.0, 23233.0, 11456.0, 6293.0, 3598.0, 2194.0, 1412.0, 900.0, 593.0, 411.0, 270.0, 199.0, 113.0, 85.0, 56.0, 40.0, 35.0, 21.0, 10.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.736572265625, -8.46533203125, -8.194091796875, -7.9228515625, -7.651611328125, -7.38037109375, -7.109130859375, -6.837890625, -6.566650390625, -6.29541015625, -6.024169921875, -5.7529296875, -5.481689453125, -5.21044921875, -4.939208984375, -4.66796875, -4.396728515625, -4.12548828125, -3.854248046875, -3.5830078125, -3.311767578125, -3.04052734375, -2.769287109375, -2.498046875, -2.226806640625, -1.95556640625, -1.684326171875, -1.4130859375, -1.141845703125, -0.87060546875, -0.599365234375, -0.328125, -0.056884765625, 0.21435546875, 0.485595703125, 0.7568359375, 1.028076171875, 1.29931640625, 1.570556640625, 1.841796875, 2.113037109375, 2.38427734375, 2.655517578125, 2.9267578125, 3.197998046875, 3.46923828125, 3.740478515625, 4.01171875, 4.282958984375, 4.55419921875, 4.825439453125, 5.0966796875, 5.367919921875, 5.63916015625, 5.910400390625, 6.181640625, 6.452880859375, 6.72412109375, 6.995361328125, 7.2666015625, 7.537841796875, 7.80908203125, 8.080322265625, 8.3515625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 0.0, 0.0, 3.0, 12.0, 1.0, 7.0, 6.0, 9.0, 11.0, 11.0, 20.0, 41.0, 37.0, 47.0, 49.0, 63.0, 109.0, 84.0, 90.0, 75.0, 64.0, 58.0, 44.0, 34.0, 27.0, 26.0, 12.0, 12.0, 13.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.220703125, -2.141021728515625, -2.06134033203125, -1.981658935546875, -1.9019775390625, -1.822296142578125, -1.74261474609375, -1.662933349609375, -1.583251953125, -1.503570556640625, -1.42388916015625, -1.344207763671875, -1.2645263671875, -1.184844970703125, -1.10516357421875, -1.025482177734375, -0.94580078125, -0.866119384765625, -0.78643798828125, -0.706756591796875, -0.6270751953125, -0.547393798828125, -0.46771240234375, -0.388031005859375, -0.308349609375, -0.228668212890625, -0.14898681640625, -0.069305419921875, 0.0103759765625, 0.090057373046875, 0.16973876953125, 0.249420166015625, 0.3291015625, 0.408782958984375, 0.48846435546875, 0.568145751953125, 0.6478271484375, 0.727508544921875, 0.80718994140625, 0.886871337890625, 0.966552734375, 1.046234130859375, 1.12591552734375, 1.205596923828125, 1.2852783203125, 1.364959716796875, 1.44464111328125, 1.524322509765625, 1.60400390625, 1.683685302734375, 1.76336669921875, 1.843048095703125, 1.9227294921875, 2.002410888671875, 2.08209228515625, 2.161773681640625, 2.241455078125, 2.321136474609375, 2.40081787109375, 2.480499267578125, 2.5601806640625, 2.639862060546875, 2.71954345703125, 2.799224853515625, 2.87890625]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 3.0, 2.0, 7.0, 11.0, 16.0, 10.0, 20.0, 22.0, 13.0, 42.0, 42.0, 56.0, 56.0, 55.0, 67.0, 73.0, 77.0, 89.0, 53.0, 61.0, 52.0, 31.0, 16.0, 23.0, 19.0, 10.0, 17.0, 10.0, 4.0, 5.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.318138122558594, -33.239139556884766, -32.16014099121094, -31.081140518188477, -30.002140045166016, -28.923141479492188, -27.84414291381836, -26.76514434814453, -25.68614387512207, -24.607145309448242, -23.52814483642578, -22.449146270751953, -21.370147705078125, -20.291147232055664, -19.212148666381836, -18.133148193359375, -17.054149627685547, -15.975150108337402, -14.896150588989258, -13.81715202331543, -12.738152503967285, -11.65915298461914, -10.580154418945312, -9.501154899597168, -8.422155380249023, -7.343155860900879, -6.264156818389893, -5.185157775878906, -4.106158256530762, -3.027158737182617, -1.9481596946716309, -0.8691606521606445, 0.20983505249023438, 1.2888343334197998, 2.3678336143493652, 3.4468328952789307, 4.525832176208496, 5.604831695556641, 6.683830738067627, 7.762829780578613, 8.841829299926758, 9.920828819274902, 10.999828338623047, 12.078826904296875, 13.15782642364502, 14.236825942993164, 15.315824508666992, 16.394824981689453, 17.47382354736328, 18.55282211303711, 19.63182258605957, 20.7108211517334, 21.78982162475586, 22.868820190429688, 23.947818756103516, 25.026817321777344, 26.105817794799805, 27.184816360473633, 28.263816833496094, 29.342815399169922, 30.42181396484375, 31.50081443786621, 32.57981491088867, 33.6588134765625, 34.73781204223633]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 9.0, 7.0, 9.0, 12.0, 17.0, 14.0, 17.0, 16.0, 23.0, 27.0, 28.0, 21.0, 21.0, 29.0, 33.0, 26.0, 27.0, 35.0, 38.0, 43.0, 45.0, 39.0, 36.0, 33.0, 24.0, 47.0, 33.0, 40.0, 35.0, 30.0, 23.0, 18.0, 22.0, 14.0, 11.0, 15.0, 19.0, 12.0, 11.0, 10.0, 6.0, 6.0, 7.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.477584838867188, -21.7300968170166, -20.982608795166016, -20.235122680664062, -19.487634658813477, -18.74014663696289, -17.992660522460938, -17.24517250061035, -16.497684478759766, -15.75019645690918, -15.00270938873291, -14.25522232055664, -13.507734298706055, -12.760246276855469, -12.0127592086792, -11.26527214050293, -10.517784118652344, -9.770296096801758, -9.022809028625488, -8.275321960449219, -7.527833938598633, -6.780346393585205, -6.032858848571777, -5.28537130355835, -4.537883758544922, -3.790396213531494, -3.0429086685180664, -2.2954211235046387, -1.547933578491211, -0.8004460334777832, -0.05295848846435547, 0.6945290565490723, 1.4420166015625, 2.1895041465759277, 2.9369916915893555, 3.684479236602783, 4.431966781616211, 5.179454326629639, 5.926941871643066, 6.674429416656494, 7.421916961669922, 8.169404983520508, 8.916892051696777, 9.664379119873047, 10.411867141723633, 11.159355163574219, 11.906842231750488, 12.654329299926758, 13.401817321777344, 14.14930534362793, 14.8967924118042, 15.644279479980469, 16.391767501831055, 17.13925552368164, 17.886741638183594, 18.63422966003418, 19.381717681884766, 20.12920570373535, 20.876693725585938, 21.62417984008789, 22.371667861938477, 23.119155883789062, 23.866641998291016, 24.6141300201416, 25.361618041992188]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 15.0, 23.0, 50.0, 51.0, 87.0, 141.0, 249.0, 354.0, 564.0, 813.0, 1263.0, 1973.0, 3150.0, 4895.0, 7679.0, 12299.0, 19381.0, 31316.0, 50862.0, 86538.0, 156229.0, 332963.0, 836103.0, 1276014.0, 739474.0, 284349.0, 137817.0, 78425.0, 47141.0, 29366.0, 18667.0, 12070.0, 7949.0, 5182.0, 3533.0, 2312.0, 1589.0, 1124.0, 738.0, 473.0, 355.0, 225.0, 168.0, 95.0, 70.0, 43.0, 29.0, 16.0, 19.0, 12.0, 4.0, 10.0, 6.0, 2.0, 3.0], "bins": [-32.5625, -31.558349609375, -30.55419921875, -29.550048828125, -28.5458984375, -27.541748046875, -26.53759765625, -25.533447265625, -24.529296875, -23.525146484375, -22.52099609375, -21.516845703125, -20.5126953125, -19.508544921875, -18.50439453125, -17.500244140625, -16.49609375, -15.491943359375, -14.48779296875, -13.483642578125, -12.4794921875, -11.475341796875, -10.47119140625, -9.467041015625, -8.462890625, -7.458740234375, -6.45458984375, -5.450439453125, -4.4462890625, -3.442138671875, -2.43798828125, -1.433837890625, -0.4296875, 0.574462890625, 1.57861328125, 2.582763671875, 3.5869140625, 4.591064453125, 5.59521484375, 6.599365234375, 7.603515625, 8.607666015625, 9.61181640625, 10.615966796875, 11.6201171875, 12.624267578125, 13.62841796875, 14.632568359375, 15.63671875, 16.640869140625, 17.64501953125, 18.649169921875, 19.6533203125, 20.657470703125, 21.66162109375, 22.665771484375, 23.669921875, 24.674072265625, 25.67822265625, 26.682373046875, 27.6865234375, 28.690673828125, 29.69482421875, 30.698974609375, 31.703125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 10.0, 11.0, 10.0, 9.0, 17.0, 8.0, 27.0, 25.0, 20.0, 22.0, 22.0, 23.0, 30.0, 33.0, 36.0, 31.0, 32.0, 42.0, 44.0, 40.0, 47.0, 37.0, 33.0, 31.0, 44.0, 30.0, 34.0, 26.0, 22.0, 26.0, 19.0, 27.0, 19.0, 23.0, 18.0, 14.0, 14.0, 6.0, 5.0, 2.0, 7.0, 10.0, 3.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.1875, -17.581298828125, -16.97509765625, -16.368896484375, -15.7626953125, -15.156494140625, -14.55029296875, -13.944091796875, -13.337890625, -12.731689453125, -12.12548828125, -11.519287109375, -10.9130859375, -10.306884765625, -9.70068359375, -9.094482421875, -8.48828125, -7.882080078125, -7.27587890625, -6.669677734375, -6.0634765625, -5.457275390625, -4.85107421875, -4.244873046875, -3.638671875, -3.032470703125, -2.42626953125, -1.820068359375, -1.2138671875, -0.607666015625, -0.00146484375, 0.604736328125, 1.2109375, 1.817138671875, 2.42333984375, 3.029541015625, 3.6357421875, 4.241943359375, 4.84814453125, 5.454345703125, 6.060546875, 6.666748046875, 7.27294921875, 7.879150390625, 8.4853515625, 9.091552734375, 9.69775390625, 10.303955078125, 10.91015625, 11.516357421875, 12.12255859375, 12.728759765625, 13.3349609375, 13.941162109375, 14.54736328125, 15.153564453125, 15.759765625, 16.365966796875, 16.97216796875, 17.578369140625, 18.1845703125, 18.790771484375, 19.39697265625, 20.003173828125, 20.609375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 14.0, 12.0, 23.0, 43.0, 73.0, 110.0, 179.0, 284.0, 422.0, 695.0, 1057.0, 1768.0, 2798.0, 4808.0, 8005.0, 13991.0, 24077.0, 42921.0, 79233.0, 149716.0, 300985.0, 642647.0, 1271358.0, 848703.0, 388444.0, 190212.0, 98416.0, 52999.0, 29439.0, 16781.0, 9439.0, 5714.0, 3400.0, 2079.0, 1267.0, 796.0, 489.0, 313.0, 204.0, 106.0, 92.0, 52.0, 40.0, 25.0, 19.0, 9.0, 9.0, 3.0, 5.0, 1.0, 5.0, 0.0, 0.0, 3.0], "bins": [-34.875, -33.8076171875, -32.740234375, -31.6728515625, -30.60546875, -29.5380859375, -28.470703125, -27.4033203125, -26.3359375, -25.2685546875, -24.201171875, -23.1337890625, -22.06640625, -20.9990234375, -19.931640625, -18.8642578125, -17.796875, -16.7294921875, -15.662109375, -14.5947265625, -13.52734375, -12.4599609375, -11.392578125, -10.3251953125, -9.2578125, -8.1904296875, -7.123046875, -6.0556640625, -4.98828125, -3.9208984375, -2.853515625, -1.7861328125, -0.71875, 0.3486328125, 1.416015625, 2.4833984375, 3.55078125, 4.6181640625, 5.685546875, 6.7529296875, 7.8203125, 8.8876953125, 9.955078125, 11.0224609375, 12.08984375, 13.1572265625, 14.224609375, 15.2919921875, 16.359375, 17.4267578125, 18.494140625, 19.5615234375, 20.62890625, 21.6962890625, 22.763671875, 23.8310546875, 24.8984375, 25.9658203125, 27.033203125, 28.1005859375, 29.16796875, 30.2353515625, 31.302734375, 32.3701171875, 33.4375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 8.0, 10.0, 6.0, 13.0, 14.0, 20.0, 30.0, 30.0, 48.0, 63.0, 78.0, 112.0, 146.0, 144.0, 165.0, 203.0, 288.0, 324.0, 318.0, 343.0, 313.0, 254.0, 208.0, 162.0, 150.0, 114.0, 87.0, 89.0, 66.0, 64.0, 65.0, 36.0, 28.0, 23.0, 17.0, 9.0, 9.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.03125, -11.646484375, -11.26171875, -10.876953125, -10.4921875, -10.107421875, -9.72265625, -9.337890625, -8.953125, -8.568359375, -8.18359375, -7.798828125, -7.4140625, -7.029296875, -6.64453125, -6.259765625, -5.875, -5.490234375, -5.10546875, -4.720703125, -4.3359375, -3.951171875, -3.56640625, -3.181640625, -2.796875, -2.412109375, -2.02734375, -1.642578125, -1.2578125, -0.873046875, -0.48828125, -0.103515625, 0.28125, 0.666015625, 1.05078125, 1.435546875, 1.8203125, 2.205078125, 2.58984375, 2.974609375, 3.359375, 3.744140625, 4.12890625, 4.513671875, 4.8984375, 5.283203125, 5.66796875, 6.052734375, 6.4375, 6.822265625, 7.20703125, 7.591796875, 7.9765625, 8.361328125, 8.74609375, 9.130859375, 9.515625, 9.900390625, 10.28515625, 10.669921875, 11.0546875, 11.439453125, 11.82421875, 12.208984375, 12.59375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 11.0, 6.0, 6.0, 7.0, 8.0, 14.0, 17.0, 21.0, 31.0, 31.0, 37.0, 38.0, 55.0, 57.0, 73.0, 69.0, 69.0, 69.0, 53.0, 57.0, 39.0, 35.0, 41.0, 31.0, 20.0, 22.0, 17.0, 20.0, 8.0, 8.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.497220993041992, -25.67423439025879, -24.85124969482422, -24.028263092041016, -23.205276489257812, -22.38228988647461, -21.559303283691406, -20.736318588256836, -19.913331985473633, -19.09034538269043, -18.26736068725586, -17.444374084472656, -16.621387481689453, -15.79840087890625, -14.975415229797363, -14.152429580688477, -13.329442977905273, -12.50645637512207, -11.683470726013184, -10.860485076904297, -10.037498474121094, -9.21451187133789, -8.391526222229004, -7.568540096282959, -6.745553970336914, -5.922567844390869, -5.099581718444824, -4.276595592498779, -3.4536094665527344, -2.6306233406066895, -1.8076372146606445, -0.9846510887145996, -0.16166305541992188, 0.661323070526123, 1.484309196472168, 2.307295322418213, 3.130281448364258, 3.9532675743103027, 4.776253700256348, 5.599239826202393, 6.4222259521484375, 7.245212078094482, 8.068198204040527, 8.891183853149414, 9.714170455932617, 10.53715705871582, 11.360142707824707, 12.183128356933594, 13.006114959716797, 13.8291015625, 14.652087211608887, 15.475072860717773, 16.298059463500977, 17.12104606628418, 17.94403076171875, 18.767017364501953, 19.590003967285156, 20.41299057006836, 21.235977172851562, 22.058961868286133, 22.881948471069336, 23.70493507385254, 24.52791976928711, 25.350906372070312, 26.173892974853516]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 4.0, 7.0, 8.0, 13.0, 15.0, 16.0, 25.0, 15.0, 31.0, 30.0, 32.0, 27.0, 26.0, 28.0, 26.0, 33.0, 29.0, 31.0, 42.0, 36.0, 36.0, 33.0, 35.0, 28.0, 40.0, 33.0, 38.0, 26.0, 19.0, 31.0, 18.0, 23.0, 29.0, 17.0, 15.0, 14.0, 15.0, 15.0, 9.0, 6.0, 8.0, 3.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.677629470825195, -18.071374893188477, -17.465120315551758, -16.85886573791504, -16.252609252929688, -15.646355628967285, -15.04010009765625, -14.433845520019531, -13.827590942382812, -13.221336364746094, -12.615081787109375, -12.00882625579834, -11.402571678161621, -10.796317100524902, -10.190061569213867, -9.583806991577148, -8.97755241394043, -8.371297836303711, -7.765042781829834, -7.158787727355957, -6.552533149719238, -5.9462785720825195, -5.340023517608643, -4.733768463134766, -4.127513885498047, -3.521259069442749, -2.915004253387451, -2.3087494373321533, -1.7024946212768555, -1.0962398052215576, -0.48998498916625977, 0.11627006530761719, 0.7225246429443359, 1.3287794589996338, 1.9350342750549316, 2.5412890911102295, 3.1475439071655273, 3.753798723220825, 4.360053539276123, 4.96630859375, 5.572563171386719, 6.1788177490234375, 6.7850728034973145, 7.391327857971191, 7.99758243560791, 8.603837013244629, 9.210092544555664, 9.816347122192383, 10.422601699829102, 11.02885627746582, 11.635110855102539, 12.241366386413574, 12.847620964050293, 13.453875541687012, 14.060131072998047, 14.666385650634766, 15.272640228271484, 15.878894805908203, 16.485149383544922, 17.09140396118164, 17.69765853881836, 18.30391502380371, 18.91016960144043, 19.51642417907715, 20.122678756713867]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 1.0, 14.0, 15.0, 18.0, 30.0, 53.0, 85.0, 90.0, 157.0, 171.0, 284.0, 384.0, 599.0, 860.0, 1263.0, 1877.0, 2726.0, 4097.0, 6063.0, 9324.0, 13911.0, 21216.0, 32599.0, 50886.0, 80124.0, 126619.0, 194540.0, 179443.0, 114817.0, 72603.0, 46054.0, 29731.0, 19457.0, 12559.0, 8448.0, 5755.0, 3693.0, 2521.0, 1723.0, 1154.0, 824.0, 535.0, 407.0, 266.0, 160.0, 122.0, 99.0, 74.0, 24.0, 29.0, 17.0, 14.0, 9.0, 4.0, 4.0, 4.0, 4.0, 2.0], "bins": [-10.3359375, -10.021728515625, -9.70751953125, -9.393310546875, -9.0791015625, -8.764892578125, -8.45068359375, -8.136474609375, -7.822265625, -7.508056640625, -7.19384765625, -6.879638671875, -6.5654296875, -6.251220703125, -5.93701171875, -5.622802734375, -5.30859375, -4.994384765625, -4.68017578125, -4.365966796875, -4.0517578125, -3.737548828125, -3.42333984375, -3.109130859375, -2.794921875, -2.480712890625, -2.16650390625, -1.852294921875, -1.5380859375, -1.223876953125, -0.90966796875, -0.595458984375, -0.28125, 0.032958984375, 0.34716796875, 0.661376953125, 0.9755859375, 1.289794921875, 1.60400390625, 1.918212890625, 2.232421875, 2.546630859375, 2.86083984375, 3.175048828125, 3.4892578125, 3.803466796875, 4.11767578125, 4.431884765625, 4.74609375, 5.060302734375, 5.37451171875, 5.688720703125, 6.0029296875, 6.317138671875, 6.63134765625, 6.945556640625, 7.259765625, 7.573974609375, 7.88818359375, 8.202392578125, 8.5166015625, 8.830810546875, 9.14501953125, 9.459228515625, 9.7734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 3.0, 2.0, 4.0, 6.0, 8.0, 8.0, 16.0, 12.0, 17.0, 18.0, 26.0, 20.0, 21.0, 25.0, 32.0, 42.0, 24.0, 26.0, 40.0, 27.0, 35.0, 35.0, 39.0, 39.0, 31.0, 33.0, 27.0, 32.0, 34.0, 22.0, 31.0, 27.0, 23.0, 33.0, 26.0, 16.0, 16.0, 14.0, 15.0, 19.0, 10.0, 5.0, 18.0, 8.0, 6.0, 6.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-19.984375, -19.38330078125, -18.7822265625, -18.18115234375, -17.580078125, -16.97900390625, -16.3779296875, -15.77685546875, -15.17578125, -14.57470703125, -13.9736328125, -13.37255859375, -12.771484375, -12.17041015625, -11.5693359375, -10.96826171875, -10.3671875, -9.76611328125, -9.1650390625, -8.56396484375, -7.962890625, -7.36181640625, -6.7607421875, -6.15966796875, -5.55859375, -4.95751953125, -4.3564453125, -3.75537109375, -3.154296875, -2.55322265625, -1.9521484375, -1.35107421875, -0.75, -0.14892578125, 0.4521484375, 1.05322265625, 1.654296875, 2.25537109375, 2.8564453125, 3.45751953125, 4.05859375, 4.65966796875, 5.2607421875, 5.86181640625, 6.462890625, 7.06396484375, 7.6650390625, 8.26611328125, 8.8671875, 9.46826171875, 10.0693359375, 10.67041015625, 11.271484375, 11.87255859375, 12.4736328125, 13.07470703125, 13.67578125, 14.27685546875, 14.8779296875, 15.47900390625, 16.080078125, 16.68115234375, 17.2822265625, 17.88330078125, 18.484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 8.0, 15.0, 20.0, 28.0, 41.0, 67.0, 125.0, 198.0, 308.0, 522.0, 802.0, 1458.0, 2434.0, 4401.0, 8124.0, 15282.0, 30343.0, 61848.0, 131618.0, 310341.0, 258885.0, 112680.0, 53219.0, 26078.0, 13323.0, 7093.0, 3867.0, 2137.0, 1299.0, 736.0, 485.0, 252.0, 180.0, 107.0, 75.0, 44.0, 31.0, 22.0, 15.0, 12.0, 12.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.703125, -15.2108154296875, -14.718505859375, -14.2261962890625, -13.73388671875, -13.2415771484375, -12.749267578125, -12.2569580078125, -11.7646484375, -11.2723388671875, -10.780029296875, -10.2877197265625, -9.79541015625, -9.3031005859375, -8.810791015625, -8.3184814453125, -7.826171875, -7.3338623046875, -6.841552734375, -6.3492431640625, -5.85693359375, -5.3646240234375, -4.872314453125, -4.3800048828125, -3.8876953125, -3.3953857421875, -2.903076171875, -2.4107666015625, -1.91845703125, -1.4261474609375, -0.933837890625, -0.4415283203125, 0.05078125, 0.5430908203125, 1.035400390625, 1.5277099609375, 2.02001953125, 2.5123291015625, 3.004638671875, 3.4969482421875, 3.9892578125, 4.4815673828125, 4.973876953125, 5.4661865234375, 5.95849609375, 6.4508056640625, 6.943115234375, 7.4354248046875, 7.927734375, 8.4200439453125, 8.912353515625, 9.4046630859375, 9.89697265625, 10.3892822265625, 10.881591796875, 11.3739013671875, 11.8662109375, 12.3585205078125, 12.850830078125, 13.3431396484375, 13.83544921875, 14.3277587890625, 14.820068359375, 15.3123779296875, 15.8046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 8.0, 9.0, 12.0, 8.0, 13.0, 10.0, 23.0, 23.0, 30.0, 29.0, 21.0, 28.0, 32.0, 46.0, 42.0, 41.0, 37.0, 40.0, 37.0, 43.0, 44.0, 38.0, 39.0, 44.0, 25.0, 36.0, 34.0, 28.0, 20.0, 23.0, 13.0, 21.0, 16.0, 12.0, 15.0, 11.0, 3.0, 8.0, 12.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.359375, -13.91650390625, -13.4736328125, -13.03076171875, -12.587890625, -12.14501953125, -11.7021484375, -11.25927734375, -10.81640625, -10.37353515625, -9.9306640625, -9.48779296875, -9.044921875, -8.60205078125, -8.1591796875, -7.71630859375, -7.2734375, -6.83056640625, -6.3876953125, -5.94482421875, -5.501953125, -5.05908203125, -4.6162109375, -4.17333984375, -3.73046875, -3.28759765625, -2.8447265625, -2.40185546875, -1.958984375, -1.51611328125, -1.0732421875, -0.63037109375, -0.1875, 0.25537109375, 0.6982421875, 1.14111328125, 1.583984375, 2.02685546875, 2.4697265625, 2.91259765625, 3.35546875, 3.79833984375, 4.2412109375, 4.68408203125, 5.126953125, 5.56982421875, 6.0126953125, 6.45556640625, 6.8984375, 7.34130859375, 7.7841796875, 8.22705078125, 8.669921875, 9.11279296875, 9.5556640625, 9.99853515625, 10.44140625, 10.88427734375, 11.3271484375, 11.77001953125, 12.212890625, 12.65576171875, 13.0986328125, 13.54150390625, 13.984375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 14.0, 15.0, 27.0, 46.0, 44.0, 83.0, 111.0, 189.0, 284.0, 513.0, 802.0, 1455.0, 2617.0, 5115.0, 10294.0, 22551.0, 56891.0, 173605.0, 481358.0, 186187.0, 59868.0, 23980.0, 10753.0, 5215.0, 2754.0, 1538.0, 882.0, 495.0, 304.0, 206.0, 119.0, 86.0, 43.0, 37.0, 18.0, 15.0, 14.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2196044921875, -0.21305465698242188, -0.20650482177734375, -0.19995498657226562, -0.1934051513671875, -0.18685531616210938, -0.18030548095703125, -0.17375564575195312, -0.167205810546875, -0.16065597534179688, -0.15410614013671875, -0.14755630493164062, -0.1410064697265625, -0.13445663452148438, -0.12790679931640625, -0.12135696411132812, -0.11480712890625, -0.10825729370117188, -0.10170745849609375, -0.09515762329101562, -0.0886077880859375, -0.08205795288085938, -0.07550811767578125, -0.06895828247070312, -0.062408447265625, -0.055858612060546875, -0.04930877685546875, -0.042758941650390625, -0.0362091064453125, -0.029659271240234375, -0.02310943603515625, -0.016559600830078125, -0.010009765625, -0.003459930419921875, 0.00308990478515625, 0.009639739990234375, 0.0161895751953125, 0.022739410400390625, 0.02928924560546875, 0.035839080810546875, 0.042388916015625, 0.048938751220703125, 0.05548858642578125, 0.062038421630859375, 0.0685882568359375, 0.07513809204101562, 0.08168792724609375, 0.08823776245117188, 0.09478759765625, 0.10133743286132812, 0.10788726806640625, 0.11443710327148438, 0.1209869384765625, 0.12753677368164062, 0.13408660888671875, 0.14063644409179688, 0.147186279296875, 0.15373611450195312, 0.16028594970703125, 0.16683578491210938, 0.1733856201171875, 0.17993545532226562, 0.18648529052734375, 0.19303512573242188, 0.1995849609375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 4.0, 8.0, 6.0, 7.0, 6.0, 15.0, 18.0, 21.0, 19.0, 35.0, 36.0, 47.0, 55.0, 74.0, 89.0, 79.0, 87.0, 69.0, 68.0, 50.0, 47.0, 30.0, 22.0, 26.0, 15.0, 13.0, 13.0, 9.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.091594696044922e-05, -5.8867037296295166e-05, -5.681812763214111e-05, -5.476921796798706e-05, -5.272030830383301e-05, -5.0671398639678955e-05, -4.86224889755249e-05, -4.657357931137085e-05, -4.45246696472168e-05, -4.2475759983062744e-05, -4.042685031890869e-05, -3.837794065475464e-05, -3.6329030990600586e-05, -3.428012132644653e-05, -3.223121166229248e-05, -3.0182301998138428e-05, -2.8133392333984375e-05, -2.6084482669830322e-05, -2.403557300567627e-05, -2.1986663341522217e-05, -1.9937753677368164e-05, -1.788884401321411e-05, -1.583993434906006e-05, -1.3791024684906006e-05, -1.1742115020751953e-05, -9.6932053565979e-06, -7.644295692443848e-06, -5.595386028289795e-06, -3.546476364135742e-06, -1.4975666999816895e-06, 5.513429641723633e-07, 2.600252628326416e-06, 4.649162292480469e-06, 6.6980719566345215e-06, 8.746981620788574e-06, 1.0795891284942627e-05, 1.284480094909668e-05, 1.4893710613250732e-05, 1.6942620277404785e-05, 1.8991529941558838e-05, 2.104043960571289e-05, 2.3089349269866943e-05, 2.5138258934020996e-05, 2.718716859817505e-05, 2.92360782623291e-05, 3.1284987926483154e-05, 3.333389759063721e-05, 3.538280725479126e-05, 3.743171691894531e-05, 3.9480626583099365e-05, 4.152953624725342e-05, 4.357844591140747e-05, 4.5627355575561523e-05, 4.7676265239715576e-05, 4.972517490386963e-05, 5.177408456802368e-05, 5.3822994232177734e-05, 5.587190389633179e-05, 5.792081356048584e-05, 5.996972322463989e-05, 6.201863288879395e-05, 6.4067542552948e-05, 6.611645221710205e-05, 6.81653618812561e-05, 7.021427154541016e-05]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 8.0, 19.0, 24.0, 37.0, 47.0, 74.0, 111.0, 137.0, 241.0, 402.0, 697.0, 1101.0, 1747.0, 3157.0, 5351.0, 9543.0, 17630.0, 33906.0, 70670.0, 165195.0, 357606.0, 208362.0, 85622.0, 39884.0, 20628.0, 11191.0, 6184.0, 3668.0, 2126.0, 1210.0, 701.0, 458.0, 289.0, 182.0, 105.0, 73.0, 50.0, 29.0, 20.0, 18.0, 15.0, 12.0, 2.0, 2.0, 6.0, 1.0, 2.0, 5.0, 1.0, 2.0], "bins": [-0.1651611328125, -0.16039085388183594, -0.15562057495117188, -0.1508502960205078, -0.14608001708984375, -0.1413097381591797, -0.13653945922851562, -0.13176918029785156, -0.1269989013671875, -0.12222862243652344, -0.11745834350585938, -0.11268806457519531, -0.10791778564453125, -0.10314750671386719, -0.09837722778320312, -0.09360694885253906, -0.088836669921875, -0.08406639099121094, -0.07929611206054688, -0.07452583312988281, -0.06975555419921875, -0.06498527526855469, -0.060214996337890625, -0.05544471740722656, -0.0506744384765625, -0.04590415954589844, -0.041133880615234375, -0.03636360168457031, -0.03159332275390625, -0.026823043823242188, -0.022052764892578125, -0.017282485961914062, -0.01251220703125, -0.0077419281005859375, -0.002971649169921875, 0.0017986297607421875, 0.00656890869140625, 0.011339187622070312, 0.016109466552734375, 0.020879745483398438, 0.0256500244140625, 0.030420303344726562, 0.035190582275390625, 0.03996086120605469, 0.04473114013671875, 0.04950141906738281, 0.054271697998046875, 0.05904197692871094, 0.063812255859375, 0.06858253479003906, 0.07335281372070312, 0.07812309265136719, 0.08289337158203125, 0.08766365051269531, 0.09243392944335938, 0.09720420837402344, 0.1019744873046875, 0.10674476623535156, 0.11151504516601562, 0.11628532409667969, 0.12105560302734375, 0.1258258819580078, 0.13059616088867188, 0.13536643981933594, 0.14013671875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 9.0, 7.0, 11.0, 6.0, 22.0, 16.0, 25.0, 21.0, 33.0, 28.0, 38.0, 43.0, 49.0, 69.0, 72.0, 98.0, 75.0, 74.0, 53.0, 47.0, 33.0, 26.0, 21.0, 15.0, 23.0, 15.0, 16.0, 9.0, 8.0, 12.0, 7.0, 2.0, 10.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.060791015625, -0.05914115905761719, -0.057491302490234375, -0.05584144592285156, -0.05419158935546875, -0.05254173278808594, -0.050891876220703125, -0.04924201965332031, -0.0475921630859375, -0.04594230651855469, -0.044292449951171875, -0.04264259338378906, -0.04099273681640625, -0.03934288024902344, -0.037693023681640625, -0.03604316711425781, -0.034393310546875, -0.03274345397949219, -0.031093597412109375, -0.029443740844726562, -0.02779388427734375, -0.026144027709960938, -0.024494171142578125, -0.022844314575195312, -0.0211944580078125, -0.019544601440429688, -0.017894744873046875, -0.016244888305664062, -0.01459503173828125, -0.012945175170898438, -0.011295318603515625, -0.009645462036132812, -0.00799560546875, -0.0063457489013671875, -0.004695892333984375, -0.0030460357666015625, -0.00139617919921875, 0.0002536773681640625, 0.001903533935546875, 0.0035533905029296875, 0.0052032470703125, 0.0068531036376953125, 0.008502960205078125, 0.010152816772460938, 0.01180267333984375, 0.013452529907226562, 0.015102386474609375, 0.016752243041992188, 0.018402099609375, 0.020051956176757812, 0.021701812744140625, 0.023351669311523438, 0.02500152587890625, 0.026651382446289062, 0.028301239013671875, 0.029951095581054688, 0.0316009521484375, 0.03325080871582031, 0.034900665283203125, 0.03655052185058594, 0.03820037841796875, 0.03985023498535156, 0.041500091552734375, 0.04314994812011719, 0.0447998046875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 7.0, 7.0, 8.0, 9.0, 10.0, 13.0, 20.0, 26.0, 26.0, 36.0, 45.0, 52.0, 60.0, 71.0, 58.0, 62.0, 83.0, 57.0, 61.0, 42.0, 34.0, 43.0, 28.0, 26.0, 22.0, 16.0, 23.0, 16.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-26.1502685546875, -25.34549903869629, -24.54073143005371, -23.7359619140625, -22.93119239807129, -22.126422882080078, -21.3216552734375, -20.51688575744629, -19.712116241455078, -18.907346725463867, -18.10257911682129, -17.297809600830078, -16.493040084838867, -15.688271522521973, -14.883502960205078, -14.078733444213867, -13.273965835571289, -12.469197273254395, -11.664427757263184, -10.859659194946289, -10.054889678955078, -9.250121116638184, -8.445352554321289, -7.640583515167236, -6.835814476013184, -6.031045436859131, -5.226276397705078, -4.421507835388184, -3.616738796234131, -2.811969757080078, -2.0072011947631836, -1.2024321556091309, -0.3976631164550781, 0.40710580348968506, 1.2118747234344482, 2.016643524169922, 2.8214125633239746, 3.6261816024780273, 4.430950164794922, 5.235719203948975, 6.040488243103027, 6.84525728225708, 7.650026321411133, 8.454794883728027, 9.259563446044922, 10.064332962036133, 10.869101524353027, 11.673870086669922, 12.478639602661133, 13.283408164978027, 14.088177680969238, 14.892946243286133, 15.697715759277344, 16.502483367919922, 17.307252883911133, 18.112022399902344, 18.916790008544922, 19.721559524536133, 20.52632713317871, 21.331096649169922, 22.135866165161133, 22.940635681152344, 23.745403289794922, 24.550172805786133, 25.354942321777344]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 6.0, 3.0, 7.0, 9.0, 5.0, 8.0, 12.0, 13.0, 16.0, 21.0, 20.0, 23.0, 35.0, 28.0, 28.0, 30.0, 21.0, 33.0, 31.0, 32.0, 27.0, 41.0, 39.0, 33.0, 37.0, 27.0, 39.0, 29.0, 38.0, 37.0, 31.0, 20.0, 27.0, 25.0, 14.0, 31.0, 22.0, 12.0, 16.0, 17.0, 11.0, 13.0, 5.0, 8.0, 4.0, 5.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.314128875732422, -17.724695205688477, -17.1352596282959, -16.545825958251953, -15.956390380859375, -15.36695671081543, -14.777522087097168, -14.188087463378906, -13.598652839660645, -13.009218215942383, -12.419783592224121, -11.83034896850586, -11.240915298461914, -10.651479721069336, -10.06204605102539, -9.472611427307129, -8.883176803588867, -8.293742179870605, -7.704307556152344, -7.11487340927124, -6.5254387855529785, -5.936004161834717, -5.346570014953613, -4.757135391235352, -4.16770076751709, -3.578266143798828, -2.9888317584991455, -2.399397373199463, -1.8099627494812012, -1.2205281257629395, -0.6310937404632568, -0.04165935516357422, 0.5477771759033203, 1.1372116804122925, 1.7266461849212646, 2.3160805702209473, 2.905515193939209, 3.4949498176574707, 4.084383964538574, 4.673818588256836, 5.263253211975098, 5.852687835693359, 6.442122459411621, 7.031556606292725, 7.620991230010986, 8.210426330566406, 8.799860000610352, 9.389294624328613, 9.978729248046875, 10.568163871765137, 11.157598495483398, 11.74703311920166, 12.336467742919922, 12.925901412963867, 13.515336036682129, 14.10477066040039, 14.694205284118652, 15.283639907836914, 15.873074531555176, 16.462509155273438, 17.051942825317383, 17.64137840270996, 18.230812072753906, 18.820247650146484, 19.40968132019043]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 24.0, 23.0, 41.0, 54.0, 145.0, 112.0, 217.0, 313.0, 495.0, 730.0, 1069.0, 1727.0, 2436.0, 3848.0, 5960.0, 8863.0, 13248.0, 20223.0, 29997.0, 45239.0, 66963.0, 97774.0, 136001.0, 160054.0, 139972.0, 102165.0, 70242.0, 47022.0, 31609.0, 20973.0, 13777.0, 9122.0, 6101.0, 4016.0, 2733.0, 1855.0, 1136.0, 775.0, 490.0, 329.0, 231.0, 147.0, 90.0, 77.0, 43.0, 34.0, 23.0, 11.0, 7.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-28.828125, -27.91455078125, -27.0009765625, -26.08740234375, -25.173828125, -24.26025390625, -23.3466796875, -22.43310546875, -21.51953125, -20.60595703125, -19.6923828125, -18.77880859375, -17.865234375, -16.95166015625, -16.0380859375, -15.12451171875, -14.2109375, -13.29736328125, -12.3837890625, -11.47021484375, -10.556640625, -9.64306640625, -8.7294921875, -7.81591796875, -6.90234375, -5.98876953125, -5.0751953125, -4.16162109375, -3.248046875, -2.33447265625, -1.4208984375, -0.50732421875, 0.40625, 1.31982421875, 2.2333984375, 3.14697265625, 4.060546875, 4.97412109375, 5.8876953125, 6.80126953125, 7.71484375, 8.62841796875, 9.5419921875, 10.45556640625, 11.369140625, 12.28271484375, 13.1962890625, 14.10986328125, 15.0234375, 15.93701171875, 16.8505859375, 17.76416015625, 18.677734375, 19.59130859375, 20.5048828125, 21.41845703125, 22.33203125, 23.24560546875, 24.1591796875, 25.07275390625, 25.986328125, 26.89990234375, 27.8134765625, 28.72705078125, 29.640625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 3.0, 8.0, 6.0, 7.0, 10.0, 12.0, 18.0, 21.0, 20.0, 23.0, 27.0, 31.0, 24.0, 28.0, 25.0, 39.0, 29.0, 41.0, 36.0, 33.0, 41.0, 36.0, 39.0, 39.0, 35.0, 31.0, 31.0, 31.0, 26.0, 33.0, 27.0, 21.0, 23.0, 26.0, 22.0, 20.0, 15.0, 11.0, 14.0, 9.0, 6.0, 3.0, 5.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-17.90625, -17.3515625, -16.796875, -16.2421875, -15.6875, -15.1328125, -14.578125, -14.0234375, -13.46875, -12.9140625, -12.359375, -11.8046875, -11.25, -10.6953125, -10.140625, -9.5859375, -9.03125, -8.4765625, -7.921875, -7.3671875, -6.8125, -6.2578125, -5.703125, -5.1484375, -4.59375, -4.0390625, -3.484375, -2.9296875, -2.375, -1.8203125, -1.265625, -0.7109375, -0.15625, 0.3984375, 0.953125, 1.5078125, 2.0625, 2.6171875, 3.171875, 3.7265625, 4.28125, 4.8359375, 5.390625, 5.9453125, 6.5, 7.0546875, 7.609375, 8.1640625, 8.71875, 9.2734375, 9.828125, 10.3828125, 10.9375, 11.4921875, 12.046875, 12.6015625, 13.15625, 13.7109375, 14.265625, 14.8203125, 15.375, 15.9296875, 16.484375, 17.0390625, 17.59375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 13.0, 10.0, 16.0, 25.0, 48.0, 64.0, 106.0, 141.0, 200.0, 334.0, 531.0, 762.0, 1227.0, 1828.0, 3001.0, 4411.0, 7040.0, 11027.0, 17865.0, 28585.0, 46237.0, 73148.0, 114325.0, 162446.0, 180063.0, 141195.0, 94269.0, 59636.0, 37194.0, 22923.0, 14577.0, 9072.0, 5729.0, 3801.0, 2319.0, 1520.0, 977.0, 631.0, 428.0, 270.0, 182.0, 135.0, 82.0, 58.0, 38.0, 21.0, 16.0, 13.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-32.9375, -31.9169921875, -30.896484375, -29.8759765625, -28.85546875, -27.8349609375, -26.814453125, -25.7939453125, -24.7734375, -23.7529296875, -22.732421875, -21.7119140625, -20.69140625, -19.6708984375, -18.650390625, -17.6298828125, -16.609375, -15.5888671875, -14.568359375, -13.5478515625, -12.52734375, -11.5068359375, -10.486328125, -9.4658203125, -8.4453125, -7.4248046875, -6.404296875, -5.3837890625, -4.36328125, -3.3427734375, -2.322265625, -1.3017578125, -0.28125, 0.7392578125, 1.759765625, 2.7802734375, 3.80078125, 4.8212890625, 5.841796875, 6.8623046875, 7.8828125, 8.9033203125, 9.923828125, 10.9443359375, 11.96484375, 12.9853515625, 14.005859375, 15.0263671875, 16.046875, 17.0673828125, 18.087890625, 19.1083984375, 20.12890625, 21.1494140625, 22.169921875, 23.1904296875, 24.2109375, 25.2314453125, 26.251953125, 27.2724609375, 28.29296875, 29.3134765625, 30.333984375, 31.3544921875, 32.375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 5.0, 7.0, 18.0, 13.0, 17.0, 24.0, 23.0, 17.0, 20.0, 28.0, 34.0, 31.0, 47.0, 30.0, 43.0, 34.0, 51.0, 47.0, 42.0, 53.0, 40.0, 34.0, 42.0, 39.0, 26.0, 24.0, 38.0, 29.0, 20.0, 27.0, 13.0, 17.0, 21.0, 10.0, 6.0, 3.0, 3.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.2283935546875, -11.823974609375, -11.4195556640625, -11.01513671875, -10.6107177734375, -10.206298828125, -9.8018798828125, -9.3974609375, -8.9930419921875, -8.588623046875, -8.1842041015625, -7.77978515625, -7.3753662109375, -6.970947265625, -6.5665283203125, -6.162109375, -5.7576904296875, -5.353271484375, -4.9488525390625, -4.54443359375, -4.1400146484375, -3.735595703125, -3.3311767578125, -2.9267578125, -2.5223388671875, -2.117919921875, -1.7135009765625, -1.30908203125, -0.9046630859375, -0.500244140625, -0.0958251953125, 0.30859375, 0.7130126953125, 1.117431640625, 1.5218505859375, 1.92626953125, 2.3306884765625, 2.735107421875, 3.1395263671875, 3.5439453125, 3.9483642578125, 4.352783203125, 4.7572021484375, 5.16162109375, 5.5660400390625, 5.970458984375, 6.3748779296875, 6.779296875, 7.1837158203125, 7.588134765625, 7.9925537109375, 8.39697265625, 8.8013916015625, 9.205810546875, 9.6102294921875, 10.0146484375, 10.4190673828125, 10.823486328125, 11.2279052734375, 11.63232421875, 12.0367431640625, 12.441162109375, 12.8455810546875, 13.25]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 5.0, 9.0, 14.0, 21.0, 24.0, 40.0, 47.0, 84.0, 98.0, 142.0, 213.0, 305.0, 416.0, 615.0, 953.0, 1523.0, 2309.0, 3445.0, 5893.0, 10027.0, 18059.0, 39011.0, 136160.0, 555289.0, 179443.0, 45804.0, 20256.0, 10839.0, 6462.0, 3826.0, 2393.0, 1616.0, 986.0, 702.0, 464.0, 310.0, 214.0, 154.0, 110.0, 87.0, 57.0, 40.0, 25.0, 20.0, 17.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.171875, -7.9046630859375, -7.637451171875, -7.3702392578125, -7.10302734375, -6.8358154296875, -6.568603515625, -6.3013916015625, -6.0341796875, -5.7669677734375, -5.499755859375, -5.2325439453125, -4.96533203125, -4.6981201171875, -4.430908203125, -4.1636962890625, -3.896484375, -3.6292724609375, -3.362060546875, -3.0948486328125, -2.82763671875, -2.5604248046875, -2.293212890625, -2.0260009765625, -1.7587890625, -1.4915771484375, -1.224365234375, -0.9571533203125, -0.68994140625, -0.4227294921875, -0.155517578125, 0.1116943359375, 0.37890625, 0.6461181640625, 0.913330078125, 1.1805419921875, 1.44775390625, 1.7149658203125, 1.982177734375, 2.2493896484375, 2.5166015625, 2.7838134765625, 3.051025390625, 3.3182373046875, 3.58544921875, 3.8526611328125, 4.119873046875, 4.3870849609375, 4.654296875, 4.9215087890625, 5.188720703125, 5.4559326171875, 5.72314453125, 5.9903564453125, 6.257568359375, 6.5247802734375, 6.7919921875, 7.0592041015625, 7.326416015625, 7.5936279296875, 7.86083984375, 8.1280517578125, 8.395263671875, 8.6624755859375, 8.9296875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 9.0, 16.0, 17.0, 24.0, 32.0, 81.0, 117.0, 160.0, 179.0, 139.0, 77.0, 59.0, 27.0, 17.0, 21.0, 10.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008459091186523438, -0.000820353627204895, -0.0007947981357574463, -0.0007692426443099976, -0.0007436871528625488, -0.0007181316614151001, -0.0006925761699676514, -0.0006670206785202026, -0.0006414651870727539, -0.0006159096956253052, -0.0005903542041778564, -0.0005647987127304077, -0.000539243221282959, -0.0005136877298355103, -0.0004881322383880615, -0.0004625767469406128, -0.00043702125549316406, -0.00041146576404571533, -0.0003859102725982666, -0.00036035478115081787, -0.00033479928970336914, -0.0003092437982559204, -0.0002836883068084717, -0.00025813281536102295, -0.00023257732391357422, -0.0002070218324661255, -0.00018146634101867676, -0.00015591084957122803, -0.0001303553581237793, -0.00010479986667633057, -7.924437522888184e-05, -5.3688883781433105e-05, -2.8133392333984375e-05, -2.5779008865356445e-06, 2.2977590560913086e-05, 4.8533082008361816e-05, 7.408857345581055e-05, 9.964406490325928e-05, 0.000125199556350708, 0.00015075504779815674, 0.00017631053924560547, 0.0002018660306930542, 0.00022742152214050293, 0.00025297701358795166, 0.0002785325050354004, 0.0003040879964828491, 0.00032964348793029785, 0.0003551989793777466, 0.0003807544708251953, 0.00040630996227264404, 0.0004318654537200928, 0.0004574209451675415, 0.00048297643661499023, 0.000508531928062439, 0.0005340874195098877, 0.0005596429109573364, 0.0005851984024047852, 0.0006107538938522339, 0.0006363093852996826, 0.0006618648767471313, 0.0006874203681945801, 0.0007129758596420288, 0.0007385313510894775, 0.0007640868425369263, 0.000789642333984375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 7.0, 7.0, 8.0, 18.0, 15.0, 26.0, 40.0, 59.0, 77.0, 121.0, 196.0, 252.0, 389.0, 521.0, 786.0, 1128.0, 1814.0, 2836.0, 4179.0, 6686.0, 10865.0, 18988.0, 39150.0, 116137.0, 493489.0, 228090.0, 60033.0, 25546.0, 13830.0, 8324.0, 5042.0, 3295.0, 2190.0, 1435.0, 959.0, 617.0, 467.0, 290.0, 180.0, 131.0, 104.0, 74.0, 46.0, 42.0, 26.0, 13.0, 9.0, 11.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51953125, -6.28436279296875, -6.0491943359375, -5.81402587890625, -5.578857421875, -5.34368896484375, -5.1085205078125, -4.87335205078125, -4.63818359375, -4.40301513671875, -4.1678466796875, -3.93267822265625, -3.697509765625, -3.46234130859375, -3.2271728515625, -2.99200439453125, -2.7568359375, -2.52166748046875, -2.2864990234375, -2.05133056640625, -1.816162109375, -1.58099365234375, -1.3458251953125, -1.11065673828125, -0.87548828125, -0.64031982421875, -0.4051513671875, -0.16998291015625, 0.065185546875, 0.30035400390625, 0.5355224609375, 0.77069091796875, 1.005859375, 1.24102783203125, 1.4761962890625, 1.71136474609375, 1.946533203125, 2.18170166015625, 2.4168701171875, 2.65203857421875, 2.88720703125, 3.12237548828125, 3.3575439453125, 3.59271240234375, 3.827880859375, 4.06304931640625, 4.2982177734375, 4.53338623046875, 4.7685546875, 5.00372314453125, 5.2388916015625, 5.47406005859375, 5.709228515625, 5.94439697265625, 6.1795654296875, 6.41473388671875, 6.64990234375, 6.88507080078125, 7.1202392578125, 7.35540771484375, 7.590576171875, 7.82574462890625, 8.0609130859375, 8.29608154296875, 8.53125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 1.0, 4.0, 6.0, 6.0, 8.0, 7.0, 12.0, 8.0, 12.0, 11.0, 10.0, 16.0, 21.0, 13.0, 48.0, 77.0, 95.0, 149.0, 158.0, 110.0, 68.0, 33.0, 23.0, 9.0, 21.0, 5.0, 10.0, 12.0, 12.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0546875, -1.983551025390625, -1.91241455078125, -1.841278076171875, -1.7701416015625, -1.699005126953125, -1.62786865234375, -1.556732177734375, -1.485595703125, -1.414459228515625, -1.34332275390625, -1.272186279296875, -1.2010498046875, -1.129913330078125, -1.05877685546875, -0.987640380859375, -0.91650390625, -0.845367431640625, -0.77423095703125, -0.703094482421875, -0.6319580078125, -0.560821533203125, -0.48968505859375, -0.418548583984375, -0.347412109375, -0.276275634765625, -0.20513916015625, -0.134002685546875, -0.0628662109375, 0.008270263671875, 0.07940673828125, 0.150543212890625, 0.2216796875, 0.292816162109375, 0.36395263671875, 0.435089111328125, 0.5062255859375, 0.577362060546875, 0.64849853515625, 0.719635009765625, 0.790771484375, 0.861907958984375, 0.93304443359375, 1.004180908203125, 1.0753173828125, 1.146453857421875, 1.21759033203125, 1.288726806640625, 1.35986328125, 1.430999755859375, 1.50213623046875, 1.573272705078125, 1.6444091796875, 1.715545654296875, 1.78668212890625, 1.857818603515625, 1.928955078125, 2.000091552734375, 2.07122802734375, 2.142364501953125, 2.2135009765625, 2.284637451171875, 2.35577392578125, 2.426910400390625, 2.498046875]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 7.0, 6.0, 11.0, 6.0, 8.0, 18.0, 16.0, 22.0, 30.0, 38.0, 44.0, 45.0, 57.0, 61.0, 75.0, 75.0, 62.0, 60.0, 57.0, 49.0, 34.0, 46.0, 39.0, 32.0, 17.0, 9.0, 15.0, 6.0, 10.0, 6.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.161348342895508, -20.400991439819336, -19.640636444091797, -18.880279541015625, -18.119924545288086, -17.359567642211914, -16.599212646484375, -15.838855743408203, -15.078500747680664, -14.318144798278809, -13.557788848876953, -12.797432899475098, -12.037076950073242, -11.276721000671387, -10.516365051269531, -9.75600814819336, -8.995652198791504, -8.235296249389648, -7.474940299987793, -6.7145843505859375, -5.954228401184082, -5.193872451782227, -4.433516025543213, -3.6731600761413574, -2.912804126739502, -2.1524481773376465, -1.3920921087265015, -0.6317360401153564, 0.12861990928649902, 0.8889758586883545, 1.649332046508789, 2.4096879959106445, 3.1700439453125, 3.9303998947143555, 4.690755844116211, 5.451111793518066, 6.211467742919922, 6.971823692321777, 7.732180118560791, 8.492536544799805, 9.252891540527344, 10.0132474899292, 10.773603439331055, 11.53395938873291, 12.294315338134766, 13.054671287536621, 13.815027236938477, 14.575384140014648, 15.335740089416504, 16.09609603881836, 16.85645294189453, 17.61680793762207, 18.377164840698242, 19.13751983642578, 19.897876739501953, 20.658231735229492, 21.418588638305664, 22.178945541381836, 22.939300537109375, 23.699657440185547, 24.460012435913086, 25.220369338989258, 25.980724334716797, 26.74108123779297, 27.501436233520508]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 7.0, 9.0, 16.0, 6.0, 18.0, 13.0, 18.0, 14.0, 18.0, 24.0, 25.0, 20.0, 25.0, 25.0, 29.0, 41.0, 40.0, 51.0, 37.0, 37.0, 41.0, 32.0, 42.0, 32.0, 27.0, 30.0, 24.0, 32.0, 24.0, 39.0, 28.0, 26.0, 28.0, 21.0, 24.0, 11.0, 18.0, 9.0, 12.0, 2.0, 7.0, 8.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.428661346435547, -19.841289520263672, -19.253915786743164, -18.666542053222656, -18.07917022705078, -17.491798400878906, -16.9044246673584, -16.31705093383789, -15.729679107666016, -15.142306327819824, -14.554933547973633, -13.967560768127441, -13.38018798828125, -12.792815208435059, -12.205442428588867, -11.618069648742676, -11.030696868896484, -10.443324089050293, -9.855951309204102, -9.26857852935791, -8.681205749511719, -8.093832969665527, -7.506460189819336, -6.9190874099731445, -6.331714630126953, -5.744341850280762, -5.15696907043457, -4.569596290588379, -3.9822235107421875, -3.394850730895996, -2.8074779510498047, -2.2201051712036133, -1.632730484008789, -1.0453577041625977, -0.45798492431640625, 0.12938785552978516, 0.7167606353759766, 1.304133415222168, 1.8915061950683594, 2.478878974914551, 3.066251754760742, 3.6536245346069336, 4.240997314453125, 4.828370094299316, 5.415742874145508, 6.003115653991699, 6.590488433837891, 7.177861213684082, 7.765233993530273, 8.352606773376465, 8.939979553222656, 9.527352333068848, 10.114725112915039, 10.70209789276123, 11.289470672607422, 11.876843452453613, 12.464216232299805, 13.051589012145996, 13.638961791992188, 14.226334571838379, 14.81370735168457, 15.401080131530762, 15.988452911376953, 16.575824737548828, 17.163198471069336]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 15.0, 30.0, 34.0, 70.0, 79.0, 126.0, 176.0, 264.0, 380.0, 559.0, 792.0, 1189.0, 1658.0, 2309.0, 3547.0, 5025.0, 7382.0, 10679.0, 15960.0, 23720.0, 36001.0, 55228.0, 87366.0, 144382.0, 277896.0, 637630.0, 1087986.0, 870882.0, 402452.0, 195227.0, 112885.0, 71748.0, 46970.0, 31162.0, 20758.0, 13603.0, 9016.0, 6289.0, 4237.0, 2797.0, 1941.0, 1291.0, 874.0, 523.0, 419.0, 233.0, 164.0, 109.0, 76.0, 57.0, 40.0, 19.0, 13.0, 7.0, 5.0, 8.0, 4.0, 1.0], "bins": [-22.28125, -21.6005859375, -20.919921875, -20.2392578125, -19.55859375, -18.8779296875, -18.197265625, -17.5166015625, -16.8359375, -16.1552734375, -15.474609375, -14.7939453125, -14.11328125, -13.4326171875, -12.751953125, -12.0712890625, -11.390625, -10.7099609375, -10.029296875, -9.3486328125, -8.66796875, -7.9873046875, -7.306640625, -6.6259765625, -5.9453125, -5.2646484375, -4.583984375, -3.9033203125, -3.22265625, -2.5419921875, -1.861328125, -1.1806640625, -0.5, 0.1806640625, 0.861328125, 1.5419921875, 2.22265625, 2.9033203125, 3.583984375, 4.2646484375, 4.9453125, 5.6259765625, 6.306640625, 6.9873046875, 7.66796875, 8.3486328125, 9.029296875, 9.7099609375, 10.390625, 11.0712890625, 11.751953125, 12.4326171875, 13.11328125, 13.7939453125, 14.474609375, 15.1552734375, 15.8359375, 16.5166015625, 17.197265625, 17.8779296875, 18.55859375, 19.2392578125, 19.919921875, 20.6005859375, 21.28125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 7.0, 7.0, 11.0, 10.0, 10.0, 13.0, 18.0, 19.0, 13.0, 26.0, 22.0, 21.0, 34.0, 23.0, 35.0, 35.0, 48.0, 40.0, 43.0, 40.0, 45.0, 41.0, 53.0, 33.0, 32.0, 24.0, 32.0, 33.0, 27.0, 34.0, 22.0, 25.0, 21.0, 15.0, 22.0, 16.0, 10.0, 4.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.53125, -16.0479736328125, -15.564697265625, -15.0814208984375, -14.59814453125, -14.1148681640625, -13.631591796875, -13.1483154296875, -12.6650390625, -12.1817626953125, -11.698486328125, -11.2152099609375, -10.73193359375, -10.2486572265625, -9.765380859375, -9.2821044921875, -8.798828125, -8.3155517578125, -7.832275390625, -7.3489990234375, -6.86572265625, -6.3824462890625, -5.899169921875, -5.4158935546875, -4.9326171875, -4.4493408203125, -3.966064453125, -3.4827880859375, -2.99951171875, -2.5162353515625, -2.032958984375, -1.5496826171875, -1.06640625, -0.5831298828125, -0.099853515625, 0.3834228515625, 0.86669921875, 1.3499755859375, 1.833251953125, 2.3165283203125, 2.7998046875, 3.2830810546875, 3.766357421875, 4.2496337890625, 4.73291015625, 5.2161865234375, 5.699462890625, 6.1827392578125, 6.666015625, 7.1492919921875, 7.632568359375, 8.1158447265625, 8.59912109375, 9.0823974609375, 9.565673828125, 10.0489501953125, 10.5322265625, 11.0155029296875, 11.498779296875, 11.9820556640625, 12.46533203125, 12.9486083984375, 13.431884765625, 13.9151611328125, 14.3984375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 10.0, 13.0, 19.0, 47.0, 72.0, 91.0, 149.0, 203.0, 347.0, 574.0, 834.0, 1290.0, 2038.0, 3170.0, 5372.0, 8463.0, 13716.0, 23416.0, 40175.0, 70132.0, 126336.0, 235821.0, 457416.0, 910183.0, 1084936.0, 565080.0, 289321.0, 152335.0, 84329.0, 47699.0, 27965.0, 16332.0, 9986.0, 6081.0, 3700.0, 2453.0, 1453.0, 955.0, 632.0, 362.0, 267.0, 169.0, 111.0, 59.0, 46.0, 35.0, 27.0, 19.0, 8.0, 10.0, 12.0, 3.0, 3.0, 6.0], "bins": [-25.859375, -25.102294921875, -24.34521484375, -23.588134765625, -22.8310546875, -22.073974609375, -21.31689453125, -20.559814453125, -19.802734375, -19.045654296875, -18.28857421875, -17.531494140625, -16.7744140625, -16.017333984375, -15.26025390625, -14.503173828125, -13.74609375, -12.989013671875, -12.23193359375, -11.474853515625, -10.7177734375, -9.960693359375, -9.20361328125, -8.446533203125, -7.689453125, -6.932373046875, -6.17529296875, -5.418212890625, -4.6611328125, -3.904052734375, -3.14697265625, -2.389892578125, -1.6328125, -0.875732421875, -0.11865234375, 0.638427734375, 1.3955078125, 2.152587890625, 2.90966796875, 3.666748046875, 4.423828125, 5.180908203125, 5.93798828125, 6.695068359375, 7.4521484375, 8.209228515625, 8.96630859375, 9.723388671875, 10.48046875, 11.237548828125, 11.99462890625, 12.751708984375, 13.5087890625, 14.265869140625, 15.02294921875, 15.780029296875, 16.537109375, 17.294189453125, 18.05126953125, 18.808349609375, 19.5654296875, 20.322509765625, 21.07958984375, 21.836669921875, 22.59375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 7.0, 9.0, 16.0, 20.0, 23.0, 28.0, 40.0, 43.0, 64.0, 66.0, 81.0, 107.0, 133.0, 169.0, 183.0, 228.0, 255.0, 287.0, 302.0, 281.0, 278.0, 235.0, 206.0, 176.0, 149.0, 142.0, 94.0, 84.0, 69.0, 57.0, 47.0, 49.0, 44.0, 16.0, 16.0, 13.0, 12.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.15625, -8.8775634765625, -8.598876953125, -8.3201904296875, -8.04150390625, -7.7628173828125, -7.484130859375, -7.2054443359375, -6.9267578125, -6.6480712890625, -6.369384765625, -6.0906982421875, -5.81201171875, -5.5333251953125, -5.254638671875, -4.9759521484375, -4.697265625, -4.4185791015625, -4.139892578125, -3.8612060546875, -3.58251953125, -3.3038330078125, -3.025146484375, -2.7464599609375, -2.4677734375, -2.1890869140625, -1.910400390625, -1.6317138671875, -1.35302734375, -1.0743408203125, -0.795654296875, -0.5169677734375, -0.23828125, 0.0404052734375, 0.319091796875, 0.5977783203125, 0.87646484375, 1.1551513671875, 1.433837890625, 1.7125244140625, 1.9912109375, 2.2698974609375, 2.548583984375, 2.8272705078125, 3.10595703125, 3.3846435546875, 3.663330078125, 3.9420166015625, 4.220703125, 4.4993896484375, 4.778076171875, 5.0567626953125, 5.33544921875, 5.6141357421875, 5.892822265625, 6.1715087890625, 6.4501953125, 6.7288818359375, 7.007568359375, 7.2862548828125, 7.56494140625, 7.8436279296875, 8.122314453125, 8.4010009765625, 8.6796875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 2.0, 10.0, 7.0, 8.0, 11.0, 12.0, 17.0, 23.0, 23.0, 31.0, 35.0, 33.0, 66.0, 59.0, 64.0, 69.0, 69.0, 58.0, 68.0, 56.0, 48.0, 46.0, 26.0, 34.0, 13.0, 23.0, 21.0, 17.0, 8.0, 13.0, 5.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.35442352294922, -22.692520141601562, -22.03061866760254, -21.368715286254883, -20.70681381225586, -20.044910430908203, -19.383007049560547, -18.72110366821289, -18.059202194213867, -17.39729881286621, -16.735397338867188, -16.07349395751953, -15.411591529846191, -14.749689102172852, -14.087785720825195, -13.425883293151855, -12.763980865478516, -12.102078437805176, -11.440176010131836, -10.77827262878418, -10.11637020111084, -9.4544677734375, -8.792564392089844, -8.130661964416504, -7.468759536743164, -6.806857109069824, -6.144954204559326, -5.483051300048828, -4.821148872375488, -4.159246444702148, -3.4973435401916504, -2.8354406356811523, -2.1735363006591797, -1.5116336345672607, -0.8497309684753418, -0.18782830238342285, 0.4740743637084961, 1.135977029800415, 1.797879695892334, 2.459782600402832, 3.121685028076172, 3.783587694168091, 4.44549036026001, 5.107393264770508, 5.769295692443848, 6.4311981201171875, 7.0931010246276855, 7.755003929138184, 8.416906356811523, 9.078808784484863, 9.740711212158203, 10.40261459350586, 11.0645170211792, 11.726419448852539, 12.388322830200195, 13.050225257873535, 13.712127685546875, 14.374030113220215, 15.035932540893555, 15.697835922241211, 16.359737396240234, 17.02164077758789, 17.683544158935547, 18.345447540283203, 19.007349014282227]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 7.0, 5.0, 9.0, 7.0, 11.0, 13.0, 25.0, 12.0, 10.0, 14.0, 23.0, 12.0, 26.0, 21.0, 22.0, 16.0, 30.0, 33.0, 35.0, 38.0, 41.0, 29.0, 38.0, 44.0, 36.0, 37.0, 33.0, 23.0, 36.0, 36.0, 23.0, 35.0, 27.0, 17.0, 25.0, 17.0, 23.0, 18.0, 12.0, 12.0, 8.0, 9.0, 13.0, 3.0, 9.0, 6.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-15.310504913330078, -14.85014533996582, -14.389786720275879, -13.929427146911621, -13.469067573547363, -13.008708953857422, -12.548349380493164, -12.087989807128906, -11.627630233764648, -11.16727066040039, -10.70691204071045, -10.246552467346191, -9.786192893981934, -9.325834274291992, -8.865474700927734, -8.405115127563477, -7.944756507873535, -7.4843974113464355, -7.024037837982178, -6.563678741455078, -6.10331916809082, -5.642960071563721, -5.182600975036621, -4.722241401672363, -4.261882305145264, -3.801522970199585, -3.3411636352539062, -2.8808045387268066, -2.420445203781128, -1.9600858688354492, -1.4997267723083496, -1.039367437362671, -0.5790081024169922, -0.11864882707595825, 0.3417104482650757, 0.8020696640014648, 1.2624289989471436, 1.7227883338928223, 2.183147430419922, 2.6435067653656006, 3.1038661003112793, 3.564225435256958, 4.024584770202637, 4.484943866729736, 4.945302963256836, 5.405662536621094, 5.866021633148193, 6.326380729675293, 6.786740303039551, 7.24709939956665, 7.707458972930908, 8.167818069458008, 8.628177642822266, 9.088537216186523, 9.548895835876465, 10.009255409240723, 10.469614028930664, 10.929973602294922, 11.390332221984863, 11.850691795349121, 12.311051368713379, 12.77140998840332, 13.231769561767578, 13.692129135131836, 14.152488708496094]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 15.0, 24.0, 26.0, 37.0, 54.0, 77.0, 102.0, 171.0, 224.0, 320.0, 482.0, 691.0, 1002.0, 1452.0, 2120.0, 3156.0, 4674.0, 6751.0, 10143.0, 14809.0, 22478.0, 32725.0, 48325.0, 70894.0, 102980.0, 158332.0, 187237.0, 121947.0, 82093.0, 55958.0, 38588.0, 26105.0, 17574.0, 11929.0, 7961.0, 5446.0, 3675.0, 2562.0, 1615.0, 1145.0, 836.0, 537.0, 426.0, 252.0, 213.0, 145.0, 86.0, 64.0, 34.0, 25.0, 19.0, 13.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.95703125, -6.73406982421875, -6.5111083984375, -6.28814697265625, -6.065185546875, -5.84222412109375, -5.6192626953125, -5.39630126953125, -5.17333984375, -4.95037841796875, -4.7274169921875, -4.50445556640625, -4.281494140625, -4.05853271484375, -3.8355712890625, -3.61260986328125, -3.3896484375, -3.16668701171875, -2.9437255859375, -2.72076416015625, -2.497802734375, -2.27484130859375, -2.0518798828125, -1.82891845703125, -1.60595703125, -1.38299560546875, -1.1600341796875, -0.93707275390625, -0.714111328125, -0.49114990234375, -0.2681884765625, -0.04522705078125, 0.177734375, 0.40069580078125, 0.6236572265625, 0.84661865234375, 1.069580078125, 1.29254150390625, 1.5155029296875, 1.73846435546875, 1.96142578125, 2.18438720703125, 2.4073486328125, 2.63031005859375, 2.853271484375, 3.07623291015625, 3.2991943359375, 3.52215576171875, 3.7451171875, 3.96807861328125, 4.1910400390625, 4.41400146484375, 4.636962890625, 4.85992431640625, 5.0828857421875, 5.30584716796875, 5.52880859375, 5.75177001953125, 5.9747314453125, 6.19769287109375, 6.420654296875, 6.64361572265625, 6.8665771484375, 7.08953857421875, 7.3125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 7.0, 5.0, 3.0, 9.0, 13.0, 6.0, 16.0, 14.0, 17.0, 20.0, 15.0, 18.0, 21.0, 23.0, 17.0, 24.0, 29.0, 30.0, 36.0, 42.0, 33.0, 34.0, 51.0, 32.0, 40.0, 41.0, 20.0, 25.0, 25.0, 37.0, 29.0, 35.0, 34.0, 29.0, 29.0, 22.0, 14.0, 14.0, 16.0, 15.0, 9.0, 12.0, 10.0, 7.0, 3.0, 6.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.6171875, -15.12744140625, -14.6376953125, -14.14794921875, -13.658203125, -13.16845703125, -12.6787109375, -12.18896484375, -11.69921875, -11.20947265625, -10.7197265625, -10.22998046875, -9.740234375, -9.25048828125, -8.7607421875, -8.27099609375, -7.78125, -7.29150390625, -6.8017578125, -6.31201171875, -5.822265625, -5.33251953125, -4.8427734375, -4.35302734375, -3.86328125, -3.37353515625, -2.8837890625, -2.39404296875, -1.904296875, -1.41455078125, -0.9248046875, -0.43505859375, 0.0546875, 0.54443359375, 1.0341796875, 1.52392578125, 2.013671875, 2.50341796875, 2.9931640625, 3.48291015625, 3.97265625, 4.46240234375, 4.9521484375, 5.44189453125, 5.931640625, 6.42138671875, 6.9111328125, 7.40087890625, 7.890625, 8.38037109375, 8.8701171875, 9.35986328125, 9.849609375, 10.33935546875, 10.8291015625, 11.31884765625, 11.80859375, 12.29833984375, 12.7880859375, 13.27783203125, 13.767578125, 14.25732421875, 14.7470703125, 15.23681640625, 15.7265625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 13.0, 19.0, 27.0, 34.0, 68.0, 87.0, 130.0, 211.0, 317.0, 499.0, 827.0, 1291.0, 2109.0, 3527.0, 5912.0, 10157.0, 18194.0, 33113.0, 63624.0, 126991.0, 280967.0, 253459.0, 116662.0, 59021.0, 30954.0, 16692.0, 9607.0, 5479.0, 3208.0, 1988.0, 1193.0, 710.0, 492.0, 349.0, 220.0, 141.0, 82.0, 60.0, 31.0, 20.0, 26.0, 5.0, 6.0, 6.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.2734375, -9.9302978515625, -9.587158203125, -9.2440185546875, -8.90087890625, -8.5577392578125, -8.214599609375, -7.8714599609375, -7.5283203125, -7.1851806640625, -6.842041015625, -6.4989013671875, -6.15576171875, -5.8126220703125, -5.469482421875, -5.1263427734375, -4.783203125, -4.4400634765625, -4.096923828125, -3.7537841796875, -3.41064453125, -3.0675048828125, -2.724365234375, -2.3812255859375, -2.0380859375, -1.6949462890625, -1.351806640625, -1.0086669921875, -0.66552734375, -0.3223876953125, 0.020751953125, 0.3638916015625, 0.70703125, 1.0501708984375, 1.393310546875, 1.7364501953125, 2.07958984375, 2.4227294921875, 2.765869140625, 3.1090087890625, 3.4521484375, 3.7952880859375, 4.138427734375, 4.4815673828125, 4.82470703125, 5.1678466796875, 5.510986328125, 5.8541259765625, 6.197265625, 6.5404052734375, 6.883544921875, 7.2266845703125, 7.56982421875, 7.9129638671875, 8.256103515625, 8.5992431640625, 8.9423828125, 9.2855224609375, 9.628662109375, 9.9718017578125, 10.31494140625, 10.6580810546875, 11.001220703125, 11.3443603515625, 11.6875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 8.0, 7.0, 3.0, 7.0, 8.0, 10.0, 15.0, 16.0, 20.0, 22.0, 22.0, 25.0, 31.0, 32.0, 26.0, 28.0, 39.0, 31.0, 27.0, 24.0, 39.0, 34.0, 49.0, 40.0, 38.0, 39.0, 39.0, 31.0, 29.0, 29.0, 25.0, 31.0, 28.0, 13.0, 24.0, 18.0, 15.0, 11.0, 7.0, 10.0, 11.0, 3.0, 6.0, 6.0, 8.0, 6.0, 1.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.640625, -9.3326416015625, -9.024658203125, -8.7166748046875, -8.40869140625, -8.1007080078125, -7.792724609375, -7.4847412109375, -7.1767578125, -6.8687744140625, -6.560791015625, -6.2528076171875, -5.94482421875, -5.6368408203125, -5.328857421875, -5.0208740234375, -4.712890625, -4.4049072265625, -4.096923828125, -3.7889404296875, -3.48095703125, -3.1729736328125, -2.864990234375, -2.5570068359375, -2.2490234375, -1.9410400390625, -1.633056640625, -1.3250732421875, -1.01708984375, -0.7091064453125, -0.401123046875, -0.0931396484375, 0.21484375, 0.5228271484375, 0.830810546875, 1.1387939453125, 1.44677734375, 1.7547607421875, 2.062744140625, 2.3707275390625, 2.6787109375, 2.9866943359375, 3.294677734375, 3.6026611328125, 3.91064453125, 4.2186279296875, 4.526611328125, 4.8345947265625, 5.142578125, 5.4505615234375, 5.758544921875, 6.0665283203125, 6.37451171875, 6.6824951171875, 6.990478515625, 7.2984619140625, 7.6064453125, 7.9144287109375, 8.222412109375, 8.5303955078125, 8.83837890625, 9.1463623046875, 9.454345703125, 9.7623291015625, 10.0703125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 10.0, 25.0, 43.0, 65.0, 116.0, 202.0, 309.0, 583.0, 1154.0, 2222.0, 4619.0, 10367.0, 25869.0, 74136.0, 271068.0, 468406.0, 122252.0, 39434.0, 14943.0, 6532.0, 3007.0, 1407.0, 766.0, 409.0, 235.0, 130.0, 69.0, 46.0, 38.0, 27.0, 19.0, 8.0, 3.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.14462661743164062, -0.13983917236328125, -0.13505172729492188, -0.1302642822265625, -0.12547683715820312, -0.12068939208984375, -0.11590194702148438, -0.111114501953125, -0.10632705688476562, -0.10153961181640625, -0.09675216674804688, -0.0919647216796875, -0.08717727661132812, -0.08238983154296875, -0.07760238647460938, -0.07281494140625, -0.06802749633789062, -0.06324005126953125, -0.058452606201171875, -0.0536651611328125, -0.048877716064453125, -0.04409027099609375, -0.039302825927734375, -0.034515380859375, -0.029727935791015625, -0.02494049072265625, -0.020153045654296875, -0.0153656005859375, -0.010578155517578125, -0.00579071044921875, -0.001003265380859375, 0.0037841796875, 0.008571624755859375, 0.01335906982421875, 0.018146514892578125, 0.0229339599609375, 0.027721405029296875, 0.03250885009765625, 0.037296295166015625, 0.042083740234375, 0.046871185302734375, 0.05165863037109375, 0.056446075439453125, 0.0612335205078125, 0.06602096557617188, 0.07080841064453125, 0.07559585571289062, 0.08038330078125, 0.08517074584960938, 0.08995819091796875, 0.09474563598632812, 0.0995330810546875, 0.10432052612304688, 0.10910797119140625, 0.11389541625976562, 0.118682861328125, 0.12347030639648438, 0.12825775146484375, 0.13304519653320312, 0.1378326416015625, 0.14262008666992188, 0.14740753173828125, 0.15219497680664062, 0.156982421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 7.0, 9.0, 19.0, 28.0, 38.0, 34.0, 42.0, 74.0, 85.0, 99.0, 95.0, 94.0, 74.0, 58.0, 49.0, 37.0, 39.0, 21.0, 15.0, 18.0, 18.0, 5.0, 4.0, 5.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.547834396362305e-05, -4.4045038521289825e-05, -4.2611733078956604e-05, -4.117842763662338e-05, -3.974512219429016e-05, -3.831181675195694e-05, -3.687851130962372e-05, -3.54452058672905e-05, -3.4011900424957275e-05, -3.2578594982624054e-05, -3.114528954029083e-05, -2.971198409795761e-05, -2.827867865562439e-05, -2.6845373213291168e-05, -2.5412067770957947e-05, -2.3978762328624725e-05, -2.2545456886291504e-05, -2.1112151443958282e-05, -1.967884600162506e-05, -1.824554055929184e-05, -1.6812235116958618e-05, -1.5378929674625397e-05, -1.3945624232292175e-05, -1.2512318789958954e-05, -1.1079013347625732e-05, -9.645707905292511e-06, -8.21240246295929e-06, -6.779097020626068e-06, -5.345791578292847e-06, -3.912486135959625e-06, -2.479180693626404e-06, -1.0458752512931824e-06, 3.8743019104003906e-07, 1.8207356333732605e-06, 3.254041075706482e-06, 4.687346518039703e-06, 6.120651960372925e-06, 7.553957402706146e-06, 8.987262845039368e-06, 1.0420568287372589e-05, 1.185387372970581e-05, 1.3287179172039032e-05, 1.4720484614372253e-05, 1.6153790056705475e-05, 1.7587095499038696e-05, 1.9020400941371918e-05, 2.045370638370514e-05, 2.188701182603836e-05, 2.3320317268371582e-05, 2.4753622710704803e-05, 2.6186928153038025e-05, 2.7620233595371246e-05, 2.9053539037704468e-05, 3.048684448003769e-05, 3.192014992237091e-05, 3.335345536470413e-05, 3.4786760807037354e-05, 3.6220066249370575e-05, 3.7653371691703796e-05, 3.908667713403702e-05, 4.051998257637024e-05, 4.195328801870346e-05, 4.338659346103668e-05, 4.4819898903369904e-05, 4.6253204345703125e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 7.0, 12.0, 9.0, 31.0, 36.0, 42.0, 56.0, 107.0, 117.0, 196.0, 285.0, 516.0, 880.0, 1378.0, 2424.0, 4218.0, 7789.0, 14527.0, 29154.0, 63117.0, 149142.0, 357280.0, 236798.0, 94094.0, 42381.0, 20182.0, 10445.0, 5497.0, 3108.0, 1785.0, 1062.0, 672.0, 421.0, 262.0, 182.0, 114.0, 70.0, 60.0, 32.0, 26.0, 12.0, 14.0, 3.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10284423828125, -0.09938621520996094, -0.09592819213867188, -0.09247016906738281, -0.08901214599609375, -0.08555412292480469, -0.08209609985351562, -0.07863807678222656, -0.0751800537109375, -0.07172203063964844, -0.06826400756835938, -0.06480598449707031, -0.06134796142578125, -0.05788993835449219, -0.054431915283203125, -0.05097389221191406, -0.047515869140625, -0.04405784606933594, -0.040599822998046875, -0.03714179992675781, -0.03368377685546875, -0.030225753784179688, -0.026767730712890625, -0.023309707641601562, -0.0198516845703125, -0.016393661499023438, -0.012935638427734375, -0.009477615356445312, -0.00601959228515625, -0.0025615692138671875, 0.000896453857421875, 0.0043544769287109375, 0.0078125, 0.011270523071289062, 0.014728546142578125, 0.018186569213867188, 0.02164459228515625, 0.025102615356445312, 0.028560638427734375, 0.03201866149902344, 0.0354766845703125, 0.03893470764160156, 0.042392730712890625, 0.04585075378417969, 0.04930877685546875, 0.05276679992675781, 0.056224822998046875, 0.05968284606933594, 0.063140869140625, 0.06659889221191406, 0.07005691528320312, 0.07351493835449219, 0.07697296142578125, 0.08043098449707031, 0.08388900756835938, 0.08734703063964844, 0.0908050537109375, 0.09426307678222656, 0.09772109985351562, 0.10117912292480469, 0.10463714599609375, 0.10809516906738281, 0.11155319213867188, 0.11501121520996094, 0.11846923828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 2.0, 5.0, 7.0, 6.0, 14.0, 15.0, 10.0, 15.0, 28.0, 19.0, 18.0, 23.0, 46.0, 65.0, 68.0, 63.0, 72.0, 82.0, 63.0, 57.0, 66.0, 38.0, 41.0, 39.0, 23.0, 21.0, 19.0, 20.0, 10.0, 11.0, 9.0, 8.0, 0.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0290985107421875, -0.0281832218170166, -0.027267932891845703, -0.026352643966674805, -0.025437355041503906, -0.024522066116333008, -0.02360677719116211, -0.02269148826599121, -0.021776199340820312, -0.020860910415649414, -0.019945621490478516, -0.019030332565307617, -0.01811504364013672, -0.01719975471496582, -0.016284465789794922, -0.015369176864624023, -0.014453887939453125, -0.013538599014282227, -0.012623310089111328, -0.01170802116394043, -0.010792732238769531, -0.009877443313598633, -0.008962154388427734, -0.008046865463256836, -0.0071315765380859375, -0.006216287612915039, -0.005300998687744141, -0.004385709762573242, -0.0034704208374023438, -0.0025551319122314453, -0.0016398429870605469, -0.0007245540618896484, 0.00019073486328125, 0.0011060237884521484, 0.002021312713623047, 0.0029366016387939453, 0.0038518905639648438, 0.004767179489135742, 0.005682468414306641, 0.006597757339477539, 0.0075130462646484375, 0.008428335189819336, 0.009343624114990234, 0.010258913040161133, 0.011174201965332031, 0.01208949089050293, 0.013004779815673828, 0.013920068740844727, 0.014835357666015625, 0.015750646591186523, 0.016665935516357422, 0.01758122444152832, 0.01849651336669922, 0.019411802291870117, 0.020327091217041016, 0.021242380142211914, 0.022157669067382812, 0.02307295799255371, 0.02398824691772461, 0.024903535842895508, 0.025818824768066406, 0.026734113693237305, 0.027649402618408203, 0.0285646915435791, 0.02947998046875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 5.0, 6.0, 9.0, 7.0, 10.0, 19.0, 17.0, 22.0, 27.0, 29.0, 32.0, 44.0, 61.0, 51.0, 78.0, 67.0, 59.0, 53.0, 76.0, 56.0, 50.0, 37.0, 26.0, 30.0, 25.0, 23.0, 12.0, 12.0, 16.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-23.4033145904541, -22.75493049621582, -22.106548309326172, -21.45816421508789, -20.80978012084961, -20.161396026611328, -19.51301383972168, -18.8646297454834, -18.21624755859375, -17.56786346435547, -16.91948127746582, -16.27109718322754, -15.622713088989258, -14.974329948425293, -14.325946807861328, -13.677562713623047, -13.029178619384766, -12.3807954788208, -11.73241138458252, -11.084028244018555, -10.435644149780273, -9.787261009216309, -9.138877868652344, -8.490493774414062, -7.842110633850098, -7.193727016448975, -6.545343399047852, -5.896960258483887, -5.248576641082764, -4.600193023681641, -3.9518096446990967, -3.3034262657165527, -2.6550445556640625, -2.0066609382629395, -1.3582775592803955, -0.709894061088562, -0.061510562896728516, 0.5868730545043945, 1.2352564334869385, 1.8836398124694824, 2.5320234298706055, 3.1804070472717285, 3.8287904262542725, 4.477173805236816, 5.1255574226379395, 5.7739410400390625, 6.422324180603027, 7.07070779800415, 7.719091415405273, 8.367474555969238, 9.01585865020752, 9.664241790771484, 10.312625885009766, 10.96100902557373, 11.609392166137695, 12.257776260375977, 12.906159400939941, 13.554542541503906, 14.202926635742188, 14.851309776306152, 15.499692916870117, 16.1480770111084, 16.79646110534668, 17.444843292236328, 18.09322738647461]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 8.0, 7.0, 11.0, 12.0, 25.0, 12.0, 12.0, 13.0, 21.0, 14.0, 26.0, 21.0, 22.0, 15.0, 27.0, 37.0, 36.0, 41.0, 33.0, 31.0, 41.0, 42.0, 37.0, 37.0, 35.0, 22.0, 37.0, 32.0, 27.0, 30.0, 32.0, 17.0, 23.0, 18.0, 22.0, 19.0, 12.0, 12.0, 9.0, 8.0, 14.0, 3.0, 8.0, 7.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-15.122108459472656, -14.668652534484863, -14.21519660949707, -13.761741638183594, -13.3082857131958, -12.854829788208008, -12.401373863220215, -11.947917938232422, -11.494462966918945, -11.041007041931152, -10.58755111694336, -10.134096145629883, -9.68064022064209, -9.227184295654297, -8.773728370666504, -8.320272445678711, -7.866816520690918, -7.413360595703125, -6.95990514755249, -6.506449222564697, -6.0529937744140625, -5.5995378494262695, -5.146081924438477, -4.692625999450684, -4.239170551300049, -3.785714864730835, -3.332259178161621, -2.878803253173828, -2.4253475666046143, -1.9718918800354004, -1.5184359550476074, -1.0649802684783936, -0.6115236282348633, -0.15806788206100464, 0.295387864112854, 0.7488436698913574, 1.2022993564605713, 1.6557550430297852, 2.109210968017578, 2.562666654586792, 3.016122341156006, 3.4695780277252197, 3.9230337142944336, 4.376489639282227, 4.8299455642700195, 5.283401012420654, 5.736856937408447, 6.190312385559082, 6.643768310546875, 7.097224235534668, 7.550679683685303, 8.004135131835938, 8.45759105682373, 8.911046981811523, 9.364502906799316, 9.81795883178711, 10.271413803100586, 10.724869728088379, 11.178325653076172, 11.631780624389648, 12.085236549377441, 12.538692474365234, 12.992148399353027, 13.44560432434082, 13.899060249328613]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 14.0, 20.0, 42.0, 71.0, 73.0, 177.0, 218.0, 388.0, 603.0, 916.0, 1349.0, 2059.0, 3279.0, 4889.0, 7651.0, 11446.0, 17404.0, 26732.0, 40827.0, 62815.0, 94423.0, 132472.0, 159624.0, 148634.0, 111330.0, 76337.0, 50476.0, 32821.0, 21371.0, 13894.0, 9020.0, 5970.0, 3909.0, 2436.0, 1709.0, 1133.0, 750.0, 441.0, 281.0, 203.0, 137.0, 86.0, 52.0, 27.0, 19.0, 7.0, 8.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.140625, -21.39599609375, -20.6513671875, -19.90673828125, -19.162109375, -18.41748046875, -17.6728515625, -16.92822265625, -16.18359375, -15.43896484375, -14.6943359375, -13.94970703125, -13.205078125, -12.46044921875, -11.7158203125, -10.97119140625, -10.2265625, -9.48193359375, -8.7373046875, -7.99267578125, -7.248046875, -6.50341796875, -5.7587890625, -5.01416015625, -4.26953125, -3.52490234375, -2.7802734375, -2.03564453125, -1.291015625, -0.54638671875, 0.1982421875, 0.94287109375, 1.6875, 2.43212890625, 3.1767578125, 3.92138671875, 4.666015625, 5.41064453125, 6.1552734375, 6.89990234375, 7.64453125, 8.38916015625, 9.1337890625, 9.87841796875, 10.623046875, 11.36767578125, 12.1123046875, 12.85693359375, 13.6015625, 14.34619140625, 15.0908203125, 15.83544921875, 16.580078125, 17.32470703125, 18.0693359375, 18.81396484375, 19.55859375, 20.30322265625, 21.0478515625, 21.79248046875, 22.537109375, 23.28173828125, 24.0263671875, 24.77099609375, 25.515625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 6.0, 11.0, 16.0, 9.0, 16.0, 10.0, 22.0, 18.0, 16.0, 22.0, 17.0, 24.0, 27.0, 35.0, 30.0, 46.0, 31.0, 33.0, 38.0, 31.0, 47.0, 36.0, 48.0, 42.0, 33.0, 40.0, 34.0, 30.0, 23.0, 27.0, 24.0, 25.0, 20.0, 16.0, 16.0, 21.0, 10.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0], "bins": [-16.140625, -15.68310546875, -15.2255859375, -14.76806640625, -14.310546875, -13.85302734375, -13.3955078125, -12.93798828125, -12.48046875, -12.02294921875, -11.5654296875, -11.10791015625, -10.650390625, -10.19287109375, -9.7353515625, -9.27783203125, -8.8203125, -8.36279296875, -7.9052734375, -7.44775390625, -6.990234375, -6.53271484375, -6.0751953125, -5.61767578125, -5.16015625, -4.70263671875, -4.2451171875, -3.78759765625, -3.330078125, -2.87255859375, -2.4150390625, -1.95751953125, -1.5, -1.04248046875, -0.5849609375, -0.12744140625, 0.330078125, 0.78759765625, 1.2451171875, 1.70263671875, 2.16015625, 2.61767578125, 3.0751953125, 3.53271484375, 3.990234375, 4.44775390625, 4.9052734375, 5.36279296875, 5.8203125, 6.27783203125, 6.7353515625, 7.19287109375, 7.650390625, 8.10791015625, 8.5654296875, 9.02294921875, 9.48046875, 9.93798828125, 10.3955078125, 10.85302734375, 11.310546875, 11.76806640625, 12.2255859375, 12.68310546875, 13.140625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 8.0, 16.0, 26.0, 42.0, 62.0, 107.0, 121.0, 236.0, 341.0, 522.0, 789.0, 1190.0, 1922.0, 2890.0, 4623.0, 7024.0, 11229.0, 17359.0, 27376.0, 44151.0, 69343.0, 107371.0, 153791.0, 175974.0, 146711.0, 100123.0, 64508.0, 40520.0, 25401.0, 16048.0, 10271.0, 6606.0, 4138.0, 2765.0, 1757.0, 1093.0, 705.0, 453.0, 329.0, 215.0, 131.0, 90.0, 62.0, 41.0, 25.0, 17.0, 8.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.375, -22.580322265625, -21.78564453125, -20.990966796875, -20.1962890625, -19.401611328125, -18.60693359375, -17.812255859375, -17.017578125, -16.222900390625, -15.42822265625, -14.633544921875, -13.8388671875, -13.044189453125, -12.24951171875, -11.454833984375, -10.66015625, -9.865478515625, -9.07080078125, -8.276123046875, -7.4814453125, -6.686767578125, -5.89208984375, -5.097412109375, -4.302734375, -3.508056640625, -2.71337890625, -1.918701171875, -1.1240234375, -0.329345703125, 0.46533203125, 1.260009765625, 2.0546875, 2.849365234375, 3.64404296875, 4.438720703125, 5.2333984375, 6.028076171875, 6.82275390625, 7.617431640625, 8.412109375, 9.206787109375, 10.00146484375, 10.796142578125, 11.5908203125, 12.385498046875, 13.18017578125, 13.974853515625, 14.76953125, 15.564208984375, 16.35888671875, 17.153564453125, 17.9482421875, 18.742919921875, 19.53759765625, 20.332275390625, 21.126953125, 21.921630859375, 22.71630859375, 23.510986328125, 24.3056640625, 25.100341796875, 25.89501953125, 26.689697265625, 27.484375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 11.0, 8.0, 13.0, 18.0, 14.0, 33.0, 24.0, 26.0, 23.0, 20.0, 39.0, 28.0, 28.0, 31.0, 40.0, 30.0, 41.0, 49.0, 47.0, 40.0, 47.0, 30.0, 33.0, 42.0, 26.0, 25.0, 28.0, 23.0, 19.0, 21.0, 21.0, 17.0, 21.0, 9.0, 6.0, 13.0, 6.0, 12.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.109375, -8.8070068359375, -8.504638671875, -8.2022705078125, -7.89990234375, -7.5975341796875, -7.295166015625, -6.9927978515625, -6.6904296875, -6.3880615234375, -6.085693359375, -5.7833251953125, -5.48095703125, -5.1785888671875, -4.876220703125, -4.5738525390625, -4.271484375, -3.9691162109375, -3.666748046875, -3.3643798828125, -3.06201171875, -2.7596435546875, -2.457275390625, -2.1549072265625, -1.8525390625, -1.5501708984375, -1.247802734375, -0.9454345703125, -0.64306640625, -0.3406982421875, -0.038330078125, 0.2640380859375, 0.56640625, 0.8687744140625, 1.171142578125, 1.4735107421875, 1.77587890625, 2.0782470703125, 2.380615234375, 2.6829833984375, 2.9853515625, 3.2877197265625, 3.590087890625, 3.8924560546875, 4.19482421875, 4.4971923828125, 4.799560546875, 5.1019287109375, 5.404296875, 5.7066650390625, 6.009033203125, 6.3114013671875, 6.61376953125, 6.9161376953125, 7.218505859375, 7.5208740234375, 7.8232421875, 8.1256103515625, 8.427978515625, 8.7303466796875, 9.03271484375, 9.3350830078125, 9.637451171875, 9.9398193359375, 10.2421875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 22.0, 24.0, 20.0, 29.0, 38.0, 55.0, 71.0, 114.0, 159.0, 220.0, 288.0, 411.0, 557.0, 820.0, 1153.0, 1653.0, 2470.0, 3955.0, 5889.0, 9954.0, 18027.0, 34920.0, 82351.0, 254467.0, 396237.0, 128260.0, 49039.0, 23127.0, 12568.0, 7358.0, 4620.0, 2945.0, 2091.0, 1328.0, 910.0, 678.0, 424.0, 337.0, 256.0, 188.0, 148.0, 91.0, 70.0, 63.0, 36.0, 31.0, 12.0, 22.0, 11.0, 9.0, 6.0, 3.0, 8.0, 0.0, 1.0, 2.0], "bins": [-7.71875, -7.4791259765625, -7.239501953125, -6.9998779296875, -6.76025390625, -6.5206298828125, -6.281005859375, -6.0413818359375, -5.8017578125, -5.5621337890625, -5.322509765625, -5.0828857421875, -4.84326171875, -4.6036376953125, -4.364013671875, -4.1243896484375, -3.884765625, -3.6451416015625, -3.405517578125, -3.1658935546875, -2.92626953125, -2.6866455078125, -2.447021484375, -2.2073974609375, -1.9677734375, -1.7281494140625, -1.488525390625, -1.2489013671875, -1.00927734375, -0.7696533203125, -0.530029296875, -0.2904052734375, -0.05078125, 0.1888427734375, 0.428466796875, 0.6680908203125, 0.90771484375, 1.1473388671875, 1.386962890625, 1.6265869140625, 1.8662109375, 2.1058349609375, 2.345458984375, 2.5850830078125, 2.82470703125, 3.0643310546875, 3.303955078125, 3.5435791015625, 3.783203125, 4.0228271484375, 4.262451171875, 4.5020751953125, 4.74169921875, 4.9813232421875, 5.220947265625, 5.4605712890625, 5.7001953125, 5.9398193359375, 6.179443359375, 6.4190673828125, 6.65869140625, 6.8983154296875, 7.137939453125, 7.3775634765625, 7.6171875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 6.0, 8.0, 8.0, 8.0, 14.0, 10.0, 24.0, 23.0, 26.0, 37.0, 54.0, 62.0, 81.0, 80.0, 55.0, 88.0, 80.0, 57.0, 55.0, 46.0, 31.0, 28.0, 23.0, 14.0, 9.0, 13.0, 8.0, 10.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00035953521728515625, -0.00034700334072113037, -0.0003344714641571045, -0.0003219395875930786, -0.00030940771102905273, -0.00029687583446502686, -0.000284343957901001, -0.0002718120813369751, -0.0002592802047729492, -0.00024674832820892334, -0.00023421645164489746, -0.00022168457508087158, -0.0002091526985168457, -0.00019662082195281982, -0.00018408894538879395, -0.00017155706882476807, -0.0001590251922607422, -0.0001464933156967163, -0.00013396143913269043, -0.00012142956256866455, -0.00010889768600463867, -9.636580944061279e-05, -8.383393287658691e-05, -7.130205631256104e-05, -5.8770179748535156e-05, -4.623830318450928e-05, -3.37064266204834e-05, -2.117455005645752e-05, -8.64267349243164e-06, 3.889203071594238e-06, 1.6421079635620117e-05, 2.8952956199645996e-05, 4.1484832763671875e-05, 5.4016709327697754e-05, 6.654858589172363e-05, 7.908046245574951e-05, 9.161233901977539e-05, 0.00010414421558380127, 0.00011667609214782715, 0.00012920796871185303, 0.0001417398452758789, 0.00015427172183990479, 0.00016680359840393066, 0.00017933547496795654, 0.00019186735153198242, 0.0002043992280960083, 0.00021693110466003418, 0.00022946298122406006, 0.00024199485778808594, 0.0002545267343521118, 0.0002670586109161377, 0.0002795904874801636, 0.00029212236404418945, 0.00030465424060821533, 0.0003171861171722412, 0.0003297179937362671, 0.00034224987030029297, 0.00035478174686431885, 0.0003673136234283447, 0.0003798454999923706, 0.0003923773765563965, 0.00040490925312042236, 0.00041744112968444824, 0.0004299730062484741, 0.0004425048828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 10.0, 5.0, 16.0, 8.0, 19.0, 28.0, 37.0, 65.0, 85.0, 116.0, 234.0, 272.0, 435.0, 674.0, 1159.0, 1887.0, 3294.0, 5813.0, 10837.0, 22258.0, 54452.0, 220932.0, 529597.0, 121313.0, 38078.0, 16946.0, 8521.0, 4581.0, 2606.0, 1546.0, 937.0, 615.0, 402.0, 253.0, 147.0, 124.0, 65.0, 47.0, 33.0, 26.0, 32.0, 12.0, 9.0, 4.0, 7.0, 6.0, 3.0, 3.0, 3.0, 3.0], "bins": [-12.4921875, -12.148193359375, -11.80419921875, -11.460205078125, -11.1162109375, -10.772216796875, -10.42822265625, -10.084228515625, -9.740234375, -9.396240234375, -9.05224609375, -8.708251953125, -8.3642578125, -8.020263671875, -7.67626953125, -7.332275390625, -6.98828125, -6.644287109375, -6.30029296875, -5.956298828125, -5.6123046875, -5.268310546875, -4.92431640625, -4.580322265625, -4.236328125, -3.892333984375, -3.54833984375, -3.204345703125, -2.8603515625, -2.516357421875, -2.17236328125, -1.828369140625, -1.484375, -1.140380859375, -0.79638671875, -0.452392578125, -0.1083984375, 0.235595703125, 0.57958984375, 0.923583984375, 1.267578125, 1.611572265625, 1.95556640625, 2.299560546875, 2.6435546875, 2.987548828125, 3.33154296875, 3.675537109375, 4.01953125, 4.363525390625, 4.70751953125, 5.051513671875, 5.3955078125, 5.739501953125, 6.08349609375, 6.427490234375, 6.771484375, 7.115478515625, 7.45947265625, 7.803466796875, 8.1474609375, 8.491455078125, 8.83544921875, 9.179443359375, 9.5234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 7.0, 4.0, 5.0, 10.0, 20.0, 19.0, 25.0, 30.0, 26.0, 60.0, 102.0, 136.0, 138.0, 150.0, 65.0, 42.0, 28.0, 19.0, 16.0, 20.0, 14.0, 15.0, 10.0, 7.0, 6.0, 6.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.1796875, -4.075775146484375, -3.97186279296875, -3.867950439453125, -3.7640380859375, -3.660125732421875, -3.55621337890625, -3.452301025390625, -3.348388671875, -3.244476318359375, -3.14056396484375, -3.036651611328125, -2.9327392578125, -2.828826904296875, -2.72491455078125, -2.621002197265625, -2.51708984375, -2.413177490234375, -2.30926513671875, -2.205352783203125, -2.1014404296875, -1.997528076171875, -1.89361572265625, -1.789703369140625, -1.685791015625, -1.581878662109375, -1.47796630859375, -1.374053955078125, -1.2701416015625, -1.166229248046875, -1.06231689453125, -0.958404541015625, -0.8544921875, -0.750579833984375, -0.64666748046875, -0.542755126953125, -0.4388427734375, -0.334930419921875, -0.23101806640625, -0.127105712890625, -0.023193359375, 0.080718994140625, 0.18463134765625, 0.288543701171875, 0.3924560546875, 0.496368408203125, 0.60028076171875, 0.704193115234375, 0.80810546875, 0.912017822265625, 1.01593017578125, 1.119842529296875, 1.2237548828125, 1.327667236328125, 1.43157958984375, 1.535491943359375, 1.639404296875, 1.743316650390625, 1.84722900390625, 1.951141357421875, 2.0550537109375, 2.158966064453125, 2.26287841796875, 2.366790771484375, 2.470703125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 7.0, 6.0, 10.0, 9.0, 19.0, 23.0, 31.0, 47.0, 42.0, 71.0, 79.0, 77.0, 77.0, 74.0, 91.0, 54.0, 51.0, 35.0, 45.0, 22.0, 33.0, 23.0, 12.0, 9.0, 12.0, 7.0, 3.0, 6.0, 4.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.93549346923828, -27.198890686035156, -26.46228790283203, -25.72568702697754, -24.989084243774414, -24.25248146057129, -23.515880584716797, -22.779277801513672, -22.042675018310547, -21.306072235107422, -20.569469451904297, -19.832868576049805, -19.09626579284668, -18.359663009643555, -17.623062133789062, -16.886459350585938, -16.149856567382812, -15.413253784179688, -14.676651954650879, -13.94005012512207, -13.203447341918945, -12.46684455871582, -11.730242729187012, -10.993640899658203, -10.257038116455078, -9.520435333251953, -8.783833503723145, -8.047231674194336, -7.310628890991211, -6.574026584625244, -5.837424278259277, -5.1008219718933105, -4.364219665527344, -3.627617359161377, -2.89101505279541, -2.1544127464294434, -1.4178104400634766, -0.6812081336975098, 0.05539417266845703, 0.7919964790344238, 1.5285987854003906, 2.2652010917663574, 3.001803398132324, 3.738405704498291, 4.475008010864258, 5.211610317230225, 5.948212623596191, 6.684814929962158, 7.421417236328125, 8.15802001953125, 8.894621849060059, 9.631223678588867, 10.367826461791992, 11.104429244995117, 11.841031074523926, 12.577632904052734, 13.31423568725586, 14.050838470458984, 14.787440299987793, 15.524042129516602, 16.260644912719727, 16.99724769592285, 17.733848571777344, 18.47045135498047, 19.207054138183594]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 7.0, 6.0, 8.0, 7.0, 13.0, 9.0, 8.0, 16.0, 10.0, 12.0, 18.0, 25.0, 21.0, 28.0, 26.0, 26.0, 31.0, 28.0, 39.0, 28.0, 34.0, 38.0, 32.0, 33.0, 49.0, 31.0, 37.0, 32.0, 30.0, 32.0, 46.0, 29.0, 32.0, 25.0, 14.0, 15.0, 24.0, 14.0, 17.0, 18.0, 11.0, 6.0, 6.0, 4.0, 3.0, 2.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-14.85803508758545, -14.395015716552734, -13.93199634552002, -13.468976974487305, -13.005958557128906, -12.542938232421875, -12.079919815063477, -11.616900444030762, -11.153881072998047, -10.690861701965332, -10.227842330932617, -9.764822959899902, -9.301803588867188, -8.838785171508789, -8.375765800476074, -7.912746429443359, -7.4497270584106445, -6.98670768737793, -6.523688316345215, -6.060669422149658, -5.597650051116943, -5.1346306800842285, -4.671611785888672, -4.208592414855957, -3.745573043823242, -3.2825536727905273, -2.8195345401763916, -2.356515407562256, -1.893496036529541, -1.4304766654968262, -0.9674575328826904, -0.5044384002685547, -0.041419029235839844, 0.42160022258758545, 0.8846194744110107, 1.347638726234436, 1.8106579780578613, 2.273677349090576, 2.736696481704712, 3.1997156143188477, 3.6627349853515625, 4.125754356384277, 4.588773727416992, 5.051792621612549, 5.514811992645264, 5.9778313636779785, 6.440850257873535, 6.90386962890625, 7.366888999938965, 7.82990837097168, 8.292927742004395, 8.75594711303711, 9.218965530395508, 9.681985855102539, 10.145004272460938, 10.608023643493652, 11.071043014526367, 11.534062385559082, 11.997081756591797, 12.460101127624512, 12.923120498657227, 13.386138916015625, 13.84915828704834, 14.312177658081055, 14.77519702911377]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 11.0, 17.0, 33.0, 29.0, 55.0, 75.0, 129.0, 196.0, 300.0, 519.0, 779.0, 1108.0, 1629.0, 2514.0, 3733.0, 5666.0, 8779.0, 13807.0, 21915.0, 34353.0, 55539.0, 93205.0, 165806.0, 340835.0, 812809.0, 1216229.0, 730975.0, 308890.0, 151014.0, 86002.0, 51068.0, 31821.0, 19738.0, 12268.0, 7874.0, 5041.0, 3258.0, 2182.0, 1384.0, 915.0, 569.0, 430.0, 273.0, 174.0, 110.0, 79.0, 57.0, 38.0, 17.0, 16.0, 10.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.5, -18.879638671875, -18.25927734375, -17.638916015625, -17.0185546875, -16.398193359375, -15.77783203125, -15.157470703125, -14.537109375, -13.916748046875, -13.29638671875, -12.676025390625, -12.0556640625, -11.435302734375, -10.81494140625, -10.194580078125, -9.57421875, -8.953857421875, -8.33349609375, -7.713134765625, -7.0927734375, -6.472412109375, -5.85205078125, -5.231689453125, -4.611328125, -3.990966796875, -3.37060546875, -2.750244140625, -2.1298828125, -1.509521484375, -0.88916015625, -0.268798828125, 0.3515625, 0.971923828125, 1.59228515625, 2.212646484375, 2.8330078125, 3.453369140625, 4.07373046875, 4.694091796875, 5.314453125, 5.934814453125, 6.55517578125, 7.175537109375, 7.7958984375, 8.416259765625, 9.03662109375, 9.656982421875, 10.27734375, 10.897705078125, 11.51806640625, 12.138427734375, 12.7587890625, 13.379150390625, 13.99951171875, 14.619873046875, 15.240234375, 15.860595703125, 16.48095703125, 17.101318359375, 17.7216796875, 18.342041015625, 18.96240234375, 19.582763671875, 20.203125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 2.0, 6.0, 2.0, 13.0, 8.0, 13.0, 6.0, 8.0, 15.0, 19.0, 19.0, 22.0, 25.0, 18.0, 25.0, 26.0, 30.0, 42.0, 26.0, 36.0, 51.0, 45.0, 43.0, 28.0, 38.0, 34.0, 47.0, 38.0, 41.0, 30.0, 30.0, 27.0, 30.0, 24.0, 21.0, 18.0, 22.0, 14.0, 13.0, 7.0, 11.0, 8.0, 4.0, 2.0, 5.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.6875, -12.29248046875, -11.8974609375, -11.50244140625, -11.107421875, -10.71240234375, -10.3173828125, -9.92236328125, -9.52734375, -9.13232421875, -8.7373046875, -8.34228515625, -7.947265625, -7.55224609375, -7.1572265625, -6.76220703125, -6.3671875, -5.97216796875, -5.5771484375, -5.18212890625, -4.787109375, -4.39208984375, -3.9970703125, -3.60205078125, -3.20703125, -2.81201171875, -2.4169921875, -2.02197265625, -1.626953125, -1.23193359375, -0.8369140625, -0.44189453125, -0.046875, 0.34814453125, 0.7431640625, 1.13818359375, 1.533203125, 1.92822265625, 2.3232421875, 2.71826171875, 3.11328125, 3.50830078125, 3.9033203125, 4.29833984375, 4.693359375, 5.08837890625, 5.4833984375, 5.87841796875, 6.2734375, 6.66845703125, 7.0634765625, 7.45849609375, 7.853515625, 8.24853515625, 8.6435546875, 9.03857421875, 9.43359375, 9.82861328125, 10.2236328125, 10.61865234375, 11.013671875, 11.40869140625, 11.8037109375, 12.19873046875, 12.59375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 12.0, 12.0, 20.0, 25.0, 50.0, 74.0, 102.0, 173.0, 297.0, 472.0, 811.0, 1309.0, 2274.0, 3884.0, 6675.0, 11812.0, 21671.0, 38708.0, 73299.0, 140568.0, 287285.0, 611646.0, 1229891.0, 916720.0, 421668.0, 202238.0, 102401.0, 53776.0, 28989.0, 15826.0, 9138.0, 5189.0, 2981.0, 1722.0, 1034.0, 572.0, 354.0, 226.0, 147.0, 92.0, 61.0, 33.0, 18.0, 13.0, 4.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.953125, -22.25244140625, -21.5517578125, -20.85107421875, -20.150390625, -19.44970703125, -18.7490234375, -18.04833984375, -17.34765625, -16.64697265625, -15.9462890625, -15.24560546875, -14.544921875, -13.84423828125, -13.1435546875, -12.44287109375, -11.7421875, -11.04150390625, -10.3408203125, -9.64013671875, -8.939453125, -8.23876953125, -7.5380859375, -6.83740234375, -6.13671875, -5.43603515625, -4.7353515625, -4.03466796875, -3.333984375, -2.63330078125, -1.9326171875, -1.23193359375, -0.53125, 0.16943359375, 0.8701171875, 1.57080078125, 2.271484375, 2.97216796875, 3.6728515625, 4.37353515625, 5.07421875, 5.77490234375, 6.4755859375, 7.17626953125, 7.876953125, 8.57763671875, 9.2783203125, 9.97900390625, 10.6796875, 11.38037109375, 12.0810546875, 12.78173828125, 13.482421875, 14.18310546875, 14.8837890625, 15.58447265625, 16.28515625, 16.98583984375, 17.6865234375, 18.38720703125, 19.087890625, 19.78857421875, 20.4892578125, 21.18994140625, 21.890625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 13.0, 11.0, 24.0, 19.0, 20.0, 26.0, 40.0, 48.0, 58.0, 70.0, 85.0, 96.0, 147.0, 168.0, 191.0, 234.0, 275.0, 294.0, 328.0, 336.0, 240.0, 219.0, 202.0, 169.0, 133.0, 127.0, 103.0, 81.0, 69.0, 57.0, 42.0, 29.0, 31.0, 19.0, 22.0, 5.0, 16.0, 4.0, 2.0, 9.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.484375, -7.247802734375, -7.01123046875, -6.774658203125, -6.5380859375, -6.301513671875, -6.06494140625, -5.828369140625, -5.591796875, -5.355224609375, -5.11865234375, -4.882080078125, -4.6455078125, -4.408935546875, -4.17236328125, -3.935791015625, -3.69921875, -3.462646484375, -3.22607421875, -2.989501953125, -2.7529296875, -2.516357421875, -2.27978515625, -2.043212890625, -1.806640625, -1.570068359375, -1.33349609375, -1.096923828125, -0.8603515625, -0.623779296875, -0.38720703125, -0.150634765625, 0.0859375, 0.322509765625, 0.55908203125, 0.795654296875, 1.0322265625, 1.268798828125, 1.50537109375, 1.741943359375, 1.978515625, 2.215087890625, 2.45166015625, 2.688232421875, 2.9248046875, 3.161376953125, 3.39794921875, 3.634521484375, 3.87109375, 4.107666015625, 4.34423828125, 4.580810546875, 4.8173828125, 5.053955078125, 5.29052734375, 5.527099609375, 5.763671875, 6.000244140625, 6.23681640625, 6.473388671875, 6.7099609375, 6.946533203125, 7.18310546875, 7.419677734375, 7.65625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 9.0, 14.0, 12.0, 20.0, 28.0, 44.0, 56.0, 64.0, 55.0, 71.0, 92.0, 88.0, 78.0, 77.0, 54.0, 44.0, 51.0, 26.0, 21.0, 18.0, 11.0, 17.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-24.868572235107422, -24.219207763671875, -23.569843292236328, -22.92047882080078, -22.271114349365234, -21.621749877929688, -20.97238540649414, -20.323020935058594, -19.673656463623047, -19.0242919921875, -18.374927520751953, -17.725563049316406, -17.07619857788086, -16.426834106445312, -15.777469635009766, -15.128105163574219, -14.478740692138672, -13.829376220703125, -13.180011749267578, -12.530647277832031, -11.881282806396484, -11.231918334960938, -10.58255386352539, -9.933189392089844, -9.283824920654297, -8.63446044921875, -7.985095977783203, -7.335731506347656, -6.686367034912109, -6.0370025634765625, -5.387638092041016, -4.738273620605469, -4.088909149169922, -3.439544677734375, -2.790180206298828, -2.1408157348632812, -1.4914512634277344, -0.8420867919921875, -0.19272232055664062, 0.45664215087890625, 1.1060066223144531, 1.75537109375, 2.404735565185547, 3.0541000366210938, 3.7034645080566406, 4.3528289794921875, 5.002193450927734, 5.651557922363281, 6.300922393798828, 6.950286865234375, 7.599651336669922, 8.249015808105469, 8.898380279541016, 9.547744750976562, 10.19710922241211, 10.846473693847656, 11.495838165283203, 12.14520263671875, 12.794567108154297, 13.443931579589844, 14.09329605102539, 14.742660522460938, 15.392024993896484, 16.04138946533203, 16.690753936767578]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 13.0, 5.0, 3.0, 9.0, 12.0, 10.0, 11.0, 11.0, 22.0, 12.0, 25.0, 23.0, 26.0, 28.0, 23.0, 30.0, 33.0, 32.0, 41.0, 37.0, 39.0, 41.0, 63.0, 40.0, 43.0, 30.0, 40.0, 30.0, 30.0, 22.0, 34.0, 32.0, 31.0, 26.0, 25.0, 6.0, 12.0, 8.0, 6.0, 10.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-15.448772430419922, -15.000678062438965, -14.552583694458008, -14.10448932647705, -13.656394958496094, -13.208300590515137, -12.76020622253418, -12.312111854553223, -11.864017486572266, -11.415923118591309, -10.967828750610352, -10.519734382629395, -10.071640014648438, -9.62354564666748, -9.175451278686523, -8.727356910705566, -8.27926254272461, -7.831168174743652, -7.383073806762695, -6.934979438781738, -6.486885070800781, -6.038790702819824, -5.590696334838867, -5.14260196685791, -4.694507598876953, -4.246413230895996, -3.798318862915039, -3.350224494934082, -2.902130126953125, -2.454035758972168, -2.005941390991211, -1.557847023010254, -1.1097526550292969, -0.6616582870483398, -0.2135639190673828, 0.23453044891357422, 0.6826248168945312, 1.1307191848754883, 1.5788135528564453, 2.0269079208374023, 2.4750022888183594, 2.9230966567993164, 3.3711910247802734, 3.8192853927612305, 4.2673797607421875, 4.7154741287231445, 5.163568496704102, 5.611662864685059, 6.059757232666016, 6.507851600646973, 6.95594596862793, 7.404040336608887, 7.852134704589844, 8.3002290725708, 8.748323440551758, 9.196417808532715, 9.644512176513672, 10.092606544494629, 10.540700912475586, 10.988795280456543, 11.4368896484375, 11.884984016418457, 12.333078384399414, 12.781172752380371, 13.229267120361328]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 11.0, 13.0, 36.0, 39.0, 75.0, 74.0, 128.0, 177.0, 286.0, 407.0, 584.0, 794.0, 1118.0, 1648.0, 2389.0, 3429.0, 4865.0, 7013.0, 10122.0, 14848.0, 21769.0, 32807.0, 49982.0, 75403.0, 115211.0, 181893.0, 180699.0, 115038.0, 75239.0, 49523.0, 32936.0, 22033.0, 14922.0, 10169.0, 6999.0, 4669.0, 3369.0, 2375.0, 1600.0, 1236.0, 817.0, 563.0, 370.0, 273.0, 207.0, 128.0, 87.0, 51.0, 59.0, 23.0, 14.0, 14.0, 12.0, 9.0, 4.0, 4.0], "bins": [-6.25, -6.066162109375, -5.88232421875, -5.698486328125, -5.5146484375, -5.330810546875, -5.14697265625, -4.963134765625, -4.779296875, -4.595458984375, -4.41162109375, -4.227783203125, -4.0439453125, -3.860107421875, -3.67626953125, -3.492431640625, -3.30859375, -3.124755859375, -2.94091796875, -2.757080078125, -2.5732421875, -2.389404296875, -2.20556640625, -2.021728515625, -1.837890625, -1.654052734375, -1.47021484375, -1.286376953125, -1.1025390625, -0.918701171875, -0.73486328125, -0.551025390625, -0.3671875, -0.183349609375, 0.00048828125, 0.184326171875, 0.3681640625, 0.552001953125, 0.73583984375, 0.919677734375, 1.103515625, 1.287353515625, 1.47119140625, 1.655029296875, 1.8388671875, 2.022705078125, 2.20654296875, 2.390380859375, 2.57421875, 2.758056640625, 2.94189453125, 3.125732421875, 3.3095703125, 3.493408203125, 3.67724609375, 3.861083984375, 4.044921875, 4.228759765625, 4.41259765625, 4.596435546875, 4.7802734375, 4.964111328125, 5.14794921875, 5.331787109375, 5.515625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 5.0, 6.0, 7.0, 7.0, 7.0, 12.0, 7.0, 9.0, 8.0, 11.0, 11.0, 11.0, 31.0, 17.0, 29.0, 33.0, 29.0, 33.0, 31.0, 38.0, 41.0, 30.0, 50.0, 42.0, 38.0, 46.0, 39.0, 35.0, 48.0, 26.0, 42.0, 38.0, 26.0, 38.0, 22.0, 18.0, 13.0, 17.0, 16.0, 3.0, 7.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.6875, -16.216064453125, -15.74462890625, -15.273193359375, -14.8017578125, -14.330322265625, -13.85888671875, -13.387451171875, -12.916015625, -12.444580078125, -11.97314453125, -11.501708984375, -11.0302734375, -10.558837890625, -10.08740234375, -9.615966796875, -9.14453125, -8.673095703125, -8.20166015625, -7.730224609375, -7.2587890625, -6.787353515625, -6.31591796875, -5.844482421875, -5.373046875, -4.901611328125, -4.43017578125, -3.958740234375, -3.4873046875, -3.015869140625, -2.54443359375, -2.072998046875, -1.6015625, -1.130126953125, -0.65869140625, -0.187255859375, 0.2841796875, 0.755615234375, 1.22705078125, 1.698486328125, 2.169921875, 2.641357421875, 3.11279296875, 3.584228515625, 4.0556640625, 4.527099609375, 4.99853515625, 5.469970703125, 5.94140625, 6.412841796875, 6.88427734375, 7.355712890625, 7.8271484375, 8.298583984375, 8.77001953125, 9.241455078125, 9.712890625, 10.184326171875, 10.65576171875, 11.127197265625, 11.5986328125, 12.070068359375, 12.54150390625, 13.012939453125, 13.484375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 20.0, 19.0, 26.0, 49.0, 79.0, 124.0, 188.0, 326.0, 640.0, 1118.0, 1898.0, 3298.0, 6327.0, 11846.0, 23933.0, 49101.0, 103949.0, 232619.0, 327538.0, 148419.0, 69183.0, 32962.0, 16398.0, 8327.0, 4380.0, 2468.0, 1390.0, 760.0, 460.0, 273.0, 148.0, 96.0, 65.0, 38.0, 24.0, 17.0, 10.0, 9.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.7900390625, -9.455078125, -9.1201171875, -8.78515625, -8.4501953125, -8.115234375, -7.7802734375, -7.4453125, -7.1103515625, -6.775390625, -6.4404296875, -6.10546875, -5.7705078125, -5.435546875, -5.1005859375, -4.765625, -4.4306640625, -4.095703125, -3.7607421875, -3.42578125, -3.0908203125, -2.755859375, -2.4208984375, -2.0859375, -1.7509765625, -1.416015625, -1.0810546875, -0.74609375, -0.4111328125, -0.076171875, 0.2587890625, 0.59375, 0.9287109375, 1.263671875, 1.5986328125, 1.93359375, 2.2685546875, 2.603515625, 2.9384765625, 3.2734375, 3.6083984375, 3.943359375, 4.2783203125, 4.61328125, 4.9482421875, 5.283203125, 5.6181640625, 5.953125, 6.2880859375, 6.623046875, 6.9580078125, 7.29296875, 7.6279296875, 7.962890625, 8.2978515625, 8.6328125, 8.9677734375, 9.302734375, 9.6376953125, 9.97265625, 10.3076171875, 10.642578125, 10.9775390625, 11.3125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 8.0, 5.0, 8.0, 4.0, 11.0, 12.0, 15.0, 22.0, 21.0, 18.0, 23.0, 24.0, 29.0, 39.0, 36.0, 27.0, 40.0, 37.0, 35.0, 50.0, 30.0, 35.0, 40.0, 44.0, 38.0, 32.0, 40.0, 31.0, 25.0, 34.0, 25.0, 24.0, 21.0, 17.0, 24.0, 13.0, 10.0, 10.0, 11.0, 5.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2265625, -8.9149169921875, -8.603271484375, -8.2916259765625, -7.97998046875, -7.6683349609375, -7.356689453125, -7.0450439453125, -6.7333984375, -6.4217529296875, -6.110107421875, -5.7984619140625, -5.48681640625, -5.1751708984375, -4.863525390625, -4.5518798828125, -4.240234375, -3.9285888671875, -3.616943359375, -3.3052978515625, -2.99365234375, -2.6820068359375, -2.370361328125, -2.0587158203125, -1.7470703125, -1.4354248046875, -1.123779296875, -0.8121337890625, -0.50048828125, -0.1888427734375, 0.122802734375, 0.4344482421875, 0.74609375, 1.0577392578125, 1.369384765625, 1.6810302734375, 1.99267578125, 2.3043212890625, 2.615966796875, 2.9276123046875, 3.2392578125, 3.5509033203125, 3.862548828125, 4.1741943359375, 4.48583984375, 4.7974853515625, 5.109130859375, 5.4207763671875, 5.732421875, 6.0440673828125, 6.355712890625, 6.6673583984375, 6.97900390625, 7.2906494140625, 7.602294921875, 7.9139404296875, 8.2255859375, 8.5372314453125, 8.848876953125, 9.1605224609375, 9.47216796875, 9.7838134765625, 10.095458984375, 10.4071044921875, 10.71875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 9.0, 11.0, 28.0, 29.0, 35.0, 60.0, 86.0, 159.0, 263.0, 350.0, 562.0, 936.0, 1603.0, 2739.0, 4992.0, 9343.0, 18660.0, 41564.0, 112768.0, 382750.0, 309052.0, 91986.0, 35294.0, 16325.0, 8187.0, 4524.0, 2420.0, 1455.0, 877.0, 547.0, 356.0, 200.0, 120.0, 87.0, 64.0, 34.0, 26.0, 13.0, 11.0, 10.0, 4.0, 4.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0938720703125, -0.09118270874023438, -0.08849334716796875, -0.08580398559570312, -0.0831146240234375, -0.08042526245117188, -0.07773590087890625, -0.07504653930664062, -0.072357177734375, -0.06966781616210938, -0.06697845458984375, -0.06428909301757812, -0.0615997314453125, -0.058910369873046875, -0.05622100830078125, -0.053531646728515625, -0.05084228515625, -0.048152923583984375, -0.04546356201171875, -0.042774200439453125, -0.0400848388671875, -0.037395477294921875, -0.03470611572265625, -0.032016754150390625, -0.029327392578125, -0.026638031005859375, -0.02394866943359375, -0.021259307861328125, -0.0185699462890625, -0.015880584716796875, -0.01319122314453125, -0.010501861572265625, -0.0078125, -0.005123138427734375, -0.00243377685546875, 0.000255584716796875, 0.0029449462890625, 0.005634307861328125, 0.00832366943359375, 0.011013031005859375, 0.013702392578125, 0.016391754150390625, 0.01908111572265625, 0.021770477294921875, 0.0244598388671875, 0.027149200439453125, 0.02983856201171875, 0.032527923583984375, 0.03521728515625, 0.037906646728515625, 0.04059600830078125, 0.043285369873046875, 0.0459747314453125, 0.048664093017578125, 0.05135345458984375, 0.054042816162109375, 0.056732177734375, 0.059421539306640625, 0.06211090087890625, 0.06480026245117188, 0.0674896240234375, 0.07017898559570312, 0.07286834716796875, 0.07555770874023438, 0.0782470703125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 2.0, 6.0, 5.0, 6.0, 20.0, 9.0, 20.0, 19.0, 30.0, 38.0, 45.0, 66.0, 89.0, 102.0, 98.0, 100.0, 67.0, 59.0, 47.0, 42.0, 33.0, 30.0, 15.0, 14.0, 5.0, 10.0, 4.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.208087921142578e-05, -4.088599234819412e-05, -3.969110548496246e-05, -3.8496218621730804e-05, -3.7301331758499146e-05, -3.6106444895267487e-05, -3.491155803203583e-05, -3.371667116880417e-05, -3.252178430557251e-05, -3.132689744234085e-05, -3.0132010579109192e-05, -2.8937123715877533e-05, -2.7742236852645874e-05, -2.6547349989414215e-05, -2.5352463126182556e-05, -2.4157576262950897e-05, -2.2962689399719238e-05, -2.176780253648758e-05, -2.057291567325592e-05, -1.937802881002426e-05, -1.8183141946792603e-05, -1.6988255083560944e-05, -1.5793368220329285e-05, -1.4598481357097626e-05, -1.3403594493865967e-05, -1.2208707630634308e-05, -1.1013820767402649e-05, -9.81893390417099e-06, -8.624047040939331e-06, -7.429160177707672e-06, -6.234273314476013e-06, -5.039386451244354e-06, -3.844499588012695e-06, -2.6496127247810364e-06, -1.4547258615493774e-06, -2.598389983177185e-07, 9.350478649139404e-07, 2.1299347281455994e-06, 3.3248215913772583e-06, 4.519708454608917e-06, 5.714595317840576e-06, 6.909482181072235e-06, 8.104369044303894e-06, 9.299255907535553e-06, 1.0494142770767212e-05, 1.1689029633998871e-05, 1.288391649723053e-05, 1.4078803360462189e-05, 1.5273690223693848e-05, 1.6468577086925507e-05, 1.7663463950157166e-05, 1.8858350813388824e-05, 2.0053237676620483e-05, 2.1248124539852142e-05, 2.24430114030838e-05, 2.363789826631546e-05, 2.483278512954712e-05, 2.6027671992778778e-05, 2.7222558856010437e-05, 2.8417445719242096e-05, 2.9612332582473755e-05, 3.0807219445705414e-05, 3.200210630893707e-05, 3.319699317216873e-05, 3.439188003540039e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 9.0, 22.0, 26.0, 37.0, 40.0, 58.0, 91.0, 153.0, 242.0, 307.0, 446.0, 681.0, 964.0, 1485.0, 2172.0, 3011.0, 4638.0, 7070.0, 10625.0, 16863.0, 27107.0, 45790.0, 80796.0, 153832.0, 265836.0, 187773.0, 97723.0, 53346.0, 31233.0, 19369.0, 12330.0, 8008.0, 5325.0, 3576.0, 2361.0, 1691.0, 1103.0, 754.0, 504.0, 381.0, 235.0, 180.0, 118.0, 80.0, 49.0, 22.0, 30.0, 23.0, 16.0, 12.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.051177978515625, -0.0495610237121582, -0.047944068908691406, -0.04632711410522461, -0.04471015930175781, -0.043093204498291016, -0.04147624969482422, -0.03985929489135742, -0.038242340087890625, -0.03662538528442383, -0.03500843048095703, -0.033391475677490234, -0.03177452087402344, -0.03015756607055664, -0.028540611267089844, -0.026923656463623047, -0.02530670166015625, -0.023689746856689453, -0.022072792053222656, -0.02045583724975586, -0.018838882446289062, -0.017221927642822266, -0.015604972839355469, -0.013988018035888672, -0.012371063232421875, -0.010754108428955078, -0.009137153625488281, -0.007520198822021484, -0.0059032440185546875, -0.004286289215087891, -0.0026693344116210938, -0.0010523796081542969, 0.0005645751953125, 0.002181529998779297, 0.0037984848022460938, 0.005415439605712891, 0.0070323944091796875, 0.008649349212646484, 0.010266304016113281, 0.011883258819580078, 0.013500213623046875, 0.015117168426513672, 0.01673412322998047, 0.018351078033447266, 0.019968032836914062, 0.02158498764038086, 0.023201942443847656, 0.024818897247314453, 0.02643585205078125, 0.028052806854248047, 0.029669761657714844, 0.03128671646118164, 0.03290367126464844, 0.034520626068115234, 0.03613758087158203, 0.03775453567504883, 0.039371490478515625, 0.04098844528198242, 0.04260540008544922, 0.044222354888916016, 0.04583930969238281, 0.04745626449584961, 0.049073219299316406, 0.0506901741027832, 0.05230712890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 5.0, 8.0, 5.0, 12.0, 8.0, 14.0, 16.0, 17.0, 22.0, 26.0, 28.0, 33.0, 42.0, 42.0, 48.0, 79.0, 64.0, 54.0, 65.0, 67.0, 45.0, 46.0, 47.0, 37.0, 28.0, 24.0, 16.0, 14.0, 12.0, 17.0, 15.0, 6.0, 6.0, 4.0, 6.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01558685302734375, -0.015092730522155762, -0.014598608016967773, -0.014104485511779785, -0.013610363006591797, -0.013116240501403809, -0.01262211799621582, -0.012127995491027832, -0.011633872985839844, -0.011139750480651855, -0.010645627975463867, -0.010151505470275879, -0.00965738296508789, -0.009163260459899902, -0.008669137954711914, -0.008175015449523926, -0.0076808929443359375, -0.007186770439147949, -0.006692647933959961, -0.006198525428771973, -0.005704402923583984, -0.005210280418395996, -0.004716157913208008, -0.0042220354080200195, -0.0037279129028320312, -0.003233790397644043, -0.0027396678924560547, -0.0022455453872680664, -0.0017514228820800781, -0.0012573003768920898, -0.0007631778717041016, -0.0002690553665161133, 0.000225067138671875, 0.0007191896438598633, 0.0012133121490478516, 0.0017074346542358398, 0.002201557159423828, 0.0026956796646118164, 0.0031898021697998047, 0.003683924674987793, 0.004178047180175781, 0.0046721696853637695, 0.005166292190551758, 0.005660414695739746, 0.006154537200927734, 0.006648659706115723, 0.007142782211303711, 0.007636904716491699, 0.008131027221679688, 0.008625149726867676, 0.009119272232055664, 0.009613394737243652, 0.01010751724243164, 0.010601639747619629, 0.011095762252807617, 0.011589884757995605, 0.012084007263183594, 0.012578129768371582, 0.01307225227355957, 0.013566374778747559, 0.014060497283935547, 0.014554619789123535, 0.015048742294311523, 0.015542864799499512, 0.0160369873046875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 12.0, 10.0, 8.0, 10.0, 20.0, 22.0, 37.0, 49.0, 61.0, 59.0, 72.0, 83.0, 87.0, 79.0, 78.0, 73.0, 49.0, 42.0, 35.0, 27.0, 17.0, 12.0, 14.0, 10.0, 13.0, 7.0, 5.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-24.857423782348633, -24.2154483795166, -23.57347297668457, -22.931495666503906, -22.289520263671875, -21.647544860839844, -21.005569458007812, -20.36359405517578, -19.72161865234375, -19.07964324951172, -18.437667846679688, -17.795690536499023, -17.153715133666992, -16.51173973083496, -15.86976432800293, -15.227788925170898, -14.585811614990234, -13.943836212158203, -13.301859855651855, -12.659884452819824, -12.017908096313477, -11.375932693481445, -10.733957290649414, -10.091981887817383, -9.450005531311035, -8.808030128479004, -8.166053771972656, -7.524078369140625, -6.8821024894714355, -6.240126609802246, -5.598151206970215, -4.956175327301025, -4.314199447631836, -3.6722235679626465, -3.030247926712036, -2.388272285461426, -1.7462964057922363, -1.1043205261230469, -0.4623448848724365, 0.17963075637817383, 0.8216066360473633, 1.4635823965072632, 2.105558156967163, 2.7475337982177734, 3.389509677886963, 4.031485557556152, 4.673460960388184, 5.315436840057373, 5.9574127197265625, 6.599388599395752, 7.241364479064941, 7.883339881896973, 8.52531623840332, 9.167291641235352, 9.809267044067383, 10.451242446899414, 11.093218803405762, 11.735194206237793, 12.37717056274414, 13.019145965576172, 13.661121368408203, 14.30309772491455, 14.945073127746582, 15.58704948425293, 16.22902488708496]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 6.0, 13.0, 5.0, 2.0, 10.0, 13.0, 8.0, 12.0, 11.0, 22.0, 12.0, 26.0, 22.0, 26.0, 29.0, 23.0, 30.0, 35.0, 30.0, 42.0, 36.0, 39.0, 41.0, 59.0, 42.0, 43.0, 30.0, 42.0, 28.0, 29.0, 23.0, 36.0, 27.0, 35.0, 27.0, 22.0, 8.0, 12.0, 8.0, 5.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-15.175042152404785, -14.735896110534668, -14.29675006866455, -13.857604026794434, -13.418457984924316, -12.9793119430542, -12.540165901184082, -12.101019859313965, -11.661873817443848, -11.22272777557373, -10.783581733703613, -10.344435691833496, -9.905289649963379, -9.466143608093262, -9.026997566223145, -8.587851524353027, -8.14870548248291, -7.709559440612793, -7.270413398742676, -6.831267356872559, -6.392121315002441, -5.952975273132324, -5.513829231262207, -5.07468318939209, -4.635537147521973, -4.1963911056518555, -3.7572450637817383, -3.318099021911621, -2.878952980041504, -2.4398069381713867, -2.0006608963012695, -1.5615148544311523, -1.1223678588867188, -0.6832218170166016, -0.24407577514648438, 0.1950702667236328, 0.63421630859375, 1.0733623504638672, 1.5125083923339844, 1.9516544342041016, 2.3908004760742188, 2.829946517944336, 3.269092559814453, 3.7082386016845703, 4.1473846435546875, 4.586530685424805, 5.025676727294922, 5.464822769165039, 5.903968811035156, 6.343114852905273, 6.782260894775391, 7.221406936645508, 7.660552978515625, 8.099699020385742, 8.53884506225586, 8.977991104125977, 9.417137145996094, 9.856283187866211, 10.295429229736328, 10.734575271606445, 11.173721313476562, 11.61286735534668, 12.052013397216797, 12.491159439086914, 12.930305480957031]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 6.0, 5.0, 11.0, 12.0, 18.0, 31.0, 59.0, 63.0, 85.0, 137.0, 208.0, 252.0, 348.0, 535.0, 712.0, 1023.0, 1501.0, 2026.0, 2926.0, 4195.0, 5932.0, 8488.0, 12472.0, 18172.0, 26539.0, 39248.0, 57245.0, 81077.0, 110488.0, 135323.0, 138489.0, 116206.0, 86994.0, 62217.0, 42658.0, 28990.0, 20027.0, 13629.0, 9201.0, 6408.0, 4303.0, 3029.0, 2190.0, 1464.0, 1083.0, 747.0, 574.0, 371.0, 268.0, 189.0, 116.0, 74.0, 63.0, 44.0, 30.0, 28.0, 15.0, 12.0, 2.0, 7.0, 0.0, 4.0], "bins": [-16.65625, -16.137451171875, -15.61865234375, -15.099853515625, -14.5810546875, -14.062255859375, -13.54345703125, -13.024658203125, -12.505859375, -11.987060546875, -11.46826171875, -10.949462890625, -10.4306640625, -9.911865234375, -9.39306640625, -8.874267578125, -8.35546875, -7.836669921875, -7.31787109375, -6.799072265625, -6.2802734375, -5.761474609375, -5.24267578125, -4.723876953125, -4.205078125, -3.686279296875, -3.16748046875, -2.648681640625, -2.1298828125, -1.611083984375, -1.09228515625, -0.573486328125, -0.0546875, 0.464111328125, 0.98291015625, 1.501708984375, 2.0205078125, 2.539306640625, 3.05810546875, 3.576904296875, 4.095703125, 4.614501953125, 5.13330078125, 5.652099609375, 6.1708984375, 6.689697265625, 7.20849609375, 7.727294921875, 8.24609375, 8.764892578125, 9.28369140625, 9.802490234375, 10.3212890625, 10.840087890625, 11.35888671875, 11.877685546875, 12.396484375, 12.915283203125, 13.43408203125, 13.952880859375, 14.4716796875, 14.990478515625, 15.50927734375, 16.028076171875, 16.546875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 3.0, 5.0, 7.0, 8.0, 6.0, 8.0, 15.0, 7.0, 14.0, 18.0, 14.0, 16.0, 22.0, 22.0, 25.0, 39.0, 21.0, 33.0, 28.0, 33.0, 35.0, 43.0, 51.0, 42.0, 47.0, 36.0, 27.0, 43.0, 34.0, 33.0, 23.0, 29.0, 37.0, 33.0, 27.0, 21.0, 20.0, 17.0, 17.0, 5.0, 3.0, 11.0, 10.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6328125, -12.2451171875, -11.857421875, -11.4697265625, -11.08203125, -10.6943359375, -10.306640625, -9.9189453125, -9.53125, -9.1435546875, -8.755859375, -8.3681640625, -7.98046875, -7.5927734375, -7.205078125, -6.8173828125, -6.4296875, -6.0419921875, -5.654296875, -5.2666015625, -4.87890625, -4.4912109375, -4.103515625, -3.7158203125, -3.328125, -2.9404296875, -2.552734375, -2.1650390625, -1.77734375, -1.3896484375, -1.001953125, -0.6142578125, -0.2265625, 0.1611328125, 0.548828125, 0.9365234375, 1.32421875, 1.7119140625, 2.099609375, 2.4873046875, 2.875, 3.2626953125, 3.650390625, 4.0380859375, 4.42578125, 4.8134765625, 5.201171875, 5.5888671875, 5.9765625, 6.3642578125, 6.751953125, 7.1396484375, 7.52734375, 7.9150390625, 8.302734375, 8.6904296875, 9.078125, 9.4658203125, 9.853515625, 10.2412109375, 10.62890625, 11.0166015625, 11.404296875, 11.7919921875, 12.1796875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 12.0, 14.0, 27.0, 41.0, 56.0, 100.0, 120.0, 196.0, 334.0, 472.0, 681.0, 1010.0, 1541.0, 2365.0, 3527.0, 5305.0, 8195.0, 12017.0, 18615.0, 28099.0, 42576.0, 65513.0, 97276.0, 138864.0, 166588.0, 146003.0, 103842.0, 70287.0, 46232.0, 30440.0, 19827.0, 13173.0, 8481.0, 5668.0, 3792.0, 2462.0, 1634.0, 1113.0, 698.0, 435.0, 336.0, 197.0, 133.0, 94.0, 59.0, 37.0, 31.0, 14.0, 11.0, 7.0, 3.0, 5.0, 0.0, 0.0, 1.0], "bins": [-20.046875, -19.449951171875, -18.85302734375, -18.256103515625, -17.6591796875, -17.062255859375, -16.46533203125, -15.868408203125, -15.271484375, -14.674560546875, -14.07763671875, -13.480712890625, -12.8837890625, -12.286865234375, -11.68994140625, -11.093017578125, -10.49609375, -9.899169921875, -9.30224609375, -8.705322265625, -8.1083984375, -7.511474609375, -6.91455078125, -6.317626953125, -5.720703125, -5.123779296875, -4.52685546875, -3.929931640625, -3.3330078125, -2.736083984375, -2.13916015625, -1.542236328125, -0.9453125, -0.348388671875, 0.24853515625, 0.845458984375, 1.4423828125, 2.039306640625, 2.63623046875, 3.233154296875, 3.830078125, 4.427001953125, 5.02392578125, 5.620849609375, 6.2177734375, 6.814697265625, 7.41162109375, 8.008544921875, 8.60546875, 9.202392578125, 9.79931640625, 10.396240234375, 10.9931640625, 11.590087890625, 12.18701171875, 12.783935546875, 13.380859375, 13.977783203125, 14.57470703125, 15.171630859375, 15.7685546875, 16.365478515625, 16.96240234375, 17.559326171875, 18.15625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 5.0, 10.0, 14.0, 11.0, 22.0, 10.0, 17.0, 19.0, 25.0, 29.0, 25.0, 26.0, 29.0, 30.0, 27.0, 28.0, 30.0, 36.0, 42.0, 38.0, 37.0, 31.0, 31.0, 38.0, 31.0, 31.0, 35.0, 28.0, 20.0, 29.0, 24.0, 28.0, 19.0, 19.0, 16.0, 13.0, 13.0, 14.0, 12.0, 16.0, 5.0, 9.0, 8.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-7.34375, -7.11248779296875, -6.8812255859375, -6.64996337890625, -6.418701171875, -6.18743896484375, -5.9561767578125, -5.72491455078125, -5.49365234375, -5.26239013671875, -5.0311279296875, -4.79986572265625, -4.568603515625, -4.33734130859375, -4.1060791015625, -3.87481689453125, -3.6435546875, -3.41229248046875, -3.1810302734375, -2.94976806640625, -2.718505859375, -2.48724365234375, -2.2559814453125, -2.02471923828125, -1.79345703125, -1.56219482421875, -1.3309326171875, -1.09967041015625, -0.868408203125, -0.63714599609375, -0.4058837890625, -0.17462158203125, 0.056640625, 0.28790283203125, 0.5191650390625, 0.75042724609375, 0.981689453125, 1.21295166015625, 1.4442138671875, 1.67547607421875, 1.90673828125, 2.13800048828125, 2.3692626953125, 2.60052490234375, 2.831787109375, 3.06304931640625, 3.2943115234375, 3.52557373046875, 3.7568359375, 3.98809814453125, 4.2193603515625, 4.45062255859375, 4.681884765625, 4.91314697265625, 5.1444091796875, 5.37567138671875, 5.60693359375, 5.83819580078125, 6.0694580078125, 6.30072021484375, 6.531982421875, 6.76324462890625, 6.9945068359375, 7.22576904296875, 7.45703125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 10.0, 5.0, 10.0, 5.0, 21.0, 22.0, 35.0, 61.0, 72.0, 125.0, 219.0, 365.0, 591.0, 974.0, 1604.0, 2698.0, 4852.0, 9355.0, 19711.0, 48251.0, 170460.0, 567910.0, 140995.0, 42786.0, 17709.0, 8689.0, 4502.0, 2618.0, 1540.0, 920.0, 567.0, 318.0, 179.0, 136.0, 79.0, 48.0, 35.0, 24.0, 13.0, 16.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.7647705078125, -8.467041015625, -8.1693115234375, -7.87158203125, -7.5738525390625, -7.276123046875, -6.9783935546875, -6.6806640625, -6.3829345703125, -6.085205078125, -5.7874755859375, -5.48974609375, -5.1920166015625, -4.894287109375, -4.5965576171875, -4.298828125, -4.0010986328125, -3.703369140625, -3.4056396484375, -3.10791015625, -2.8101806640625, -2.512451171875, -2.2147216796875, -1.9169921875, -1.6192626953125, -1.321533203125, -1.0238037109375, -0.72607421875, -0.4283447265625, -0.130615234375, 0.1671142578125, 0.46484375, 0.7625732421875, 1.060302734375, 1.3580322265625, 1.65576171875, 1.9534912109375, 2.251220703125, 2.5489501953125, 2.8466796875, 3.1444091796875, 3.442138671875, 3.7398681640625, 4.03759765625, 4.3353271484375, 4.633056640625, 4.9307861328125, 5.228515625, 5.5262451171875, 5.823974609375, 6.1217041015625, 6.41943359375, 6.7171630859375, 7.014892578125, 7.3126220703125, 7.6103515625, 7.9080810546875, 8.205810546875, 8.5035400390625, 8.80126953125, 9.0989990234375, 9.396728515625, 9.6944580078125, 9.9921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 4.0, 7.0, 8.0, 16.0, 19.0, 28.0, 35.0, 58.0, 82.0, 129.0, 136.0, 139.0, 78.0, 57.0, 50.0, 33.0, 20.0, 17.0, 11.0, 10.0, 7.0, 10.0, 9.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004432201385498047, -0.00042659416794776917, -0.00040996819734573364, -0.0003933422267436981, -0.0003767162561416626, -0.0003600902855396271, -0.00034346431493759155, -0.00032683834433555603, -0.0003102123737335205, -0.000293586403131485, -0.00027696043252944946, -0.00026033446192741394, -0.00024370849132537842, -0.0002270825207233429, -0.00021045655012130737, -0.00019383057951927185, -0.00017720460891723633, -0.0001605786383152008, -0.00014395266771316528, -0.00012732669711112976, -0.00011070072650909424, -9.407475590705872e-05, -7.74487853050232e-05, -6.082281470298767e-05, -4.419684410095215e-05, -2.7570873498916626e-05, -1.0944902896881104e-05, 5.681067705154419e-06, 2.230703830718994e-05, 3.8933008909225464e-05, 5.5558979511260986e-05, 7.218495011329651e-05, 8.881092071533203e-05, 0.00010543689131736755, 0.00012206286191940308, 0.0001386888325214386, 0.00015531480312347412, 0.00017194077372550964, 0.00018856674432754517, 0.0002051927149295807, 0.0002218186855316162, 0.00023844465613365173, 0.00025507062673568726, 0.0002716965973377228, 0.0002883225679397583, 0.0003049485385417938, 0.00032157450914382935, 0.00033820047974586487, 0.0003548264503479004, 0.0003714524209499359, 0.00038807839155197144, 0.00040470436215400696, 0.0004213303327560425, 0.000437956303358078, 0.0004545822739601135, 0.00047120824456214905, 0.00048783421516418457, 0.0005044601857662201, 0.0005210861563682556, 0.0005377121269702911, 0.0005543380975723267, 0.0005709640681743622, 0.0005875900387763977, 0.0006042160093784332, 0.0006208419799804688]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 3.0, 6.0, 6.0, 15.0, 9.0, 18.0, 28.0, 46.0, 65.0, 79.0, 131.0, 204.0, 277.0, 443.0, 664.0, 1066.0, 1802.0, 2972.0, 5168.0, 9203.0, 17493.0, 37200.0, 98466.0, 405229.0, 317002.0, 82323.0, 32528.0, 15721.0, 8532.0, 4685.0, 2734.0, 1554.0, 1012.0, 631.0, 402.0, 282.0, 174.0, 109.0, 91.0, 51.0, 36.0, 25.0, 24.0, 17.0, 13.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.9765625, -7.7342529296875, -7.491943359375, -7.2496337890625, -7.00732421875, -6.7650146484375, -6.522705078125, -6.2803955078125, -6.0380859375, -5.7957763671875, -5.553466796875, -5.3111572265625, -5.06884765625, -4.8265380859375, -4.584228515625, -4.3419189453125, -4.099609375, -3.8572998046875, -3.614990234375, -3.3726806640625, -3.13037109375, -2.8880615234375, -2.645751953125, -2.4034423828125, -2.1611328125, -1.9188232421875, -1.676513671875, -1.4342041015625, -1.19189453125, -0.9495849609375, -0.707275390625, -0.4649658203125, -0.22265625, 0.0196533203125, 0.261962890625, 0.5042724609375, 0.74658203125, 0.9888916015625, 1.231201171875, 1.4735107421875, 1.7158203125, 1.9581298828125, 2.200439453125, 2.4427490234375, 2.68505859375, 2.9273681640625, 3.169677734375, 3.4119873046875, 3.654296875, 3.8966064453125, 4.138916015625, 4.3812255859375, 4.62353515625, 4.8658447265625, 5.108154296875, 5.3504638671875, 5.5927734375, 5.8350830078125, 6.077392578125, 6.3197021484375, 6.56201171875, 6.8043212890625, 7.046630859375, 7.2889404296875, 7.53125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 7.0, 10.0, 13.0, 13.0, 12.0, 11.0, 19.0, 27.0, 43.0, 61.0, 62.0, 82.0, 99.0, 113.0, 104.0, 73.0, 52.0, 42.0, 28.0, 20.0, 20.0, 15.0, 14.0, 9.0, 11.0, 14.0, 2.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.073394775390625, -2.00225830078125, -1.931121826171875, -1.8599853515625, -1.788848876953125, -1.71771240234375, -1.646575927734375, -1.575439453125, -1.504302978515625, -1.43316650390625, -1.362030029296875, -1.2908935546875, -1.219757080078125, -1.14862060546875, -1.077484130859375, -1.00634765625, -0.935211181640625, -0.86407470703125, -0.792938232421875, -0.7218017578125, -0.650665283203125, -0.57952880859375, -0.508392333984375, -0.437255859375, -0.366119384765625, -0.29498291015625, -0.223846435546875, -0.1527099609375, -0.081573486328125, -0.01043701171875, 0.060699462890625, 0.1318359375, 0.202972412109375, 0.27410888671875, 0.345245361328125, 0.4163818359375, 0.487518310546875, 0.55865478515625, 0.629791259765625, 0.700927734375, 0.772064208984375, 0.84320068359375, 0.914337158203125, 0.9854736328125, 1.056610107421875, 1.12774658203125, 1.198883056640625, 1.27001953125, 1.341156005859375, 1.41229248046875, 1.483428955078125, 1.5545654296875, 1.625701904296875, 1.69683837890625, 1.767974853515625, 1.839111328125, 1.910247802734375, 1.98138427734375, 2.052520751953125, 2.1236572265625, 2.194793701171875, 2.26593017578125, 2.337066650390625, 2.408203125]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 6.0, 7.0, 10.0, 13.0, 26.0, 15.0, 23.0, 44.0, 40.0, 50.0, 57.0, 60.0, 72.0, 73.0, 80.0, 69.0, 55.0, 50.0, 45.0, 40.0, 30.0, 27.0, 19.0, 23.0, 10.0, 11.0, 7.0, 7.0, 5.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.22857666015625, -17.70705223083496, -17.185527801513672, -16.664005279541016, -16.142480850219727, -15.620956420898438, -15.099431991577148, -14.57790756225586, -14.056384086608887, -13.534859657287598, -13.013336181640625, -12.491811752319336, -11.970287322998047, -11.448763847351074, -10.927239418029785, -10.405715942382812, -9.884191513061523, -9.362667083740234, -8.841143608093262, -8.319619178771973, -7.798095226287842, -7.276571273803711, -6.755046844482422, -6.233522891998291, -5.71199893951416, -5.190474987030029, -4.668951034545898, -4.147426605224609, -3.6259026527404785, -3.1043787002563477, -2.5828545093536377, -2.0613303184509277, -1.539804458618164, -1.0182803869247437, -0.49675631523132324, 0.024767756462097168, 0.5462918281555176, 1.0678157806396484, 1.5893399715423584, 2.1108641624450684, 2.632388114929199, 3.15391206741333, 3.67543625831604, 4.19696044921875, 4.718484401702881, 5.240008354187012, 5.761532783508301, 6.283056735992432, 6.8045806884765625, 7.326104640960693, 7.847628593444824, 8.369153022766113, 8.890676498413086, 9.412200927734375, 9.933725357055664, 10.455249786376953, 10.976773262023926, 11.498297691345215, 12.019821166992188, 12.541345596313477, 13.062870025634766, 13.584393501281738, 14.105917930603027, 14.62744140625, 15.148965835571289]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 3.0, 4.0, 7.0, 5.0, 7.0, 7.0, 4.0, 8.0, 10.0, 18.0, 9.0, 19.0, 21.0, 18.0, 23.0, 18.0, 33.0, 27.0, 37.0, 33.0, 42.0, 37.0, 41.0, 49.0, 31.0, 35.0, 43.0, 31.0, 37.0, 35.0, 24.0, 31.0, 37.0, 34.0, 33.0, 21.0, 24.0, 19.0, 11.0, 16.0, 8.0, 14.0, 9.0, 9.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.320955276489258, -12.91276741027832, -12.504578590393066, -12.096389770507812, -11.688201904296875, -11.280014038085938, -10.871825218200684, -10.46363639831543, -10.055448532104492, -9.647260665893555, -9.2390718460083, -8.830883026123047, -8.42269515991211, -8.014507293701172, -7.606318473815918, -7.198130130767822, -6.789941787719727, -6.381753444671631, -5.973565101623535, -5.5653767585754395, -5.157188415527344, -4.749000072479248, -4.340811729431152, -3.9326233863830566, -3.524435043334961, -3.1162467002868652, -2.7080583572387695, -2.299870014190674, -1.8916816711425781, -1.4834933280944824, -1.0753049850463867, -0.667116641998291, -0.2589273452758789, 0.1492609977722168, 0.5574493408203125, 0.9656376838684082, 1.373826026916504, 1.7820143699645996, 2.1902027130126953, 2.598391056060791, 3.0065793991088867, 3.4147677421569824, 3.822956085205078, 4.231144428253174, 4.6393327713012695, 5.047521114349365, 5.455709457397461, 5.863897800445557, 6.272086143493652, 6.680274486541748, 7.088462829589844, 7.4966511726379395, 7.904839515686035, 8.313028335571289, 8.721216201782227, 9.129404067993164, 9.537592887878418, 9.945781707763672, 10.35396957397461, 10.762157440185547, 11.1703462600708, 11.578535079956055, 11.986722946166992, 12.39491081237793, 12.803099632263184]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 11.0, 14.0, 25.0, 58.0, 55.0, 82.0, 115.0, 204.0, 254.0, 395.0, 618.0, 876.0, 1279.0, 1993.0, 2862.0, 4304.0, 6392.0, 9937.0, 15037.0, 23864.0, 37773.0, 62864.0, 110550.0, 211842.0, 500287.0, 1085758.0, 1091073.0, 508403.0, 225155.0, 117620.0, 67637.0, 40105.0, 24477.0, 15359.0, 9722.0, 6058.0, 3859.0, 2576.0, 1670.0, 1107.0, 684.0, 477.0, 299.0, 194.0, 120.0, 96.0, 57.0, 40.0, 25.0, 12.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.359375, -15.848388671875, -15.33740234375, -14.826416015625, -14.3154296875, -13.804443359375, -13.29345703125, -12.782470703125, -12.271484375, -11.760498046875, -11.24951171875, -10.738525390625, -10.2275390625, -9.716552734375, -9.20556640625, -8.694580078125, -8.18359375, -7.672607421875, -7.16162109375, -6.650634765625, -6.1396484375, -5.628662109375, -5.11767578125, -4.606689453125, -4.095703125, -3.584716796875, -3.07373046875, -2.562744140625, -2.0517578125, -1.540771484375, -1.02978515625, -0.518798828125, -0.0078125, 0.503173828125, 1.01416015625, 1.525146484375, 2.0361328125, 2.547119140625, 3.05810546875, 3.569091796875, 4.080078125, 4.591064453125, 5.10205078125, 5.613037109375, 6.1240234375, 6.635009765625, 7.14599609375, 7.656982421875, 8.16796875, 8.678955078125, 9.18994140625, 9.700927734375, 10.2119140625, 10.722900390625, 11.23388671875, 11.744873046875, 12.255859375, 12.766845703125, 13.27783203125, 13.788818359375, 14.2998046875, 14.810791015625, 15.32177734375, 15.832763671875, 16.34375]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 6.0, 4.0, 2.0, 3.0, 7.0, 5.0, 9.0, 10.0, 12.0, 23.0, 22.0, 13.0, 16.0, 23.0, 27.0, 32.0, 32.0, 39.0, 36.0, 42.0, 50.0, 51.0, 31.0, 49.0, 36.0, 35.0, 32.0, 33.0, 33.0, 37.0, 36.0, 32.0, 43.0, 20.0, 24.0, 24.0, 17.0, 11.0, 12.0, 7.0, 7.0, 11.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5703125, -11.2197265625, -10.869140625, -10.5185546875, -10.16796875, -9.8173828125, -9.466796875, -9.1162109375, -8.765625, -8.4150390625, -8.064453125, -7.7138671875, -7.36328125, -7.0126953125, -6.662109375, -6.3115234375, -5.9609375, -5.6103515625, -5.259765625, -4.9091796875, -4.55859375, -4.2080078125, -3.857421875, -3.5068359375, -3.15625, -2.8056640625, -2.455078125, -2.1044921875, -1.75390625, -1.4033203125, -1.052734375, -0.7021484375, -0.3515625, -0.0009765625, 0.349609375, 0.7001953125, 1.05078125, 1.4013671875, 1.751953125, 2.1025390625, 2.453125, 2.8037109375, 3.154296875, 3.5048828125, 3.85546875, 4.2060546875, 4.556640625, 4.9072265625, 5.2578125, 5.6083984375, 5.958984375, 6.3095703125, 6.66015625, 7.0107421875, 7.361328125, 7.7119140625, 8.0625, 8.4130859375, 8.763671875, 9.1142578125, 9.46484375, 9.8154296875, 10.166015625, 10.5166015625, 10.8671875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 10.0, 14.0, 21.0, 48.0, 53.0, 81.0, 100.0, 192.0, 288.0, 423.0, 650.0, 1088.0, 1693.0, 2894.0, 4574.0, 7673.0, 13474.0, 23010.0, 41172.0, 75425.0, 143863.0, 290201.0, 617279.0, 1181418.0, 913497.0, 430020.0, 208009.0, 105700.0, 56339.0, 31205.0, 17795.0, 10298.0, 6081.0, 3721.0, 2226.0, 1412.0, 834.0, 556.0, 325.0, 232.0, 147.0, 72.0, 61.0, 37.0, 21.0, 22.0, 12.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.921875, -16.371826171875, -15.82177734375, -15.271728515625, -14.7216796875, -14.171630859375, -13.62158203125, -13.071533203125, -12.521484375, -11.971435546875, -11.42138671875, -10.871337890625, -10.3212890625, -9.771240234375, -9.22119140625, -8.671142578125, -8.12109375, -7.571044921875, -7.02099609375, -6.470947265625, -5.9208984375, -5.370849609375, -4.82080078125, -4.270751953125, -3.720703125, -3.170654296875, -2.62060546875, -2.070556640625, -1.5205078125, -0.970458984375, -0.42041015625, 0.129638671875, 0.6796875, 1.229736328125, 1.77978515625, 2.329833984375, 2.8798828125, 3.429931640625, 3.97998046875, 4.530029296875, 5.080078125, 5.630126953125, 6.18017578125, 6.730224609375, 7.2802734375, 7.830322265625, 8.38037109375, 8.930419921875, 9.48046875, 10.030517578125, 10.58056640625, 11.130615234375, 11.6806640625, 12.230712890625, 12.78076171875, 13.330810546875, 13.880859375, 14.430908203125, 14.98095703125, 15.531005859375, 16.0810546875, 16.631103515625, 17.18115234375, 17.731201171875, 18.28125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 8.0, 11.0, 13.0, 13.0, 19.0, 16.0, 29.0, 38.0, 42.0, 71.0, 79.0, 83.0, 136.0, 151.0, 165.0, 187.0, 259.0, 264.0, 291.0, 311.0, 304.0, 268.0, 239.0, 188.0, 171.0, 139.0, 117.0, 82.0, 69.0, 75.0, 39.0, 44.0, 33.0, 24.0, 24.0, 8.0, 11.0, 9.0, 10.0, 7.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.71875, -6.5238037109375, -6.328857421875, -6.1339111328125, -5.93896484375, -5.7440185546875, -5.549072265625, -5.3541259765625, -5.1591796875, -4.9642333984375, -4.769287109375, -4.5743408203125, -4.37939453125, -4.1844482421875, -3.989501953125, -3.7945556640625, -3.599609375, -3.4046630859375, -3.209716796875, -3.0147705078125, -2.81982421875, -2.6248779296875, -2.429931640625, -2.2349853515625, -2.0400390625, -1.8450927734375, -1.650146484375, -1.4552001953125, -1.26025390625, -1.0653076171875, -0.870361328125, -0.6754150390625, -0.48046875, -0.2855224609375, -0.090576171875, 0.1043701171875, 0.29931640625, 0.4942626953125, 0.689208984375, 0.8841552734375, 1.0791015625, 1.2740478515625, 1.468994140625, 1.6639404296875, 1.85888671875, 2.0538330078125, 2.248779296875, 2.4437255859375, 2.638671875, 2.8336181640625, 3.028564453125, 3.2235107421875, 3.41845703125, 3.6134033203125, 3.808349609375, 4.0032958984375, 4.1982421875, 4.3931884765625, 4.588134765625, 4.7830810546875, 4.97802734375, 5.1729736328125, 5.367919921875, 5.5628662109375, 5.7578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 12.0, 11.0, 10.0, 7.0, 22.0, 23.0, 29.0, 39.0, 42.0, 55.0, 59.0, 79.0, 62.0, 72.0, 77.0, 72.0, 64.0, 39.0, 37.0, 33.0, 30.0, 20.0, 15.0, 17.0, 13.0, 16.0, 14.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.769121170043945, -14.315149307250977, -13.861177444458008, -13.407205581665039, -12.95323371887207, -12.499261856079102, -12.045289993286133, -11.591318130493164, -11.137346267700195, -10.683374404907227, -10.229402542114258, -9.775430679321289, -9.32145881652832, -8.867486953735352, -8.413515090942383, -7.959543228149414, -7.505570888519287, -7.051599025726318, -6.59762716293335, -6.143655300140381, -5.689683437347412, -5.235711097717285, -4.781739234924316, -4.327767372131348, -3.873795747756958, -3.4198238849639893, -2.9658520221710205, -2.5118799209594727, -2.057908058166504, -1.6039361953735352, -1.1499643325805664, -0.6959924697875977, -0.2420206069946289, 0.21195128560066223, 0.6659231781959534, 1.119895100593567, 1.5738669633865356, 2.027838945388794, 2.4818108081817627, 2.9357826709747314, 3.3897545337677, 3.843726396560669, 4.297698497772217, 4.7516703605651855, 5.205642223358154, 5.659614086151123, 6.113585948944092, 6.5675578117370605, 7.021529674530029, 7.475501537322998, 7.929473400115967, 8.383445739746094, 8.837417602539062, 9.291389465332031, 9.745361328125, 10.199333190917969, 10.653305053710938, 11.107276916503906, 11.561248779296875, 12.015220642089844, 12.469192504882812, 12.923164367675781, 13.37713623046875, 13.831108093261719, 14.285079956054688]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 4.0, 7.0, 5.0, 9.0, 13.0, 14.0, 15.0, 12.0, 22.0, 24.0, 17.0, 32.0, 28.0, 27.0, 22.0, 27.0, 22.0, 32.0, 39.0, 60.0, 36.0, 37.0, 49.0, 41.0, 39.0, 19.0, 34.0, 35.0, 33.0, 25.0, 26.0, 21.0, 26.0, 22.0, 21.0, 20.0, 9.0, 10.0, 10.0, 7.0, 7.0, 10.0, 4.0, 7.0, 4.0, 4.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-11.539323806762695, -11.187873840332031, -10.836423873901367, -10.484973907470703, -10.133523941040039, -9.782073974609375, -9.430624008178711, -9.079174041748047, -8.727724075317383, -8.376274108886719, -8.024824142456055, -7.673374176025391, -7.321924209594727, -6.9704742431640625, -6.61902379989624, -6.267573833465576, -5.916123390197754, -5.56467342376709, -5.213223457336426, -4.861773490905762, -4.510323524475098, -4.158873558044434, -3.8074231147766113, -3.4559731483459473, -3.104523181915283, -2.753073215484619, -2.401623249053955, -2.050173044204712, -1.6987230777740479, -1.3472731113433838, -0.9958229064941406, -0.6443729400634766, -0.2929220199584961, 0.058528006076812744, 0.4099780321121216, 0.7614281177520752, 1.1128780841827393, 1.4643280506134033, 1.8157782554626465, 2.1672282218933105, 2.5186781883239746, 2.8701281547546387, 3.2215781211853027, 3.573028326034546, 3.92447829246521, 4.275928497314453, 4.627378463745117, 4.978828430175781, 5.330278396606445, 5.681728363037109, 6.033178329467773, 6.3846282958984375, 6.736078262329102, 7.087528228759766, 7.438978672027588, 7.790428638458252, 8.141878128051758, 8.493328094482422, 8.844778060913086, 9.19622802734375, 9.547677993774414, 9.899127960205078, 10.250577926635742, 10.602027893066406, 10.953478813171387]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 7.0, 7.0, 14.0, 25.0, 39.0, 57.0, 111.0, 153.0, 229.0, 393.0, 585.0, 927.0, 1398.0, 2247.0, 3342.0, 5307.0, 8596.0, 13460.0, 21269.0, 34830.0, 57839.0, 95356.0, 158289.0, 227192.0, 162896.0, 98144.0, 59500.0, 36356.0, 22219.0, 13816.0, 8680.0, 5503.0, 3520.0, 2242.0, 1390.0, 978.0, 581.0, 389.0, 242.0, 162.0, 100.0, 67.0, 32.0, 31.0, 11.0, 12.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.48046875, -5.30096435546875, -5.1214599609375, -4.94195556640625, -4.762451171875, -4.58294677734375, -4.4034423828125, -4.22393798828125, -4.04443359375, -3.86492919921875, -3.6854248046875, -3.50592041015625, -3.326416015625, -3.14691162109375, -2.9674072265625, -2.78790283203125, -2.6083984375, -2.42889404296875, -2.2493896484375, -2.06988525390625, -1.890380859375, -1.71087646484375, -1.5313720703125, -1.35186767578125, -1.17236328125, -0.99285888671875, -0.8133544921875, -0.63385009765625, -0.454345703125, -0.27484130859375, -0.0953369140625, 0.08416748046875, 0.263671875, 0.44317626953125, 0.6226806640625, 0.80218505859375, 0.981689453125, 1.16119384765625, 1.3406982421875, 1.52020263671875, 1.69970703125, 1.87921142578125, 2.0587158203125, 2.23822021484375, 2.417724609375, 2.59722900390625, 2.7767333984375, 2.95623779296875, 3.1357421875, 3.31524658203125, 3.4947509765625, 3.67425537109375, 3.853759765625, 4.03326416015625, 4.2127685546875, 4.39227294921875, 4.57177734375, 4.75128173828125, 4.9307861328125, 5.11029052734375, 5.289794921875, 5.46929931640625, 5.6488037109375, 5.82830810546875, 6.0078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 8.0, 2.0, 2.0, 3.0, 10.0, 11.0, 10.0, 8.0, 14.0, 20.0, 24.0, 31.0, 35.0, 20.0, 31.0, 28.0, 33.0, 35.0, 41.0, 60.0, 43.0, 35.0, 37.0, 42.0, 36.0, 38.0, 40.0, 39.0, 26.0, 33.0, 21.0, 26.0, 25.0, 23.0, 23.0, 12.0, 20.0, 7.0, 7.0, 6.0, 8.0, 7.0, 4.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.9140625, -12.52490234375, -12.1357421875, -11.74658203125, -11.357421875, -10.96826171875, -10.5791015625, -10.18994140625, -9.80078125, -9.41162109375, -9.0224609375, -8.63330078125, -8.244140625, -7.85498046875, -7.4658203125, -7.07666015625, -6.6875, -6.29833984375, -5.9091796875, -5.52001953125, -5.130859375, -4.74169921875, -4.3525390625, -3.96337890625, -3.57421875, -3.18505859375, -2.7958984375, -2.40673828125, -2.017578125, -1.62841796875, -1.2392578125, -0.85009765625, -0.4609375, -0.07177734375, 0.3173828125, 0.70654296875, 1.095703125, 1.48486328125, 1.8740234375, 2.26318359375, 2.65234375, 3.04150390625, 3.4306640625, 3.81982421875, 4.208984375, 4.59814453125, 4.9873046875, 5.37646484375, 5.765625, 6.15478515625, 6.5439453125, 6.93310546875, 7.322265625, 7.71142578125, 8.1005859375, 8.48974609375, 8.87890625, 9.26806640625, 9.6572265625, 10.04638671875, 10.435546875, 10.82470703125, 11.2138671875, 11.60302734375, 11.9921875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 3.0, 16.0, 14.0, 20.0, 34.0, 48.0, 69.0, 103.0, 144.0, 257.0, 369.0, 610.0, 943.0, 1478.0, 2363.0, 4065.0, 6639.0, 11133.0, 19808.0, 35567.0, 66979.0, 128885.0, 270894.0, 242325.0, 117372.0, 60992.0, 32892.0, 18208.0, 10503.0, 6070.0, 3616.0, 2245.0, 1432.0, 885.0, 546.0, 359.0, 234.0, 135.0, 99.0, 64.0, 48.0, 30.0, 25.0, 12.0, 9.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-6.70703125, -6.49017333984375, -6.2733154296875, -6.05645751953125, -5.839599609375, -5.62274169921875, -5.4058837890625, -5.18902587890625, -4.97216796875, -4.75531005859375, -4.5384521484375, -4.32159423828125, -4.104736328125, -3.88787841796875, -3.6710205078125, -3.45416259765625, -3.2373046875, -3.02044677734375, -2.8035888671875, -2.58673095703125, -2.369873046875, -2.15301513671875, -1.9361572265625, -1.71929931640625, -1.50244140625, -1.28558349609375, -1.0687255859375, -0.85186767578125, -0.635009765625, -0.41815185546875, -0.2012939453125, 0.01556396484375, 0.232421875, 0.44927978515625, 0.6661376953125, 0.88299560546875, 1.099853515625, 1.31671142578125, 1.5335693359375, 1.75042724609375, 1.96728515625, 2.18414306640625, 2.4010009765625, 2.61785888671875, 2.834716796875, 3.05157470703125, 3.2684326171875, 3.48529052734375, 3.7021484375, 3.91900634765625, 4.1358642578125, 4.35272216796875, 4.569580078125, 4.78643798828125, 5.0032958984375, 5.22015380859375, 5.43701171875, 5.65386962890625, 5.8707275390625, 6.08758544921875, 6.304443359375, 6.52130126953125, 6.7381591796875, 6.95501708984375, 7.171875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 4.0, 7.0, 8.0, 10.0, 26.0, 18.0, 25.0, 25.0, 19.0, 32.0, 41.0, 44.0, 43.0, 46.0, 61.0, 45.0, 40.0, 50.0, 44.0, 47.0, 40.0, 43.0, 39.0, 26.0, 32.0, 36.0, 23.0, 16.0, 29.0, 14.0, 11.0, 15.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4127197265625, -8.130126953125, -7.8475341796875, -7.56494140625, -7.2823486328125, -6.999755859375, -6.7171630859375, -6.4345703125, -6.1519775390625, -5.869384765625, -5.5867919921875, -5.30419921875, -5.0216064453125, -4.739013671875, -4.4564208984375, -4.173828125, -3.8912353515625, -3.608642578125, -3.3260498046875, -3.04345703125, -2.7608642578125, -2.478271484375, -2.1956787109375, -1.9130859375, -1.6304931640625, -1.347900390625, -1.0653076171875, -0.78271484375, -0.5001220703125, -0.217529296875, 0.0650634765625, 0.34765625, 0.6302490234375, 0.912841796875, 1.1954345703125, 1.47802734375, 1.7606201171875, 2.043212890625, 2.3258056640625, 2.6083984375, 2.8909912109375, 3.173583984375, 3.4561767578125, 3.73876953125, 4.0213623046875, 4.303955078125, 4.5865478515625, 4.869140625, 5.1517333984375, 5.434326171875, 5.7169189453125, 5.99951171875, 6.2821044921875, 6.564697265625, 6.8472900390625, 7.1298828125, 7.4124755859375, 7.695068359375, 7.9776611328125, 8.26025390625, 8.5428466796875, 8.825439453125, 9.1080322265625, 9.390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 12.0, 20.0, 20.0, 33.0, 42.0, 80.0, 130.0, 218.0, 377.0, 638.0, 1242.0, 2300.0, 4305.0, 8614.0, 18495.0, 45377.0, 140358.0, 496019.0, 219848.0, 63615.0, 24285.0, 11041.0, 5334.0, 2695.0, 1533.0, 786.0, 455.0, 269.0, 136.0, 91.0, 67.0, 38.0, 19.0, 19.0, 17.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1024169921875, -0.09928131103515625, -0.0961456298828125, -0.09300994873046875, -0.089874267578125, -0.08673858642578125, -0.0836029052734375, -0.08046722412109375, -0.07733154296875, -0.07419586181640625, -0.0710601806640625, -0.06792449951171875, -0.064788818359375, -0.06165313720703125, -0.0585174560546875, -0.05538177490234375, -0.05224609375, -0.04911041259765625, -0.0459747314453125, -0.04283905029296875, -0.039703369140625, -0.03656768798828125, -0.0334320068359375, -0.03029632568359375, -0.02716064453125, -0.02402496337890625, -0.0208892822265625, -0.01775360107421875, -0.014617919921875, -0.01148223876953125, -0.0083465576171875, -0.00521087646484375, -0.0020751953125, 0.00106048583984375, 0.0041961669921875, 0.00733184814453125, 0.010467529296875, 0.01360321044921875, 0.0167388916015625, 0.01987457275390625, 0.02301025390625, 0.02614593505859375, 0.0292816162109375, 0.03241729736328125, 0.035552978515625, 0.03868865966796875, 0.0418243408203125, 0.04496002197265625, 0.048095703125, 0.05123138427734375, 0.0543670654296875, 0.05750274658203125, 0.060638427734375, 0.06377410888671875, 0.0669097900390625, 0.07004547119140625, 0.07318115234375, 0.07631683349609375, 0.0794525146484375, 0.08258819580078125, 0.085723876953125, 0.08885955810546875, 0.0919952392578125, 0.09513092041015625, 0.0982666015625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 12.0, 10.0, 11.0, 16.0, 23.0, 32.0, 51.0, 81.0, 95.0, 110.0, 120.0, 123.0, 85.0, 79.0, 34.0, 40.0, 23.0, 20.0, 10.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.950429916381836e-05, -2.8287991881370544e-05, -2.707168459892273e-05, -2.5855377316474915e-05, -2.46390700340271e-05, -2.3422762751579285e-05, -2.220645546913147e-05, -2.0990148186683655e-05, -1.977384090423584e-05, -1.8557533621788025e-05, -1.734122633934021e-05, -1.6124919056892395e-05, -1.490861177444458e-05, -1.3692304491996765e-05, -1.247599720954895e-05, -1.1259689927101135e-05, -1.004338264465332e-05, -8.827075362205505e-06, -7.6107680797576904e-06, -6.3944607973098755e-06, -5.1781535148620605e-06, -3.961846232414246e-06, -2.7455389499664307e-06, -1.5292316675186157e-06, -3.129243850708008e-07, 9.033828973770142e-07, 2.119690179824829e-06, 3.335997462272644e-06, 4.552304744720459e-06, 5.768612027168274e-06, 6.984919309616089e-06, 8.201226592063904e-06, 9.417533874511719e-06, 1.0633841156959534e-05, 1.1850148439407349e-05, 1.3066455721855164e-05, 1.4282763004302979e-05, 1.5499070286750793e-05, 1.671537756919861e-05, 1.7931684851646423e-05, 1.9147992134094238e-05, 2.0364299416542053e-05, 2.1580606698989868e-05, 2.2796913981437683e-05, 2.4013221263885498e-05, 2.5229528546333313e-05, 2.6445835828781128e-05, 2.7662143111228943e-05, 2.8878450393676758e-05, 3.0094757676124573e-05, 3.131106495857239e-05, 3.25273722410202e-05, 3.374367952346802e-05, 3.495998680591583e-05, 3.617629408836365e-05, 3.739260137081146e-05, 3.860890865325928e-05, 3.982521593570709e-05, 4.104152321815491e-05, 4.225783050060272e-05, 4.347413778305054e-05, 4.469044506549835e-05, 4.590675234794617e-05, 4.712305963039398e-05, 4.83393669128418e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 9.0, 6.0, 13.0, 23.0, 29.0, 39.0, 69.0, 101.0, 139.0, 209.0, 296.0, 399.0, 626.0, 1003.0, 1403.0, 2251.0, 3351.0, 5395.0, 8725.0, 14306.0, 24880.0, 44877.0, 83687.0, 170014.0, 303265.0, 181209.0, 88670.0, 47336.0, 25983.0, 14956.0, 9202.0, 5665.0, 3482.0, 2384.0, 1555.0, 976.0, 671.0, 428.0, 291.0, 200.0, 142.0, 96.0, 57.0, 49.0, 37.0, 18.0, 21.0, 8.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.061004638671875, -0.05918598175048828, -0.05736732482910156, -0.055548667907714844, -0.053730010986328125, -0.051911354064941406, -0.05009269714355469, -0.04827404022216797, -0.04645538330078125, -0.04463672637939453, -0.04281806945800781, -0.040999412536621094, -0.039180755615234375, -0.037362098693847656, -0.03554344177246094, -0.03372478485107422, -0.0319061279296875, -0.03008747100830078, -0.028268814086914062, -0.026450157165527344, -0.024631500244140625, -0.022812843322753906, -0.020994186401367188, -0.01917552947998047, -0.01735687255859375, -0.015538215637207031, -0.013719558715820312, -0.011900901794433594, -0.010082244873046875, -0.008263587951660156, -0.0064449310302734375, -0.004626274108886719, -0.0028076171875, -0.0009889602661132812, 0.0008296966552734375, 0.0026483535766601562, 0.004467010498046875, 0.006285667419433594, 0.008104324340820312, 0.009922981262207031, 0.01174163818359375, 0.013560295104980469, 0.015378952026367188, 0.017197608947753906, 0.019016265869140625, 0.020834922790527344, 0.022653579711914062, 0.02447223663330078, 0.0262908935546875, 0.02810955047607422, 0.029928207397460938, 0.031746864318847656, 0.033565521240234375, 0.035384178161621094, 0.03720283508300781, 0.03902149200439453, 0.04084014892578125, 0.04265880584716797, 0.04447746276855469, 0.046296119689941406, 0.048114776611328125, 0.049933433532714844, 0.05175209045410156, 0.05357074737548828, 0.055389404296875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 2.0, 7.0, 5.0, 9.0, 8.0, 8.0, 14.0, 12.0, 14.0, 31.0, 30.0, 32.0, 56.0, 55.0, 87.0, 98.0, 114.0, 84.0, 66.0, 47.0, 40.0, 35.0, 35.0, 19.0, 9.0, 15.0, 16.0, 10.0, 7.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0233154296875, -0.022629261016845703, -0.021943092346191406, -0.02125692367553711, -0.020570755004882812, -0.019884586334228516, -0.01919841766357422, -0.018512248992919922, -0.017826080322265625, -0.017139911651611328, -0.01645374298095703, -0.015767574310302734, -0.015081405639648438, -0.01439523696899414, -0.013709068298339844, -0.013022899627685547, -0.01233673095703125, -0.011650562286376953, -0.010964393615722656, -0.01027822494506836, -0.009592056274414062, -0.008905887603759766, -0.008219718933105469, -0.007533550262451172, -0.006847381591796875, -0.006161212921142578, -0.005475044250488281, -0.004788875579833984, -0.0041027069091796875, -0.0034165382385253906, -0.0027303695678710938, -0.002044200897216797, -0.0013580322265625, -0.0006718635559082031, 1.430511474609375e-05, 0.0007004737854003906, 0.0013866424560546875, 0.0020728111267089844, 0.0027589797973632812, 0.003445148468017578, 0.004131317138671875, 0.004817485809326172, 0.005503654479980469, 0.006189823150634766, 0.0068759918212890625, 0.007562160491943359, 0.008248329162597656, 0.008934497833251953, 0.00962066650390625, 0.010306835174560547, 0.010993003845214844, 0.01167917251586914, 0.012365341186523438, 0.013051509857177734, 0.013737678527832031, 0.014423847198486328, 0.015110015869140625, 0.015796184539794922, 0.01648235321044922, 0.017168521881103516, 0.017854690551757812, 0.01854085922241211, 0.019227027893066406, 0.019913196563720703, 0.020599365234375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 0.0, 4.0, 6.0, 5.0, 17.0, 7.0, 8.0, 17.0, 28.0, 25.0, 28.0, 45.0, 49.0, 52.0, 66.0, 69.0, 68.0, 85.0, 73.0, 50.0, 57.0, 44.0, 27.0, 35.0, 29.0, 17.0, 16.0, 17.0, 11.0, 18.0, 7.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.563196182250977, -14.122038841247559, -13.680880546569824, -13.239723205566406, -12.798564910888672, -12.357407569885254, -11.916250228881836, -11.475091934204102, -11.033934593200684, -10.592777252197266, -10.151618957519531, -9.710461616516113, -9.269303321838379, -8.828145980834961, -8.386987686157227, -7.945830345153809, -7.504672527313232, -7.063514709472656, -6.62235689163208, -6.181199073791504, -5.740041732788086, -5.29888391494751, -4.857726097106934, -4.416568756103516, -3.9754106998443604, -3.534252882003784, -3.093095302581787, -2.651937484741211, -2.2107796669006348, -1.7696220874786377, -1.3284642696380615, -0.8873066902160645, -0.4461488723754883, -0.0049911439418792725, 0.43616658449172974, 0.8773243427276611, 1.3184820413589478, 1.7596397399902344, 2.2007975578308105, 2.6419551372528076, 3.083112955093384, 3.52427077293396, 3.965428352355957, 4.406586170196533, 4.847743988037109, 5.288901329040527, 5.730059623718262, 6.17121696472168, 6.612374782562256, 7.053532600402832, 7.494690418243408, 7.935848236083984, 8.377005577087402, 8.81816291809082, 9.259321212768555, 9.700478553771973, 10.141636848449707, 10.582794189453125, 11.02395248413086, 11.465109825134277, 11.906268119812012, 12.34742546081543, 12.788583755493164, 13.229741096496582, 13.6708984375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 5.0, 8.0, 13.0, 15.0, 14.0, 16.0, 19.0, 27.0, 15.0, 31.0, 28.0, 28.0, 22.0, 23.0, 28.0, 28.0, 40.0, 60.0, 36.0, 36.0, 50.0, 43.0, 37.0, 21.0, 33.0, 35.0, 32.0, 26.0, 23.0, 24.0, 25.0, 22.0, 22.0, 18.0, 10.0, 11.0, 10.0, 7.0, 8.0, 8.0, 5.0, 7.0, 3.0, 5.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-11.358976364135742, -11.0121431350708, -10.66530990600586, -10.318476676940918, -9.971643447875977, -9.624809265136719, -9.277976036071777, -8.931142807006836, -8.584309577941895, -8.237476348876953, -7.890643119812012, -7.543809413909912, -7.196976184844971, -6.850142955780029, -6.50330924987793, -6.156476020812988, -5.809642791748047, -5.4628095626831055, -5.115976333618164, -4.7691426277160645, -4.422309398651123, -4.075476169586182, -3.728642702102661, -3.3818092346191406, -3.034976005554199, -2.688142776489258, -2.3413093090057373, -1.9944759607315063, -1.6476426124572754, -1.3008092641830444, -0.9539759159088135, -0.607142448425293, -0.26030826568603516, 0.0865250825881958, 0.43335843086242676, 0.7801917791366577, 1.1270251274108887, 1.4738584756851196, 1.8206918239593506, 2.167525291442871, 2.5143585205078125, 2.861191749572754, 3.2080252170562744, 3.554858684539795, 3.9016919136047363, 4.248525142669678, 4.595358848571777, 4.942192077636719, 5.28902530670166, 5.635858535766602, 5.982691764831543, 6.329525470733643, 6.676358699798584, 7.023191928863525, 7.370025634765625, 7.716858863830566, 8.063692092895508, 8.41052532196045, 8.75735855102539, 9.104191780090332, 9.451025009155273, 9.797859191894531, 10.144692420959473, 10.491525650024414, 10.838358879089355]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 7.0, 6.0, 5.0, 18.0, 20.0, 42.0, 76.0, 109.0, 183.0, 294.0, 418.0, 656.0, 940.0, 1411.0, 2083.0, 3143.0, 4756.0, 7119.0, 10683.0, 16511.0, 25458.0, 38957.0, 60034.0, 92265.0, 136147.0, 171176.0, 155680.0, 110745.0, 72740.0, 47503.0, 30773.0, 20141.0, 12894.0, 8611.0, 5638.0, 3678.0, 2601.0, 1735.0, 1125.0, 786.0, 513.0, 326.0, 209.0, 135.0, 86.0, 51.0, 26.0, 22.0, 10.0, 7.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.6640625, -15.1370849609375, -14.610107421875, -14.0831298828125, -13.55615234375, -13.0291748046875, -12.502197265625, -11.9752197265625, -11.4482421875, -10.9212646484375, -10.394287109375, -9.8673095703125, -9.34033203125, -8.8133544921875, -8.286376953125, -7.7593994140625, -7.232421875, -6.7054443359375, -6.178466796875, -5.6514892578125, -5.12451171875, -4.5975341796875, -4.070556640625, -3.5435791015625, -3.0166015625, -2.4896240234375, -1.962646484375, -1.4356689453125, -0.90869140625, -0.3817138671875, 0.145263671875, 0.6722412109375, 1.19921875, 1.7261962890625, 2.253173828125, 2.7801513671875, 3.30712890625, 3.8341064453125, 4.361083984375, 4.8880615234375, 5.4150390625, 5.9420166015625, 6.468994140625, 6.9959716796875, 7.52294921875, 8.0499267578125, 8.576904296875, 9.1038818359375, 9.630859375, 10.1578369140625, 10.684814453125, 11.2117919921875, 11.73876953125, 12.2657470703125, 12.792724609375, 13.3197021484375, 13.8466796875, 14.3736572265625, 14.900634765625, 15.4276123046875, 15.95458984375, 16.4815673828125, 17.008544921875, 17.5355224609375, 18.0625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 8.0, 6.0, 7.0, 4.0, 9.0, 19.0, 21.0, 16.0, 26.0, 18.0, 20.0, 28.0, 31.0, 28.0, 27.0, 33.0, 34.0, 35.0, 44.0, 42.0, 38.0, 44.0, 42.0, 34.0, 31.0, 41.0, 39.0, 30.0, 29.0, 24.0, 27.0, 21.0, 27.0, 26.0, 17.0, 9.0, 9.0, 6.0, 10.0, 7.0, 9.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 3.0], "bins": [-10.9609375, -10.63916015625, -10.3173828125, -9.99560546875, -9.673828125, -9.35205078125, -9.0302734375, -8.70849609375, -8.38671875, -8.06494140625, -7.7431640625, -7.42138671875, -7.099609375, -6.77783203125, -6.4560546875, -6.13427734375, -5.8125, -5.49072265625, -5.1689453125, -4.84716796875, -4.525390625, -4.20361328125, -3.8818359375, -3.56005859375, -3.23828125, -2.91650390625, -2.5947265625, -2.27294921875, -1.951171875, -1.62939453125, -1.3076171875, -0.98583984375, -0.6640625, -0.34228515625, -0.0205078125, 0.30126953125, 0.623046875, 0.94482421875, 1.2666015625, 1.58837890625, 1.91015625, 2.23193359375, 2.5537109375, 2.87548828125, 3.197265625, 3.51904296875, 3.8408203125, 4.16259765625, 4.484375, 4.80615234375, 5.1279296875, 5.44970703125, 5.771484375, 6.09326171875, 6.4150390625, 6.73681640625, 7.05859375, 7.38037109375, 7.7021484375, 8.02392578125, 8.345703125, 8.66748046875, 8.9892578125, 9.31103515625, 9.6328125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 2.0, 10.0, 15.0, 12.0, 19.0, 31.0, 43.0, 73.0, 120.0, 143.0, 186.0, 312.0, 490.0, 690.0, 1052.0, 1650.0, 2533.0, 3803.0, 5947.0, 9108.0, 13965.0, 21705.0, 33965.0, 52193.0, 80499.0, 121986.0, 164923.0, 166876.0, 127040.0, 84343.0, 54756.0, 35421.0, 22743.0, 14782.0, 9333.0, 6243.0, 4080.0, 2529.0, 1699.0, 1063.0, 703.0, 486.0, 333.0, 216.0, 151.0, 96.0, 67.0, 37.0, 27.0, 17.0, 13.0, 10.0, 13.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0], "bins": [-15.9609375, -15.4468994140625, -14.932861328125, -14.4188232421875, -13.90478515625, -13.3907470703125, -12.876708984375, -12.3626708984375, -11.8486328125, -11.3345947265625, -10.820556640625, -10.3065185546875, -9.79248046875, -9.2784423828125, -8.764404296875, -8.2503662109375, -7.736328125, -7.2222900390625, -6.708251953125, -6.1942138671875, -5.68017578125, -5.1661376953125, -4.652099609375, -4.1380615234375, -3.6240234375, -3.1099853515625, -2.595947265625, -2.0819091796875, -1.56787109375, -1.0538330078125, -0.539794921875, -0.0257568359375, 0.48828125, 1.0023193359375, 1.516357421875, 2.0303955078125, 2.54443359375, 3.0584716796875, 3.572509765625, 4.0865478515625, 4.6005859375, 5.1146240234375, 5.628662109375, 6.1427001953125, 6.65673828125, 7.1707763671875, 7.684814453125, 8.1988525390625, 8.712890625, 9.2269287109375, 9.740966796875, 10.2550048828125, 10.76904296875, 11.2830810546875, 11.797119140625, 12.3111572265625, 12.8251953125, 13.3392333984375, 13.853271484375, 14.3673095703125, 14.88134765625, 15.3953857421875, 15.909423828125, 16.4234619140625, 16.9375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 10.0, 7.0, 4.0, 14.0, 12.0, 5.0, 11.0, 15.0, 26.0, 16.0, 24.0, 30.0, 30.0, 52.0, 39.0, 42.0, 43.0, 54.0, 38.0, 44.0, 46.0, 38.0, 32.0, 32.0, 40.0, 41.0, 28.0, 34.0, 36.0, 25.0, 17.0, 15.0, 21.0, 11.0, 10.0, 10.0, 16.0, 6.0, 7.0, 10.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.46624755859375, -5.2410888671875, -5.01593017578125, -4.790771484375, -4.56561279296875, -4.3404541015625, -4.11529541015625, -3.89013671875, -3.66497802734375, -3.4398193359375, -3.21466064453125, -2.989501953125, -2.76434326171875, -2.5391845703125, -2.31402587890625, -2.0888671875, -1.86370849609375, -1.6385498046875, -1.41339111328125, -1.188232421875, -0.96307373046875, -0.7379150390625, -0.51275634765625, -0.28759765625, -0.06243896484375, 0.1627197265625, 0.38787841796875, 0.613037109375, 0.83819580078125, 1.0633544921875, 1.28851318359375, 1.513671875, 1.73883056640625, 1.9639892578125, 2.18914794921875, 2.414306640625, 2.63946533203125, 2.8646240234375, 3.08978271484375, 3.31494140625, 3.54010009765625, 3.7652587890625, 3.99041748046875, 4.215576171875, 4.44073486328125, 4.6658935546875, 4.89105224609375, 5.1162109375, 5.34136962890625, 5.5665283203125, 5.79168701171875, 6.016845703125, 6.24200439453125, 6.4671630859375, 6.69232177734375, 6.91748046875, 7.14263916015625, 7.3677978515625, 7.59295654296875, 7.818115234375, 8.04327392578125, 8.2684326171875, 8.49359130859375, 8.71875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 6.0, 9.0, 7.0, 14.0, 6.0, 10.0, 14.0, 22.0, 39.0, 52.0, 77.0, 91.0, 105.0, 157.0, 199.0, 281.0, 379.0, 603.0, 844.0, 1141.0, 1684.0, 2651.0, 4367.0, 7512.0, 13319.0, 26496.0, 60820.0, 182130.0, 484326.0, 152807.0, 53272.0, 23887.0, 12107.0, 6989.0, 4151.0, 2483.0, 1618.0, 1165.0, 768.0, 542.0, 380.0, 258.0, 189.0, 146.0, 120.0, 92.0, 68.0, 49.0, 33.0, 12.0, 16.0, 13.0, 9.0, 7.0, 8.0, 9.0, 4.0, 4.0, 1.0, 2.0], "bins": [-6.61328125, -6.40936279296875, -6.2054443359375, -6.00152587890625, -5.797607421875, -5.59368896484375, -5.3897705078125, -5.18585205078125, -4.98193359375, -4.77801513671875, -4.5740966796875, -4.37017822265625, -4.166259765625, -3.96234130859375, -3.7584228515625, -3.55450439453125, -3.3505859375, -3.14666748046875, -2.9427490234375, -2.73883056640625, -2.534912109375, -2.33099365234375, -2.1270751953125, -1.92315673828125, -1.71923828125, -1.51531982421875, -1.3114013671875, -1.10748291015625, -0.903564453125, -0.69964599609375, -0.4957275390625, -0.29180908203125, -0.087890625, 0.11602783203125, 0.3199462890625, 0.52386474609375, 0.727783203125, 0.93170166015625, 1.1356201171875, 1.33953857421875, 1.54345703125, 1.74737548828125, 1.9512939453125, 2.15521240234375, 2.359130859375, 2.56304931640625, 2.7669677734375, 2.97088623046875, 3.1748046875, 3.37872314453125, 3.5826416015625, 3.78656005859375, 3.990478515625, 4.19439697265625, 4.3983154296875, 4.60223388671875, 4.80615234375, 5.01007080078125, 5.2139892578125, 5.41790771484375, 5.621826171875, 5.82574462890625, 6.0296630859375, 6.23358154296875, 6.4375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 3.0, 1.0, 3.0, 13.0, 7.0, 12.0, 6.0, 22.0, 27.0, 47.0, 64.0, 89.0, 111.0, 118.0, 110.0, 109.0, 72.0, 52.0, 45.0, 24.0, 16.0, 17.0, 15.0, 7.0, 6.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003857612609863281, -0.0003718957304954529, -0.00035803020000457764, -0.0003441646695137024, -0.00033029913902282715, -0.0003164336085319519, -0.00030256807804107666, -0.0002887025475502014, -0.00027483701705932617, -0.00026097148656845093, -0.0002471059560775757, -0.00023324042558670044, -0.0002193748950958252, -0.00020550936460494995, -0.0001916438341140747, -0.00017777830362319946, -0.00016391277313232422, -0.00015004724264144897, -0.00013618171215057373, -0.00012231618165969849, -0.00010845065116882324, -9.4585120677948e-05, -8.071959018707275e-05, -6.685405969619751e-05, -5.2988529205322266e-05, -3.912299871444702e-05, -2.5257468223571777e-05, -1.1391937732696533e-05, 2.473592758178711e-06, 1.6339123249053955e-05, 3.02046537399292e-05, 4.407018423080444e-05, 5.793571472167969e-05, 7.180124521255493e-05, 8.566677570343018e-05, 9.953230619430542e-05, 0.00011339783668518066, 0.0001272633671760559, 0.00014112889766693115, 0.0001549944281578064, 0.00016885995864868164, 0.00018272548913955688, 0.00019659101963043213, 0.00021045655012130737, 0.00022432208061218262, 0.00023818761110305786, 0.0002520531415939331, 0.00026591867208480835, 0.0002797842025756836, 0.00029364973306655884, 0.0003075152635574341, 0.0003213807940483093, 0.00033524632453918457, 0.0003491118550300598, 0.00036297738552093506, 0.0003768429160118103, 0.00039070844650268555, 0.0004045739769935608, 0.00041843950748443604, 0.0004323050379753113, 0.0004461705684661865, 0.00046003609895706177, 0.000473901629447937, 0.00048776715993881226, 0.0005016326904296875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 12.0, 24.0, 41.0, 49.0, 65.0, 95.0, 152.0, 188.0, 345.0, 575.0, 915.0, 1403.0, 2309.0, 3930.0, 6838.0, 12589.0, 25726.0, 61059.0, 187469.0, 481603.0, 158240.0, 54627.0, 22939.0, 11578.0, 6313.0, 3620.0, 2171.0, 1350.0, 847.0, 502.0, 321.0, 207.0, 153.0, 76.0, 65.0, 36.0, 45.0, 22.0, 16.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.83203125, -6.62139892578125, -6.4107666015625, -6.20013427734375, -5.989501953125, -5.77886962890625, -5.5682373046875, -5.35760498046875, -5.14697265625, -4.93634033203125, -4.7257080078125, -4.51507568359375, -4.304443359375, -4.09381103515625, -3.8831787109375, -3.67254638671875, -3.4619140625, -3.25128173828125, -3.0406494140625, -2.83001708984375, -2.619384765625, -2.40875244140625, -2.1981201171875, -1.98748779296875, -1.77685546875, -1.56622314453125, -1.3555908203125, -1.14495849609375, -0.934326171875, -0.72369384765625, -0.5130615234375, -0.30242919921875, -0.091796875, 0.11883544921875, 0.3294677734375, 0.54010009765625, 0.750732421875, 0.96136474609375, 1.1719970703125, 1.38262939453125, 1.59326171875, 1.80389404296875, 2.0145263671875, 2.22515869140625, 2.435791015625, 2.64642333984375, 2.8570556640625, 3.06768798828125, 3.2783203125, 3.48895263671875, 3.6995849609375, 3.91021728515625, 4.120849609375, 4.33148193359375, 4.5421142578125, 4.75274658203125, 4.96337890625, 5.17401123046875, 5.3846435546875, 5.59527587890625, 5.805908203125, 6.01654052734375, 6.2271728515625, 6.43780517578125, 6.6484375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 10.0, 8.0, 11.0, 16.0, 25.0, 21.0, 42.0, 55.0, 60.0, 85.0, 87.0, 90.0, 102.0, 74.0, 58.0, 44.0, 38.0, 33.0, 24.0, 22.0, 15.0, 9.0, 13.0, 9.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.173828125, -2.1143951416015625, -2.054962158203125, -1.9955291748046875, -1.93609619140625, -1.8766632080078125, -1.817230224609375, -1.7577972412109375, -1.6983642578125, -1.6389312744140625, -1.579498291015625, -1.5200653076171875, -1.46063232421875, -1.4011993408203125, -1.341766357421875, -1.2823333740234375, -1.222900390625, -1.1634674072265625, -1.104034423828125, -1.0446014404296875, -0.98516845703125, -0.9257354736328125, -0.866302490234375, -0.8068695068359375, -0.7474365234375, -0.6880035400390625, -0.628570556640625, -0.5691375732421875, -0.50970458984375, -0.4502716064453125, -0.390838623046875, -0.3314056396484375, -0.27197265625, -0.2125396728515625, -0.153106689453125, -0.0936737060546875, -0.03424072265625, 0.0251922607421875, 0.084625244140625, 0.1440582275390625, 0.2034912109375, 0.2629241943359375, 0.322357177734375, 0.3817901611328125, 0.44122314453125, 0.5006561279296875, 0.560089111328125, 0.6195220947265625, 0.678955078125, 0.7383880615234375, 0.797821044921875, 0.8572540283203125, 0.91668701171875, 0.9761199951171875, 1.035552978515625, 1.0949859619140625, 1.1544189453125, 1.2138519287109375, 1.273284912109375, 1.3327178955078125, 1.39215087890625, 1.4515838623046875, 1.511016845703125, 1.5704498291015625, 1.6298828125]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 7.0, 5.0, 9.0, 7.0, 16.0, 23.0, 17.0, 25.0, 36.0, 44.0, 44.0, 59.0, 58.0, 69.0, 76.0, 75.0, 61.0, 74.0, 45.0, 35.0, 34.0, 35.0, 23.0, 23.0, 16.0, 14.0, 12.0, 17.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-15.12641716003418, -14.716930389404297, -14.307442665100098, -13.897955894470215, -13.488469123840332, -13.078981399536133, -12.66949462890625, -12.260007858276367, -11.850521087646484, -11.441034317016602, -11.031546592712402, -10.62205982208252, -10.212573051452637, -9.803085327148438, -9.393598556518555, -8.984111785888672, -8.574624061584473, -8.16513729095459, -7.755650043487549, -7.346162796020508, -6.936676025390625, -6.527188777923584, -6.117701530456543, -5.70821475982666, -5.298727512359619, -4.889240264892578, -4.479753494262695, -4.070266246795654, -3.6607792377471924, -3.2512922286987305, -2.8418049812316895, -2.4323179721832275, -2.0228309631347656, -1.6133439540863037, -1.2038568258285522, -0.7943696975708008, -0.38488268852233887, 0.024604320526123047, 0.43409156799316406, 0.843578577041626, 1.253065586090088, 1.6625525951385498, 2.0720396041870117, 2.4815268516540527, 2.8910138607025146, 3.3005008697509766, 3.7099881172180176, 4.119475364685059, 4.528962135314941, 4.938449382781982, 5.347936153411865, 5.757423400878906, 6.166910171508789, 6.57639741897583, 6.985884666442871, 7.395371437072754, 7.804858684539795, 8.214345932006836, 8.623832702636719, 9.033319473266602, 9.4428071975708, 9.852293968200684, 10.261781692504883, 10.671268463134766, 11.080755233764648]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 1.0, 0.0, 4.0, 7.0, 10.0, 10.0, 20.0, 11.0, 14.0, 25.0, 14.0, 26.0, 33.0, 38.0, 26.0, 26.0, 36.0, 45.0, 43.0, 45.0, 44.0, 44.0, 65.0, 37.0, 35.0, 41.0, 39.0, 28.0, 33.0, 20.0, 24.0, 22.0, 14.0, 15.0, 24.0, 14.0, 17.0, 11.0, 8.0, 7.0, 5.0, 8.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.485816955566406, -12.1128568649292, -11.739895820617676, -11.366935729980469, -10.993975639343262, -10.621015548706055, -10.248054504394531, -9.875094413757324, -9.502134323120117, -9.12917423248291, -8.756213188171387, -8.38325309753418, -8.010293006896973, -7.637332439422607, -7.264371871948242, -6.891411781311035, -6.518450736999512, -6.1454901695251465, -5.7725300788879395, -5.399569511413574, -5.026609420776367, -4.653648853302002, -4.280688285827637, -3.9077279567718506, -3.5347676277160645, -3.1618072986602783, -2.788846969604492, -2.415886402130127, -2.042926073074341, -1.6699657440185547, -1.2970051765441895, -0.9240448474884033, -0.5510835647583008, -0.17812317609786987, 0.19483721256256104, 0.5677976608276367, 0.9407579898834229, 1.313718318939209, 1.6866788864135742, 2.0596392154693604, 2.4325995445251465, 2.8055598735809326, 3.1785202026367188, 3.551480770111084, 3.92444109916687, 4.297401428222656, 4.6703619956970215, 5.043322563171387, 5.416282653808594, 5.789243221282959, 6.162203311920166, 6.535163879394531, 6.908123970031738, 7.2810845375061035, 7.654045104980469, 8.027005195617676, 8.399965286254883, 8.77292537689209, 9.145886421203613, 9.51884651184082, 9.891806602478027, 10.264766693115234, 10.637727737426758, 11.010687828063965, 11.383648872375488]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 2.0, 6.0, 5.0, 18.0, 38.0, 50.0, 58.0, 96.0, 153.0, 237.0, 306.0, 449.0, 633.0, 1044.0, 1446.0, 2139.0, 3230.0, 4677.0, 6987.0, 10612.0, 16066.0, 25605.0, 41004.0, 67841.0, 119586.0, 236120.0, 547163.0, 1134106.0, 1036710.0, 460742.0, 203126.0, 106629.0, 61419.0, 37184.0, 23650.0, 15120.0, 9817.0, 6541.0, 4540.0, 2935.0, 2021.0, 1360.0, 944.0, 609.0, 485.0, 278.0, 190.0, 117.0, 68.0, 51.0, 26.0, 24.0, 11.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.1171875, -12.6927490234375, -12.268310546875, -11.8438720703125, -11.41943359375, -10.9949951171875, -10.570556640625, -10.1461181640625, -9.7216796875, -9.2972412109375, -8.872802734375, -8.4483642578125, -8.02392578125, -7.5994873046875, -7.175048828125, -6.7506103515625, -6.326171875, -5.9017333984375, -5.477294921875, -5.0528564453125, -4.62841796875, -4.2039794921875, -3.779541015625, -3.3551025390625, -2.9306640625, -2.5062255859375, -2.081787109375, -1.6573486328125, -1.23291015625, -0.8084716796875, -0.384033203125, 0.0404052734375, 0.46484375, 0.8892822265625, 1.313720703125, 1.7381591796875, 2.16259765625, 2.5870361328125, 3.011474609375, 3.4359130859375, 3.8603515625, 4.2847900390625, 4.709228515625, 5.1336669921875, 5.55810546875, 5.9825439453125, 6.406982421875, 6.8314208984375, 7.255859375, 7.6802978515625, 8.104736328125, 8.5291748046875, 8.95361328125, 9.3780517578125, 9.802490234375, 10.2269287109375, 10.6513671875, 11.0758056640625, 11.500244140625, 11.9246826171875, 12.34912109375, 12.7735595703125, 13.197998046875, 13.6224365234375, 14.046875]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 4.0, 9.0, 7.0, 15.0, 13.0, 11.0, 12.0, 16.0, 25.0, 31.0, 21.0, 27.0, 32.0, 30.0, 29.0, 47.0, 42.0, 42.0, 43.0, 41.0, 50.0, 40.0, 38.0, 45.0, 38.0, 34.0, 30.0, 26.0, 18.0, 29.0, 18.0, 16.0, 28.0, 15.0, 12.0, 13.0, 9.0, 10.0, 6.0, 2.0, 5.0, 6.0, 4.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.375, -9.0889892578125, -8.802978515625, -8.5169677734375, -8.23095703125, -7.9449462890625, -7.658935546875, -7.3729248046875, -7.0869140625, -6.8009033203125, -6.514892578125, -6.2288818359375, -5.94287109375, -5.6568603515625, -5.370849609375, -5.0848388671875, -4.798828125, -4.5128173828125, -4.226806640625, -3.9407958984375, -3.65478515625, -3.3687744140625, -3.082763671875, -2.7967529296875, -2.5107421875, -2.2247314453125, -1.938720703125, -1.6527099609375, -1.36669921875, -1.0806884765625, -0.794677734375, -0.5086669921875, -0.22265625, 0.0633544921875, 0.349365234375, 0.6353759765625, 0.92138671875, 1.2073974609375, 1.493408203125, 1.7794189453125, 2.0654296875, 2.3514404296875, 2.637451171875, 2.9234619140625, 3.20947265625, 3.4954833984375, 3.781494140625, 4.0675048828125, 4.353515625, 4.6395263671875, 4.925537109375, 5.2115478515625, 5.49755859375, 5.7835693359375, 6.069580078125, 6.3555908203125, 6.6416015625, 6.9276123046875, 7.213623046875, 7.4996337890625, 7.78564453125, 8.0716552734375, 8.357666015625, 8.6436767578125, 8.9296875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 22.0, 20.0, 29.0, 67.0, 78.0, 116.0, 197.0, 289.0, 440.0, 721.0, 1113.0, 1728.0, 2791.0, 4706.0, 7585.0, 12773.0, 21989.0, 38384.0, 68661.0, 127729.0, 246432.0, 492261.0, 962413.0, 1046553.0, 556630.0, 278099.0, 143320.0, 76708.0, 42095.0, 24460.0, 14160.0, 8397.0, 5022.0, 3122.0, 1913.0, 1221.0, 721.0, 484.0, 302.0, 189.0, 106.0, 80.0, 52.0, 32.0, 30.0, 17.0, 10.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.6640625, -12.2431640625, -11.822265625, -11.4013671875, -10.98046875, -10.5595703125, -10.138671875, -9.7177734375, -9.296875, -8.8759765625, -8.455078125, -8.0341796875, -7.61328125, -7.1923828125, -6.771484375, -6.3505859375, -5.9296875, -5.5087890625, -5.087890625, -4.6669921875, -4.24609375, -3.8251953125, -3.404296875, -2.9833984375, -2.5625, -2.1416015625, -1.720703125, -1.2998046875, -0.87890625, -0.4580078125, -0.037109375, 0.3837890625, 0.8046875, 1.2255859375, 1.646484375, 2.0673828125, 2.48828125, 2.9091796875, 3.330078125, 3.7509765625, 4.171875, 4.5927734375, 5.013671875, 5.4345703125, 5.85546875, 6.2763671875, 6.697265625, 7.1181640625, 7.5390625, 7.9599609375, 8.380859375, 8.8017578125, 9.22265625, 9.6435546875, 10.064453125, 10.4853515625, 10.90625, 11.3271484375, 11.748046875, 12.1689453125, 12.58984375, 13.0107421875, 13.431640625, 13.8525390625, 14.2734375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 12.0, 13.0, 20.0, 13.0, 24.0, 31.0, 38.0, 53.0, 67.0, 71.0, 96.0, 110.0, 140.0, 176.0, 190.0, 235.0, 231.0, 262.0, 296.0, 256.0, 277.0, 239.0, 195.0, 178.0, 152.0, 139.0, 105.0, 90.0, 78.0, 63.0, 36.0, 40.0, 30.0, 24.0, 17.0, 17.0, 13.0, 10.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.29150390625, -4.1416015625, -3.99169921875, -3.841796875, -3.69189453125, -3.5419921875, -3.39208984375, -3.2421875, -3.09228515625, -2.9423828125, -2.79248046875, -2.642578125, -2.49267578125, -2.3427734375, -2.19287109375, -2.04296875, -1.89306640625, -1.7431640625, -1.59326171875, -1.443359375, -1.29345703125, -1.1435546875, -0.99365234375, -0.84375, -0.69384765625, -0.5439453125, -0.39404296875, -0.244140625, -0.09423828125, 0.0556640625, 0.20556640625, 0.35546875, 0.50537109375, 0.6552734375, 0.80517578125, 0.955078125, 1.10498046875, 1.2548828125, 1.40478515625, 1.5546875, 1.70458984375, 1.8544921875, 2.00439453125, 2.154296875, 2.30419921875, 2.4541015625, 2.60400390625, 2.75390625, 2.90380859375, 3.0537109375, 3.20361328125, 3.353515625, 3.50341796875, 3.6533203125, 3.80322265625, 3.953125, 4.10302734375, 4.2529296875, 4.40283203125, 4.552734375, 4.70263671875, 4.8525390625, 5.00244140625, 5.15234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 10.0, 10.0, 17.0, 6.0, 13.0, 27.0, 23.0, 29.0, 34.0, 52.0, 52.0, 54.0, 73.0, 78.0, 82.0, 72.0, 68.0, 53.0, 41.0, 41.0, 28.0, 29.0, 15.0, 21.0, 7.0, 12.0, 9.0, 6.0, 5.0, 6.0, 5.0, 5.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.724020004272461, -12.34917163848877, -11.974323272705078, -11.599475860595703, -11.224627494812012, -10.84977912902832, -10.474930763244629, -10.100082397460938, -9.725234031677246, -9.350385665893555, -8.975537300109863, -8.600688934326172, -8.225841522216797, -7.8509931564331055, -7.476144790649414, -7.101296424865723, -6.7264485359191895, -6.351600170135498, -5.976752281188965, -5.601903915405273, -5.227055549621582, -4.852207183837891, -4.477359294891357, -4.102510929107666, -3.7276628017425537, -3.3528146743774414, -2.97796630859375, -2.6031181812286377, -2.2282700538635254, -1.853421688079834, -1.4785735607147217, -1.1037251949310303, -0.728877067565918, -0.3540288507938385, 0.020819365978240967, 0.39566755294799805, 0.7705157995223999, 1.1453640460968018, 1.520212173461914, 1.8950605392456055, 2.2699086666107178, 2.64475679397583, 3.0196051597595215, 3.394453287124634, 3.769301414489746, 4.1441497802734375, 4.518998146057129, 4.89384651184082, 5.2686944007873535, 5.643542766571045, 6.018390655517578, 6.3932390213012695, 6.768087387084961, 7.142935752868652, 7.5177836418151855, 7.892632007598877, 8.26747989654541, 8.642328262329102, 9.017176628112793, 9.392024993896484, 9.76687240600586, 10.14172077178955, 10.516569137573242, 10.891417503356934, 11.266265869140625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 5.0, 3.0, 9.0, 11.0, 8.0, 14.0, 14.0, 18.0, 24.0, 27.0, 31.0, 26.0, 45.0, 35.0, 36.0, 36.0, 40.0, 45.0, 50.0, 38.0, 38.0, 48.0, 49.0, 37.0, 41.0, 33.0, 35.0, 25.0, 24.0, 29.0, 14.0, 13.0, 14.0, 16.0, 18.0, 6.0, 9.0, 6.0, 12.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.55821418762207, -10.219274520874023, -9.880335807800293, -9.541396141052246, -9.2024564743042, -8.863517761230469, -8.524578094482422, -8.185638427734375, -7.846699237823486, -7.507760047912598, -7.168820381164551, -6.829881191253662, -6.490942001342773, -6.152002334594727, -5.813063144683838, -5.474123954772949, -5.135184288024902, -4.796245098114014, -4.457305431365967, -4.118366241455078, -3.7794268131256104, -3.4404873847961426, -3.101548194885254, -2.762608766555786, -2.4236693382263184, -2.0847299098968506, -1.7457906007766724, -1.4068512916564941, -1.0679118633270264, -0.7289724349975586, -0.3900332450866699, -0.05109381675720215, 0.2878446578979492, 0.6267840266227722, 0.9657233953475952, 1.3046627044677734, 1.6436021327972412, 1.982541561126709, 2.3214807510375977, 2.6604201793670654, 2.999359607696533, 3.338299036026001, 3.6772384643554688, 4.016177654266357, 4.355116844177246, 4.694056510925293, 5.032995700836182, 5.37193489074707, 5.710874557495117, 6.049813747406006, 6.388753414154053, 6.727692604064941, 7.066632270812988, 7.405571460723877, 7.744510650634766, 8.083450317382812, 8.42238998413086, 8.761329650878906, 9.100268363952637, 9.439208030700684, 9.77814769744873, 10.117086410522461, 10.456026077270508, 10.794965744018555, 11.133904457092285]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 13.0, 13.0, 23.0, 36.0, 45.0, 95.0, 118.0, 213.0, 314.0, 508.0, 823.0, 1220.0, 1925.0, 3258.0, 5084.0, 8349.0, 14001.0, 22886.0, 37916.0, 62770.0, 104852.0, 181318.0, 243079.0, 144075.0, 85531.0, 51110.0, 30742.0, 18615.0, 11272.0, 6895.0, 4270.0, 2667.0, 1661.0, 1020.0, 664.0, 407.0, 265.0, 172.0, 107.0, 84.0, 45.0, 39.0, 22.0, 14.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.796875, -4.6385498046875, -4.480224609375, -4.3218994140625, -4.16357421875, -4.0052490234375, -3.846923828125, -3.6885986328125, -3.5302734375, -3.3719482421875, -3.213623046875, -3.0552978515625, -2.89697265625, -2.7386474609375, -2.580322265625, -2.4219970703125, -2.263671875, -2.1053466796875, -1.947021484375, -1.7886962890625, -1.63037109375, -1.4720458984375, -1.313720703125, -1.1553955078125, -0.9970703125, -0.8387451171875, -0.680419921875, -0.5220947265625, -0.36376953125, -0.2054443359375, -0.047119140625, 0.1112060546875, 0.26953125, 0.4278564453125, 0.586181640625, 0.7445068359375, 0.90283203125, 1.0611572265625, 1.219482421875, 1.3778076171875, 1.5361328125, 1.6944580078125, 1.852783203125, 2.0111083984375, 2.16943359375, 2.3277587890625, 2.486083984375, 2.6444091796875, 2.802734375, 2.9610595703125, 3.119384765625, 3.2777099609375, 3.43603515625, 3.5943603515625, 3.752685546875, 3.9110107421875, 4.0693359375, 4.2276611328125, 4.385986328125, 4.5443115234375, 4.70263671875, 4.8609619140625, 5.019287109375, 5.1776123046875, 5.3359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 3.0, 5.0, 3.0, 11.0, 10.0, 14.0, 14.0, 11.0, 11.0, 29.0, 32.0, 35.0, 28.0, 29.0, 27.0, 51.0, 29.0, 42.0, 41.0, 45.0, 49.0, 56.0, 41.0, 50.0, 42.0, 37.0, 32.0, 21.0, 32.0, 28.0, 28.0, 19.0, 19.0, 14.0, 12.0, 10.0, 14.0, 5.0, 3.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -11.0595703125, -10.705078125, -10.3505859375, -9.99609375, -9.6416015625, -9.287109375, -8.9326171875, -8.578125, -8.2236328125, -7.869140625, -7.5146484375, -7.16015625, -6.8056640625, -6.451171875, -6.0966796875, -5.7421875, -5.3876953125, -5.033203125, -4.6787109375, -4.32421875, -3.9697265625, -3.615234375, -3.2607421875, -2.90625, -2.5517578125, -2.197265625, -1.8427734375, -1.48828125, -1.1337890625, -0.779296875, -0.4248046875, -0.0703125, 0.2841796875, 0.638671875, 0.9931640625, 1.34765625, 1.7021484375, 2.056640625, 2.4111328125, 2.765625, 3.1201171875, 3.474609375, 3.8291015625, 4.18359375, 4.5380859375, 4.892578125, 5.2470703125, 5.6015625, 5.9560546875, 6.310546875, 6.6650390625, 7.01953125, 7.3740234375, 7.728515625, 8.0830078125, 8.4375, 8.7919921875, 9.146484375, 9.5009765625, 9.85546875, 10.2099609375, 10.564453125, 10.9189453125, 11.2734375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 8.0, 16.0, 12.0, 24.0, 35.0, 52.0, 94.0, 150.0, 246.0, 377.0, 655.0, 1230.0, 2096.0, 3941.0, 7163.0, 14434.0, 29396.0, 63144.0, 140342.0, 327822.0, 252303.0, 107750.0, 48965.0, 23585.0, 11332.0, 5992.0, 3147.0, 1766.0, 1008.0, 547.0, 352.0, 211.0, 138.0, 80.0, 41.0, 37.0, 16.0, 19.0, 8.0, 7.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3359375, -7.112548828125, -6.88916015625, -6.665771484375, -6.4423828125, -6.218994140625, -5.99560546875, -5.772216796875, -5.548828125, -5.325439453125, -5.10205078125, -4.878662109375, -4.6552734375, -4.431884765625, -4.20849609375, -3.985107421875, -3.76171875, -3.538330078125, -3.31494140625, -3.091552734375, -2.8681640625, -2.644775390625, -2.42138671875, -2.197998046875, -1.974609375, -1.751220703125, -1.52783203125, -1.304443359375, -1.0810546875, -0.857666015625, -0.63427734375, -0.410888671875, -0.1875, 0.035888671875, 0.25927734375, 0.482666015625, 0.7060546875, 0.929443359375, 1.15283203125, 1.376220703125, 1.599609375, 1.822998046875, 2.04638671875, 2.269775390625, 2.4931640625, 2.716552734375, 2.93994140625, 3.163330078125, 3.38671875, 3.610107421875, 3.83349609375, 4.056884765625, 4.2802734375, 4.503662109375, 4.72705078125, 4.950439453125, 5.173828125, 5.397216796875, 5.62060546875, 5.843994140625, 6.0673828125, 6.290771484375, 6.51416015625, 6.737548828125, 6.9609375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 4.0, 12.0, 5.0, 13.0, 11.0, 14.0, 29.0, 13.0, 26.0, 32.0, 27.0, 38.0, 45.0, 47.0, 41.0, 47.0, 49.0, 40.0, 44.0, 54.0, 46.0, 51.0, 37.0, 40.0, 38.0, 32.0, 33.0, 21.0, 20.0, 18.0, 21.0, 9.0, 11.0, 6.0, 7.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0078125, -7.7628173828125, -7.517822265625, -7.2728271484375, -7.02783203125, -6.7828369140625, -6.537841796875, -6.2928466796875, -6.0478515625, -5.8028564453125, -5.557861328125, -5.3128662109375, -5.06787109375, -4.8228759765625, -4.577880859375, -4.3328857421875, -4.087890625, -3.8428955078125, -3.597900390625, -3.3529052734375, -3.10791015625, -2.8629150390625, -2.617919921875, -2.3729248046875, -2.1279296875, -1.8829345703125, -1.637939453125, -1.3929443359375, -1.14794921875, -0.9029541015625, -0.657958984375, -0.4129638671875, -0.16796875, 0.0770263671875, 0.322021484375, 0.5670166015625, 0.81201171875, 1.0570068359375, 1.302001953125, 1.5469970703125, 1.7919921875, 2.0369873046875, 2.281982421875, 2.5269775390625, 2.77197265625, 3.0169677734375, 3.261962890625, 3.5069580078125, 3.751953125, 3.9969482421875, 4.241943359375, 4.4869384765625, 4.73193359375, 4.9769287109375, 5.221923828125, 5.4669189453125, 5.7119140625, 5.9569091796875, 6.201904296875, 6.4468994140625, 6.69189453125, 6.9368896484375, 7.181884765625, 7.4268798828125, 7.671875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 12.0, 5.0, 18.0, 27.0, 38.0, 67.0, 96.0, 173.0, 306.0, 503.0, 941.0, 1757.0, 3297.0, 6407.0, 13640.0, 30827.0, 82238.0, 286014.0, 428900.0, 117603.0, 41102.0, 17396.0, 8309.0, 4138.0, 2082.0, 1088.0, 642.0, 376.0, 206.0, 121.0, 63.0, 60.0, 28.0, 20.0, 18.0, 12.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.09710693359375, -0.0943450927734375, -0.091583251953125, -0.0888214111328125, -0.0860595703125, -0.0832977294921875, -0.080535888671875, -0.0777740478515625, -0.07501220703125, -0.0722503662109375, -0.069488525390625, -0.0667266845703125, -0.06396484375, -0.0612030029296875, -0.058441162109375, -0.0556793212890625, -0.05291748046875, -0.0501556396484375, -0.047393798828125, -0.0446319580078125, -0.0418701171875, -0.0391082763671875, -0.036346435546875, -0.0335845947265625, -0.03082275390625, -0.0280609130859375, -0.025299072265625, -0.0225372314453125, -0.019775390625, -0.0170135498046875, -0.014251708984375, -0.0114898681640625, -0.00872802734375, -0.0059661865234375, -0.003204345703125, -0.0004425048828125, 0.0023193359375, 0.0050811767578125, 0.007843017578125, 0.0106048583984375, 0.01336669921875, 0.0161285400390625, 0.018890380859375, 0.0216522216796875, 0.0244140625, 0.0271759033203125, 0.029937744140625, 0.0326995849609375, 0.03546142578125, 0.0382232666015625, 0.040985107421875, 0.0437469482421875, 0.0465087890625, 0.0492706298828125, 0.052032470703125, 0.0547943115234375, 0.05755615234375, 0.0603179931640625, 0.063079833984375, 0.0658416748046875, 0.068603515625, 0.0713653564453125, 0.074127197265625, 0.0768890380859375, 0.07965087890625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 5.0, 2.0, 7.0, 10.0, 12.0, 12.0, 23.0, 21.0, 29.0, 42.0, 35.0, 79.0, 71.0, 90.0, 91.0, 75.0, 72.0, 72.0, 49.0, 46.0, 42.0, 24.0, 24.0, 12.0, 18.0, 12.0, 5.0, 7.0, 3.0, 2.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4139881134033203e-05, -2.332683652639389e-05, -2.2513791918754578e-05, -2.1700747311115265e-05, -2.0887702703475952e-05, -2.007465809583664e-05, -1.9261613488197327e-05, -1.8448568880558014e-05, -1.76355242729187e-05, -1.682247966527939e-05, -1.6009435057640076e-05, -1.5196390450000763e-05, -1.438334584236145e-05, -1.3570301234722137e-05, -1.2757256627082825e-05, -1.1944212019443512e-05, -1.11311674118042e-05, -1.0318122804164886e-05, -9.505078196525574e-06, -8.692033588886261e-06, -7.878988981246948e-06, -7.0659443736076355e-06, -6.252899765968323e-06, -5.43985515832901e-06, -4.626810550689697e-06, -3.8137659430503845e-06, -3.0007213354110718e-06, -2.187676727771759e-06, -1.3746321201324463e-06, -5.615875124931335e-07, 2.514570951461792e-07, 1.064501702785492e-06, 1.8775463104248047e-06, 2.6905909180641174e-06, 3.50363552570343e-06, 4.316680133342743e-06, 5.129724740982056e-06, 5.942769348621368e-06, 6.755813956260681e-06, 7.568858563899994e-06, 8.381903171539307e-06, 9.19494777917862e-06, 1.0007992386817932e-05, 1.0821036994457245e-05, 1.1634081602096558e-05, 1.244712620973587e-05, 1.3260170817375183e-05, 1.4073215425014496e-05, 1.4886260032653809e-05, 1.569930464029312e-05, 1.6512349247932434e-05, 1.7325393855571747e-05, 1.813843846321106e-05, 1.8951483070850372e-05, 1.9764527678489685e-05, 2.0577572286128998e-05, 2.139061689376831e-05, 2.2203661501407623e-05, 2.3016706109046936e-05, 2.382975071668625e-05, 2.464279532432556e-05, 2.5455839931964874e-05, 2.6268884539604187e-05, 2.70819291472435e-05, 2.7894973754882812e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 11.0, 17.0, 22.0, 18.0, 34.0, 53.0, 71.0, 104.0, 148.0, 182.0, 300.0, 443.0, 611.0, 969.0, 1435.0, 2237.0, 3529.0, 5738.0, 9180.0, 15344.0, 26679.0, 49353.0, 98675.0, 221162.0, 313428.0, 143149.0, 68566.0, 35551.0, 19910.0, 11707.0, 7084.0, 4487.0, 2827.0, 1772.0, 1250.0, 803.0, 549.0, 331.0, 248.0, 161.0, 127.0, 88.0, 52.0, 62.0, 27.0, 20.0, 13.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.05413818359375, -0.052405357360839844, -0.05067253112792969, -0.04893970489501953, -0.047206878662109375, -0.04547405242919922, -0.04374122619628906, -0.042008399963378906, -0.04027557373046875, -0.038542747497558594, -0.03680992126464844, -0.03507709503173828, -0.033344268798828125, -0.03161144256591797, -0.029878616333007812, -0.028145790100097656, -0.0264129638671875, -0.024680137634277344, -0.022947311401367188, -0.02121448516845703, -0.019481658935546875, -0.01774883270263672, -0.016016006469726562, -0.014283180236816406, -0.01255035400390625, -0.010817527770996094, -0.009084701538085938, -0.007351875305175781, -0.005619049072265625, -0.0038862228393554688, -0.0021533966064453125, -0.00042057037353515625, 0.001312255859375, 0.0030450820922851562, 0.0047779083251953125, 0.006510734558105469, 0.008243560791015625, 0.009976387023925781, 0.011709213256835938, 0.013442039489746094, 0.01517486572265625, 0.016907691955566406, 0.018640518188476562, 0.02037334442138672, 0.022106170654296875, 0.02383899688720703, 0.025571823120117188, 0.027304649353027344, 0.0290374755859375, 0.030770301818847656, 0.03250312805175781, 0.03423595428466797, 0.035968780517578125, 0.03770160675048828, 0.03943443298339844, 0.041167259216308594, 0.04290008544921875, 0.044632911682128906, 0.04636573791503906, 0.04809856414794922, 0.049831390380859375, 0.05156421661376953, 0.05329704284667969, 0.055029869079589844, 0.0567626953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 11.0, 9.0, 13.0, 14.0, 25.0, 24.0, 47.0, 47.0, 54.0, 87.0, 90.0, 95.0, 80.0, 83.0, 60.0, 51.0, 43.0, 35.0, 31.0, 13.0, 6.0, 12.0, 11.0, 9.0, 7.0, 7.0, 6.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02423095703125, -0.023545026779174805, -0.02285909652709961, -0.022173166275024414, -0.02148723602294922, -0.020801305770874023, -0.020115375518798828, -0.019429445266723633, -0.018743515014648438, -0.018057584762573242, -0.017371654510498047, -0.01668572425842285, -0.015999794006347656, -0.015313863754272461, -0.014627933502197266, -0.01394200325012207, -0.013256072998046875, -0.01257014274597168, -0.011884212493896484, -0.011198282241821289, -0.010512351989746094, -0.009826421737670898, -0.009140491485595703, -0.008454561233520508, -0.0077686309814453125, -0.007082700729370117, -0.006396770477294922, -0.0057108402252197266, -0.005024909973144531, -0.004338979721069336, -0.0036530494689941406, -0.0029671192169189453, -0.00228118896484375, -0.0015952587127685547, -0.0009093284606933594, -0.00022339820861816406, 0.00046253204345703125, 0.0011484622955322266, 0.0018343925476074219, 0.002520322799682617, 0.0032062530517578125, 0.003892183303833008, 0.004578113555908203, 0.0052640438079833984, 0.005949974060058594, 0.006635904312133789, 0.007321834564208984, 0.00800776481628418, 0.008693695068359375, 0.00937962532043457, 0.010065555572509766, 0.010751485824584961, 0.011437416076660156, 0.012123346328735352, 0.012809276580810547, 0.013495206832885742, 0.014181137084960938, 0.014867067337036133, 0.015552997589111328, 0.016238927841186523, 0.01692485809326172, 0.017610788345336914, 0.01829671859741211, 0.018982648849487305, 0.0196685791015625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 6.0, 12.0, 5.0, 15.0, 10.0, 12.0, 6.0, 27.0, 26.0, 30.0, 40.0, 51.0, 56.0, 59.0, 68.0, 80.0, 95.0, 75.0, 53.0, 50.0, 42.0, 41.0, 31.0, 24.0, 13.0, 19.0, 7.0, 11.0, 8.0, 7.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.837623596191406, -12.457071304321289, -12.076518058776855, -11.695965766906738, -11.315413475036621, -10.934860229492188, -10.55430793762207, -10.173755645751953, -9.793203353881836, -9.412651062011719, -9.032097816467285, -8.651545524597168, -8.27099323272705, -7.890440464019775, -7.5098876953125, -7.129335403442383, -6.748782157897949, -6.368229389190674, -5.987677097320557, -5.607124328613281, -5.226572036743164, -4.846019268035889, -4.465466499328613, -4.084914207458496, -3.7043614387512207, -3.3238089084625244, -2.943256378173828, -2.5627036094665527, -2.1821510791778564, -1.8015985488891602, -1.4210457801818848, -1.0404932498931885, -0.6599416732788086, -0.27938908338546753, 0.10116350650787354, 0.4817161560058594, 0.8622686862945557, 1.242821216583252, 1.6233739852905273, 2.0039265155792236, 2.38447904586792, 2.765031576156616, 3.1455841064453125, 3.526136875152588, 3.906689405441284, 4.2872419357299805, 4.667794704437256, 5.048347473144531, 5.428899765014648, 5.809452533721924, 6.190004825592041, 6.570557594299316, 6.951109886169434, 7.331662654876709, 7.712215423583984, 8.092767715454102, 8.473320007324219, 8.853872299194336, 9.23442554473877, 9.614977836608887, 9.995530128479004, 10.376083374023438, 10.756635665893555, 11.137187957763672, 11.517741203308105]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 3.0, 4.0, 8.0, 13.0, 7.0, 13.0, 14.0, 19.0, 23.0, 28.0, 32.0, 26.0, 42.0, 35.0, 35.0, 38.0, 40.0, 43.0, 53.0, 37.0, 38.0, 49.0, 46.0, 40.0, 41.0, 32.0, 35.0, 25.0, 25.0, 29.0, 14.0, 13.0, 13.0, 15.0, 19.0, 8.0, 8.0, 6.0, 12.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.551474571228027, -10.214794158935547, -9.878113746643066, -9.541433334350586, -9.204751968383789, -8.868071556091309, -8.531391143798828, -8.194710731506348, -7.858030319213867, -7.521349906921387, -7.184669017791748, -6.847988605499268, -6.511308193206787, -6.174627304077148, -5.837946891784668, -5.5012664794921875, -5.164585590362549, -4.827905178070068, -4.49122428894043, -4.154543876647949, -3.8178634643554688, -3.481182813644409, -3.1445021629333496, -2.807821750640869, -2.4711410999298096, -2.13446044921875, -1.7977800369262695, -1.46109938621521, -1.12441885471344, -0.7877383232116699, -0.45105767250061035, -0.11437726020812988, 0.2223033905029297, 0.5589839220046997, 0.8956645131111145, 1.2323451042175293, 1.5690256357192993, 1.9057061672210693, 2.242386817932129, 2.5790672302246094, 2.915747880935669, 3.2524285316467285, 3.589108943939209, 3.9257895946502686, 4.262470245361328, 4.599150657653809, 4.935831069946289, 5.2725114822387695, 5.609192371368408, 5.945872783660889, 6.282553672790527, 6.619234085083008, 6.955914497375488, 7.292594909667969, 7.629275798797607, 7.965956211090088, 8.302637100219727, 8.639317512512207, 8.975997924804688, 9.312679290771484, 9.649359703063965, 9.986040115356445, 10.322720527648926, 10.659400939941406, 10.996081352233887]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 6.0, 9.0, 19.0, 23.0, 33.0, 51.0, 89.0, 128.0, 188.0, 303.0, 431.0, 630.0, 1037.0, 1554.0, 2485.0, 3813.0, 5908.0, 9127.0, 14785.0, 23414.0, 37807.0, 60297.0, 97338.0, 149092.0, 184619.0, 161603.0, 110660.0, 68438.0, 42264.0, 26585.0, 16637.0, 10305.0, 6655.0, 4278.0, 2787.0, 1780.0, 1192.0, 729.0, 506.0, 315.0, 230.0, 136.0, 104.0, 61.0, 39.0, 25.0, 14.0, 5.0, 9.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.1015625, -14.6241455078125, -14.146728515625, -13.6693115234375, -13.19189453125, -12.7144775390625, -12.237060546875, -11.7596435546875, -11.2822265625, -10.8048095703125, -10.327392578125, -9.8499755859375, -9.37255859375, -8.8951416015625, -8.417724609375, -7.9403076171875, -7.462890625, -6.9854736328125, -6.508056640625, -6.0306396484375, -5.55322265625, -5.0758056640625, -4.598388671875, -4.1209716796875, -3.6435546875, -3.1661376953125, -2.688720703125, -2.2113037109375, -1.73388671875, -1.2564697265625, -0.779052734375, -0.3016357421875, 0.17578125, 0.6531982421875, 1.130615234375, 1.6080322265625, 2.08544921875, 2.5628662109375, 3.040283203125, 3.5177001953125, 3.9951171875, 4.4725341796875, 4.949951171875, 5.4273681640625, 5.90478515625, 6.3822021484375, 6.859619140625, 7.3370361328125, 7.814453125, 8.2918701171875, 8.769287109375, 9.2467041015625, 9.72412109375, 10.2015380859375, 10.678955078125, 11.1563720703125, 11.6337890625, 12.1112060546875, 12.588623046875, 13.0660400390625, 13.54345703125, 14.0208740234375, 14.498291015625, 14.9757080078125, 15.453125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 6.0, 12.0, 4.0, 4.0, 13.0, 11.0, 16.0, 15.0, 33.0, 26.0, 33.0, 31.0, 50.0, 30.0, 40.0, 59.0, 46.0, 44.0, 50.0, 43.0, 59.0, 48.0, 35.0, 44.0, 38.0, 24.0, 23.0, 27.0, 30.0, 12.0, 10.0, 15.0, 21.0, 14.0, 11.0, 6.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5390625, -10.20361328125, -9.8681640625, -9.53271484375, -9.197265625, -8.86181640625, -8.5263671875, -8.19091796875, -7.85546875, -7.52001953125, -7.1845703125, -6.84912109375, -6.513671875, -6.17822265625, -5.8427734375, -5.50732421875, -5.171875, -4.83642578125, -4.5009765625, -4.16552734375, -3.830078125, -3.49462890625, -3.1591796875, -2.82373046875, -2.48828125, -2.15283203125, -1.8173828125, -1.48193359375, -1.146484375, -0.81103515625, -0.4755859375, -0.14013671875, 0.1953125, 0.53076171875, 0.8662109375, 1.20166015625, 1.537109375, 1.87255859375, 2.2080078125, 2.54345703125, 2.87890625, 3.21435546875, 3.5498046875, 3.88525390625, 4.220703125, 4.55615234375, 4.8916015625, 5.22705078125, 5.5625, 5.89794921875, 6.2333984375, 6.56884765625, 6.904296875, 7.23974609375, 7.5751953125, 7.91064453125, 8.24609375, 8.58154296875, 8.9169921875, 9.25244140625, 9.587890625, 9.92333984375, 10.2587890625, 10.59423828125, 10.9296875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 9.0, 5.0, 19.0, 15.0, 31.0, 35.0, 55.0, 86.0, 142.0, 234.0, 301.0, 492.0, 771.0, 1072.0, 1645.0, 2530.0, 3949.0, 5939.0, 9393.0, 14424.0, 22582.0, 35446.0, 57123.0, 90513.0, 136463.0, 177362.0, 164778.0, 117317.0, 75118.0, 47258.0, 30229.0, 18806.0, 11924.0, 7929.0, 4981.0, 3237.0, 2195.0, 1417.0, 933.0, 629.0, 412.0, 263.0, 185.0, 91.0, 74.0, 44.0, 34.0, 30.0, 21.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.1953125, -14.7320556640625, -14.268798828125, -13.8055419921875, -13.34228515625, -12.8790283203125, -12.415771484375, -11.9525146484375, -11.4892578125, -11.0260009765625, -10.562744140625, -10.0994873046875, -9.63623046875, -9.1729736328125, -8.709716796875, -8.2464599609375, -7.783203125, -7.3199462890625, -6.856689453125, -6.3934326171875, -5.93017578125, -5.4669189453125, -5.003662109375, -4.5404052734375, -4.0771484375, -3.6138916015625, -3.150634765625, -2.6873779296875, -2.22412109375, -1.7608642578125, -1.297607421875, -0.8343505859375, -0.37109375, 0.0921630859375, 0.555419921875, 1.0186767578125, 1.48193359375, 1.9451904296875, 2.408447265625, 2.8717041015625, 3.3349609375, 3.7982177734375, 4.261474609375, 4.7247314453125, 5.18798828125, 5.6512451171875, 6.114501953125, 6.5777587890625, 7.041015625, 7.5042724609375, 7.967529296875, 8.4307861328125, 8.89404296875, 9.3572998046875, 9.820556640625, 10.2838134765625, 10.7470703125, 11.2103271484375, 11.673583984375, 12.1368408203125, 12.60009765625, 13.0633544921875, 13.526611328125, 13.9898681640625, 14.453125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 2.0, 7.0, 14.0, 7.0, 13.0, 10.0, 19.0, 19.0, 20.0, 19.0, 31.0, 25.0, 31.0, 33.0, 25.0, 43.0, 34.0, 42.0, 39.0, 44.0, 39.0, 45.0, 41.0, 39.0, 32.0, 46.0, 33.0, 32.0, 31.0, 36.0, 24.0, 22.0, 17.0, 14.0, 10.0, 7.0, 8.0, 6.0, 9.0, 10.0, 4.0, 11.0, 1.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.897216796875, -5.70068359375, -5.504150390625, -5.3076171875, -5.111083984375, -4.91455078125, -4.718017578125, -4.521484375, -4.324951171875, -4.12841796875, -3.931884765625, -3.7353515625, -3.538818359375, -3.34228515625, -3.145751953125, -2.94921875, -2.752685546875, -2.55615234375, -2.359619140625, -2.1630859375, -1.966552734375, -1.77001953125, -1.573486328125, -1.376953125, -1.180419921875, -0.98388671875, -0.787353515625, -0.5908203125, -0.394287109375, -0.19775390625, -0.001220703125, 0.1953125, 0.391845703125, 0.58837890625, 0.784912109375, 0.9814453125, 1.177978515625, 1.37451171875, 1.571044921875, 1.767578125, 1.964111328125, 2.16064453125, 2.357177734375, 2.5537109375, 2.750244140625, 2.94677734375, 3.143310546875, 3.33984375, 3.536376953125, 3.73291015625, 3.929443359375, 4.1259765625, 4.322509765625, 4.51904296875, 4.715576171875, 4.912109375, 5.108642578125, 5.30517578125, 5.501708984375, 5.6982421875, 5.894775390625, 6.09130859375, 6.287841796875, 6.484375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 5.0, 11.0, 15.0, 20.0, 23.0, 48.0, 45.0, 80.0, 102.0, 140.0, 184.0, 246.0, 379.0, 495.0, 658.0, 948.0, 1287.0, 1819.0, 2568.0, 3829.0, 5613.0, 8548.0, 13409.0, 21923.0, 39432.0, 83774.0, 294225.0, 363538.0, 95729.0, 42721.0, 23762.0, 14255.0, 9108.0, 6041.0, 4002.0, 2809.0, 1955.0, 1356.0, 963.0, 694.0, 486.0, 366.0, 260.0, 185.0, 144.0, 95.0, 74.0, 66.0, 36.0, 33.0, 17.0, 12.0, 8.0, 11.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0], "bins": [-5.15234375, -4.98651123046875, -4.8206787109375, -4.65484619140625, -4.489013671875, -4.32318115234375, -4.1573486328125, -3.99151611328125, -3.82568359375, -3.65985107421875, -3.4940185546875, -3.32818603515625, -3.162353515625, -2.99652099609375, -2.8306884765625, -2.66485595703125, -2.4990234375, -2.33319091796875, -2.1673583984375, -2.00152587890625, -1.835693359375, -1.66986083984375, -1.5040283203125, -1.33819580078125, -1.17236328125, -1.00653076171875, -0.8406982421875, -0.67486572265625, -0.509033203125, -0.34320068359375, -0.1773681640625, -0.01153564453125, 0.154296875, 0.32012939453125, 0.4859619140625, 0.65179443359375, 0.817626953125, 0.98345947265625, 1.1492919921875, 1.31512451171875, 1.48095703125, 1.64678955078125, 1.8126220703125, 1.97845458984375, 2.144287109375, 2.31011962890625, 2.4759521484375, 2.64178466796875, 2.8076171875, 2.97344970703125, 3.1392822265625, 3.30511474609375, 3.470947265625, 3.63677978515625, 3.8026123046875, 3.96844482421875, 4.13427734375, 4.30010986328125, 4.4659423828125, 4.63177490234375, 4.797607421875, 4.96343994140625, 5.1292724609375, 5.29510498046875, 5.4609375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 12.0, 11.0, 18.0, 20.0, 18.0, 33.0, 54.0, 74.0, 109.0, 124.0, 119.0, 102.0, 79.0, 47.0, 45.0, 27.0, 16.0, 18.0, 14.0, 8.0, 10.0, 7.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000400543212890625, -0.0003887563943862915, -0.000376969575881958, -0.0003651827573776245, -0.000353395938873291, -0.0003416091203689575, -0.000329822301864624, -0.00031803548336029053, -0.00030624866485595703, -0.00029446184635162354, -0.00028267502784729004, -0.00027088820934295654, -0.00025910139083862305, -0.00024731457233428955, -0.00023552775382995605, -0.00022374093532562256, -0.00021195411682128906, -0.00020016729831695557, -0.00018838047981262207, -0.00017659366130828857, -0.00016480684280395508, -0.00015302002429962158, -0.00014123320579528809, -0.0001294463872909546, -0.0001176595687866211, -0.0001058727502822876, -9.40859317779541e-05, -8.22991132736206e-05, -7.051229476928711e-05, -5.872547626495361e-05, -4.693865776062012e-05, -3.515183925628662e-05, -2.3365020751953125e-05, -1.1578202247619629e-05, 2.086162567138672e-07, 1.1995434761047363e-05, 2.378225326538086e-05, 3.5569071769714355e-05, 4.735589027404785e-05, 5.914270877838135e-05, 7.092952728271484e-05, 8.271634578704834e-05, 9.450316429138184e-05, 0.00010628998279571533, 0.00011807680130004883, 0.00012986361980438232, 0.00014165043830871582, 0.00015343725681304932, 0.0001652240753173828, 0.0001770108938217163, 0.0001887977123260498, 0.0002005845308303833, 0.0002123713493347168, 0.0002241581678390503, 0.0002359449863433838, 0.0002477318048477173, 0.0002595186233520508, 0.0002713054418563843, 0.0002830922603607178, 0.00029487907886505127, 0.00030666589736938477, 0.00031845271587371826, 0.00033023953437805176, 0.00034202635288238525, 0.00035381317138671875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 9.0, 9.0, 11.0, 12.0, 16.0, 29.0, 34.0, 53.0, 56.0, 95.0, 106.0, 167.0, 196.0, 256.0, 357.0, 465.0, 617.0, 858.0, 1152.0, 1559.0, 2048.0, 3119.0, 4691.0, 6945.0, 10769.0, 18133.0, 31651.0, 64151.0, 192684.0, 466662.0, 121991.0, 49001.0, 25845.0, 15126.0, 9430.0, 6091.0, 4017.0, 2788.0, 1922.0, 1390.0, 1064.0, 723.0, 581.0, 407.0, 329.0, 244.0, 195.0, 127.0, 116.0, 76.0, 46.0, 41.0, 30.0, 28.0, 11.0, 15.0, 10.0, 6.0, 4.0, 1.0, 3.0], "bins": [-5.33203125, -5.1671142578125, -5.002197265625, -4.8372802734375, -4.67236328125, -4.5074462890625, -4.342529296875, -4.1776123046875, -4.0126953125, -3.8477783203125, -3.682861328125, -3.5179443359375, -3.35302734375, -3.1881103515625, -3.023193359375, -2.8582763671875, -2.693359375, -2.5284423828125, -2.363525390625, -2.1986083984375, -2.03369140625, -1.8687744140625, -1.703857421875, -1.5389404296875, -1.3740234375, -1.2091064453125, -1.044189453125, -0.8792724609375, -0.71435546875, -0.5494384765625, -0.384521484375, -0.2196044921875, -0.0546875, 0.1102294921875, 0.275146484375, 0.4400634765625, 0.60498046875, 0.7698974609375, 0.934814453125, 1.0997314453125, 1.2646484375, 1.4295654296875, 1.594482421875, 1.7593994140625, 1.92431640625, 2.0892333984375, 2.254150390625, 2.4190673828125, 2.583984375, 2.7489013671875, 2.913818359375, 3.0787353515625, 3.24365234375, 3.4085693359375, 3.573486328125, 3.7384033203125, 3.9033203125, 4.0682373046875, 4.233154296875, 4.3980712890625, 4.56298828125, 4.7279052734375, 4.892822265625, 5.0577392578125, 5.22265625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 6.0, 6.0, 11.0, 6.0, 10.0, 15.0, 14.0, 13.0, 17.0, 28.0, 30.0, 38.0, 38.0, 74.0, 99.0, 138.0, 105.0, 61.0, 49.0, 43.0, 28.0, 27.0, 22.0, 20.0, 17.0, 14.0, 10.0, 14.0, 5.0, 5.0, 5.0, 2.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.8359375, -1.7796173095703125, -1.723297119140625, -1.6669769287109375, -1.61065673828125, -1.5543365478515625, -1.498016357421875, -1.4416961669921875, -1.3853759765625, -1.3290557861328125, -1.272735595703125, -1.2164154052734375, -1.16009521484375, -1.1037750244140625, -1.047454833984375, -0.9911346435546875, -0.934814453125, -0.8784942626953125, -0.822174072265625, -0.7658538818359375, -0.70953369140625, -0.6532135009765625, -0.596893310546875, -0.5405731201171875, -0.4842529296875, -0.4279327392578125, -0.371612548828125, -0.3152923583984375, -0.25897216796875, -0.2026519775390625, -0.146331787109375, -0.0900115966796875, -0.03369140625, 0.0226287841796875, 0.078948974609375, 0.1352691650390625, 0.19158935546875, 0.2479095458984375, 0.304229736328125, 0.3605499267578125, 0.4168701171875, 0.4731903076171875, 0.529510498046875, 0.5858306884765625, 0.64215087890625, 0.6984710693359375, 0.754791259765625, 0.8111114501953125, 0.867431640625, 0.9237518310546875, 0.980072021484375, 1.0363922119140625, 1.09271240234375, 1.1490325927734375, 1.205352783203125, 1.2616729736328125, 1.3179931640625, 1.3743133544921875, 1.430633544921875, 1.4869537353515625, 1.54327392578125, 1.5995941162109375, 1.655914306640625, 1.7122344970703125, 1.7685546875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 3.0, 10.0, 9.0, 13.0, 15.0, 21.0, 19.0, 18.0, 39.0, 54.0, 64.0, 69.0, 90.0, 95.0, 88.0, 67.0, 79.0, 49.0, 47.0, 32.0, 26.0, 16.0, 18.0, 15.0, 9.0, 4.0, 6.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.278871536254883, -11.865873336791992, -11.452875137329102, -11.039876937866211, -10.62687873840332, -10.21388053894043, -9.800882339477539, -9.387884140014648, -8.974885940551758, -8.561887741088867, -8.148889541625977, -7.735891342163086, -7.322893142700195, -6.909894943237305, -6.496896743774414, -6.083898544311523, -5.670900344848633, -5.257902145385742, -4.844903945922852, -4.431905746459961, -4.01890754699707, -3.6059093475341797, -3.192911148071289, -2.7799129486083984, -2.366914749145508, -1.9539165496826172, -1.5409183502197266, -1.127920150756836, -0.7149219512939453, -0.3019237518310547, 0.11107444763183594, 0.5240726470947266, 0.9370708465576172, 1.3500690460205078, 1.7630672454833984, 2.176065444946289, 2.5890636444091797, 3.0020618438720703, 3.415060043334961, 3.8280582427978516, 4.241056442260742, 4.654054641723633, 5.067052841186523, 5.480051040649414, 5.893049240112305, 6.306047439575195, 6.719045639038086, 7.132043838500977, 7.545042037963867, 7.958040237426758, 8.371038436889648, 8.784036636352539, 9.19703483581543, 9.61003303527832, 10.023031234741211, 10.436029434204102, 10.849027633666992, 11.262025833129883, 11.675024032592773, 12.088022232055664, 12.501020431518555, 12.914018630981445, 13.327016830444336, 13.740015029907227, 14.153013229370117]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 2.0, 8.0, 11.0, 3.0, 10.0, 17.0, 17.0, 30.0, 32.0, 26.0, 33.0, 25.0, 41.0, 43.0, 42.0, 43.0, 50.0, 52.0, 43.0, 49.0, 41.0, 45.0, 34.0, 41.0, 38.0, 27.0, 21.0, 37.0, 20.0, 11.0, 16.0, 18.0, 15.0, 10.0, 10.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.460538864135742, -10.117257118225098, -9.77397632598877, -9.430694580078125, -9.087413787841797, -8.744132041931152, -8.400850296020508, -8.05756950378418, -7.714288234710693, -7.371006965637207, -7.027725696563721, -6.684444427490234, -6.34116268157959, -5.997881889343262, -5.654600143432617, -5.311318874359131, -4.9680376052856445, -4.624756336212158, -4.281475067138672, -3.9381935596466064, -3.59491229057312, -3.251631021499634, -2.9083495140075684, -2.565068244934082, -2.2217869758605957, -1.8785057067871094, -1.5352243185043335, -1.1919429302215576, -0.8486616611480713, -0.505380392074585, -0.16209888458251953, 0.1811823844909668, 0.5244646072387695, 0.8677459359169006, 1.2110272645950317, 1.5543086528778076, 1.897589921951294, 2.2408711910247803, 2.5841526985168457, 2.927433967590332, 3.2707152366638184, 3.6139965057373047, 3.957277774810791, 4.300559043884277, 4.643840789794922, 4.98712158203125, 5.3304033279418945, 5.673684597015381, 6.016965866088867, 6.3602471351623535, 6.70352840423584, 7.046810150146484, 7.3900909423828125, 7.733372688293457, 8.076654434204102, 8.41993522644043, 8.763216018676758, 9.106497764587402, 9.44977855682373, 9.793060302734375, 10.136341094970703, 10.479622840881348, 10.822904586791992, 11.16618537902832, 11.509467124938965]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 12.0, 27.0, 26.0, 41.0, 54.0, 102.0, 151.0, 216.0, 302.0, 533.0, 722.0, 1192.0, 1763.0, 2739.0, 4335.0, 6697.0, 10830.0, 17671.0, 29432.0, 51614.0, 93585.0, 189113.0, 464765.0, 1163421.0, 1213545.0, 503527.0, 202421.0, 99707.0, 54058.0, 31453.0, 19023.0, 11303.0, 7055.0, 4554.0, 2789.0, 1924.0, 1146.0, 813.0, 528.0, 345.0, 227.0, 177.0, 119.0, 57.0, 47.0, 44.0, 18.0, 12.0, 20.0, 7.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-13.140625, -12.71728515625, -12.2939453125, -11.87060546875, -11.447265625, -11.02392578125, -10.6005859375, -10.17724609375, -9.75390625, -9.33056640625, -8.9072265625, -8.48388671875, -8.060546875, -7.63720703125, -7.2138671875, -6.79052734375, -6.3671875, -5.94384765625, -5.5205078125, -5.09716796875, -4.673828125, -4.25048828125, -3.8271484375, -3.40380859375, -2.98046875, -2.55712890625, -2.1337890625, -1.71044921875, -1.287109375, -0.86376953125, -0.4404296875, -0.01708984375, 0.40625, 0.82958984375, 1.2529296875, 1.67626953125, 2.099609375, 2.52294921875, 2.9462890625, 3.36962890625, 3.79296875, 4.21630859375, 4.6396484375, 5.06298828125, 5.486328125, 5.90966796875, 6.3330078125, 6.75634765625, 7.1796875, 7.60302734375, 8.0263671875, 8.44970703125, 8.873046875, 9.29638671875, 9.7197265625, 10.14306640625, 10.56640625, 10.98974609375, 11.4130859375, 11.83642578125, 12.259765625, 12.68310546875, 13.1064453125, 13.52978515625, 13.953125]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 6.0, 5.0, 6.0, 7.0, 9.0, 6.0, 12.0, 17.0, 22.0, 22.0, 20.0, 30.0, 34.0, 29.0, 32.0, 41.0, 48.0, 49.0, 46.0, 52.0, 53.0, 40.0, 38.0, 31.0, 41.0, 46.0, 36.0, 34.0, 28.0, 15.0, 23.0, 17.0, 20.0, 18.0, 16.0, 11.0, 13.0, 5.0, 10.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0625, -7.7965087890625, -7.530517578125, -7.2645263671875, -6.99853515625, -6.7325439453125, -6.466552734375, -6.2005615234375, -5.9345703125, -5.6685791015625, -5.402587890625, -5.1365966796875, -4.87060546875, -4.6046142578125, -4.338623046875, -4.0726318359375, -3.806640625, -3.5406494140625, -3.274658203125, -3.0086669921875, -2.74267578125, -2.4766845703125, -2.210693359375, -1.9447021484375, -1.6787109375, -1.4127197265625, -1.146728515625, -0.8807373046875, -0.61474609375, -0.3487548828125, -0.082763671875, 0.1832275390625, 0.44921875, 0.7152099609375, 0.981201171875, 1.2471923828125, 1.51318359375, 1.7791748046875, 2.045166015625, 2.3111572265625, 2.5771484375, 2.8431396484375, 3.109130859375, 3.3751220703125, 3.64111328125, 3.9071044921875, 4.173095703125, 4.4390869140625, 4.705078125, 4.9710693359375, 5.237060546875, 5.5030517578125, 5.76904296875, 6.0350341796875, 6.301025390625, 6.5670166015625, 6.8330078125, 7.0989990234375, 7.364990234375, 7.6309814453125, 7.89697265625, 8.1629638671875, 8.428955078125, 8.6949462890625, 8.9609375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 14.0, 22.0, 45.0, 44.0, 85.0, 107.0, 193.0, 290.0, 452.0, 757.0, 1189.0, 1841.0, 2942.0, 4827.0, 7776.0, 12973.0, 22376.0, 38537.0, 67906.0, 125119.0, 235156.0, 463489.0, 915855.0, 1079565.0, 576475.0, 289165.0, 151946.0, 82862.0, 46184.0, 26588.0, 15604.0, 9105.0, 5548.0, 3468.0, 2120.0, 1373.0, 852.0, 555.0, 326.0, 202.0, 115.0, 87.0, 58.0, 33.0, 26.0, 15.0, 9.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.5208740234375, -11.151123046875, -10.7813720703125, -10.41162109375, -10.0418701171875, -9.672119140625, -9.3023681640625, -8.9326171875, -8.5628662109375, -8.193115234375, -7.8233642578125, -7.45361328125, -7.0838623046875, -6.714111328125, -6.3443603515625, -5.974609375, -5.6048583984375, -5.235107421875, -4.8653564453125, -4.49560546875, -4.1258544921875, -3.756103515625, -3.3863525390625, -3.0166015625, -2.6468505859375, -2.277099609375, -1.9073486328125, -1.53759765625, -1.1678466796875, -0.798095703125, -0.4283447265625, -0.05859375, 0.3111572265625, 0.680908203125, 1.0506591796875, 1.42041015625, 1.7901611328125, 2.159912109375, 2.5296630859375, 2.8994140625, 3.2691650390625, 3.638916015625, 4.0086669921875, 4.37841796875, 4.7481689453125, 5.117919921875, 5.4876708984375, 5.857421875, 6.2271728515625, 6.596923828125, 6.9666748046875, 7.33642578125, 7.7061767578125, 8.075927734375, 8.4456787109375, 8.8154296875, 9.1851806640625, 9.554931640625, 9.9246826171875, 10.29443359375, 10.6641845703125, 11.033935546875, 11.4036865234375, 11.7734375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 8.0, 9.0, 18.0, 13.0, 16.0, 27.0, 17.0, 28.0, 42.0, 42.0, 73.0, 81.0, 94.0, 92.0, 109.0, 140.0, 150.0, 214.0, 216.0, 226.0, 253.0, 261.0, 234.0, 227.0, 219.0, 176.0, 181.0, 155.0, 115.0, 91.0, 81.0, 87.0, 80.0, 70.0, 39.0, 38.0, 23.0, 27.0, 16.0, 15.0, 11.0, 8.0, 10.0, 15.0, 2.0, 8.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.74609375, -3.627227783203125, -3.50836181640625, -3.389495849609375, -3.2706298828125, -3.151763916015625, -3.03289794921875, -2.914031982421875, -2.795166015625, -2.676300048828125, -2.55743408203125, -2.438568115234375, -2.3197021484375, -2.200836181640625, -2.08197021484375, -1.963104248046875, -1.84423828125, -1.725372314453125, -1.60650634765625, -1.487640380859375, -1.3687744140625, -1.249908447265625, -1.13104248046875, -1.012176513671875, -0.893310546875, -0.774444580078125, -0.65557861328125, -0.536712646484375, -0.4178466796875, -0.298980712890625, -0.18011474609375, -0.061248779296875, 0.0576171875, 0.176483154296875, 0.29534912109375, 0.414215087890625, 0.5330810546875, 0.651947021484375, 0.77081298828125, 0.889678955078125, 1.008544921875, 1.127410888671875, 1.24627685546875, 1.365142822265625, 1.4840087890625, 1.602874755859375, 1.72174072265625, 1.840606689453125, 1.95947265625, 2.078338623046875, 2.19720458984375, 2.316070556640625, 2.4349365234375, 2.553802490234375, 2.67266845703125, 2.791534423828125, 2.910400390625, 3.029266357421875, 3.14813232421875, 3.266998291015625, 3.3858642578125, 3.504730224609375, 3.62359619140625, 3.742462158203125, 3.861328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 3.0, 10.0, 7.0, 4.0, 13.0, 14.0, 22.0, 21.0, 25.0, 28.0, 38.0, 39.0, 53.0, 70.0, 62.0, 66.0, 62.0, 64.0, 57.0, 60.0, 60.0, 48.0, 34.0, 21.0, 28.0, 10.0, 11.0, 17.0, 11.0, 6.0, 5.0, 9.0, 1.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.726858139038086, -9.414864540100098, -9.102869987487793, -8.790876388549805, -8.4788818359375, -8.166888236999512, -7.854894161224365, -7.542900085449219, -7.230906009674072, -6.918911933898926, -6.606917858123779, -6.294923782348633, -5.9829301834106445, -5.67093563079834, -5.358942031860352, -5.046947956085205, -4.734953880310059, -4.422959804534912, -4.110965728759766, -3.7989718914031982, -3.4869778156280518, -3.1749837398529053, -2.862989902496338, -2.5509958267211914, -2.239001750946045, -1.9270076751708984, -1.6150137186050415, -1.3030197620391846, -0.9910256862640381, -0.6790316104888916, -0.36703765392303467, -0.055043697357177734, 0.25695133209228516, 0.5689453482627869, 0.8809393644332886, 1.1929333209991455, 1.504927396774292, 1.8169214725494385, 2.128915309906006, 2.4409093856811523, 2.752903461456299, 3.0648975372314453, 3.376891613006592, 3.688885450363159, 4.000879287719727, 4.312873840332031, 4.6248674392700195, 4.936861515045166, 5.2488555908203125, 5.560849666595459, 5.8728437423706055, 6.184837818145752, 6.496831893920898, 6.808825492858887, 7.120819568634033, 7.43281364440918, 7.744807720184326, 8.056801795959473, 8.368795394897461, 8.680789947509766, 8.992783546447754, 9.304778099060059, 9.616771697998047, 9.928766250610352, 10.24075984954834]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 5.0, 5.0, 5.0, 11.0, 12.0, 16.0, 27.0, 13.0, 21.0, 28.0, 27.0, 34.0, 23.0, 34.0, 31.0, 32.0, 38.0, 32.0, 27.0, 38.0, 38.0, 39.0, 36.0, 38.0, 34.0, 38.0, 30.0, 32.0, 26.0, 24.0, 32.0, 24.0, 21.0, 16.0, 15.0, 17.0, 10.0, 14.0, 8.0, 6.0, 8.0, 3.0, 4.0, 4.0, 4.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.376368522644043, -8.120339393615723, -7.864309787750244, -7.608280181884766, -7.352251052856445, -7.096221446990967, -6.840191841125488, -6.584162712097168, -6.3281331062316895, -6.072103500366211, -5.816074371337891, -5.560044765472412, -5.304015159606934, -5.047986030578613, -4.791956424713135, -4.535926818847656, -4.279897689819336, -4.023868083953857, -3.767838954925537, -3.5118093490600586, -3.255779981613159, -2.9997506141662598, -2.7437210083007812, -2.487691640853882, -2.2316622734069824, -1.975632905960083, -1.719603419303894, -1.463573932647705, -1.2075445652008057, -0.9515151977539062, -0.6954857110977173, -0.4394562244415283, -0.1834278106689453, 0.07260161638259888, 0.32863104343414307, 0.5846604704856873, 0.8406898975372314, 1.0967192649841309, 1.3527487516403198, 1.6087782382965088, 1.8648076057434082, 2.1208369731903076, 2.376866340637207, 2.6328959465026855, 2.888925313949585, 3.1449546813964844, 3.400984287261963, 3.6570136547088623, 3.9130430221557617, 4.16907262802124, 4.4251017570495605, 4.681131362915039, 4.937160491943359, 5.193190097808838, 5.449219703674316, 5.705248832702637, 5.961278438568115, 6.217308044433594, 6.473337173461914, 6.729366779327393, 6.985396385192871, 7.241425514221191, 7.49745512008667, 7.753484725952148, 8.009513854980469]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 0.0, 1.0, 7.0, 10.0, 16.0, 30.0, 28.0, 36.0, 52.0, 85.0, 108.0, 205.0, 246.0, 362.0, 525.0, 801.0, 1147.0, 1532.0, 2253.0, 3491.0, 4802.0, 7180.0, 10320.0, 15066.0, 21953.0, 32256.0, 46988.0, 68994.0, 102851.0, 149837.0, 175320.0, 128830.0, 87230.0, 58885.0, 39802.0, 27424.0, 18609.0, 12746.0, 8954.0, 6064.0, 4174.0, 2901.0, 2054.0, 1358.0, 920.0, 652.0, 439.0, 334.0, 193.0, 171.0, 97.0, 71.0, 51.0, 39.0, 19.0, 16.0, 15.0, 3.0, 5.0, 1.0, 6.0, 3.0], "bins": [-3.375, -3.270477294921875, -3.16595458984375, -3.061431884765625, -2.9569091796875, -2.852386474609375, -2.74786376953125, -2.643341064453125, -2.538818359375, -2.434295654296875, -2.32977294921875, -2.225250244140625, -2.1207275390625, -2.016204833984375, -1.91168212890625, -1.807159423828125, -1.70263671875, -1.598114013671875, -1.49359130859375, -1.389068603515625, -1.2845458984375, -1.180023193359375, -1.07550048828125, -0.970977783203125, -0.866455078125, -0.761932373046875, -0.65740966796875, -0.552886962890625, -0.4483642578125, -0.343841552734375, -0.23931884765625, -0.134796142578125, -0.0302734375, 0.074249267578125, 0.17877197265625, 0.283294677734375, 0.3878173828125, 0.492340087890625, 0.59686279296875, 0.701385498046875, 0.805908203125, 0.910430908203125, 1.01495361328125, 1.119476318359375, 1.2239990234375, 1.328521728515625, 1.43304443359375, 1.537567138671875, 1.64208984375, 1.746612548828125, 1.85113525390625, 1.955657958984375, 2.0601806640625, 2.164703369140625, 2.26922607421875, 2.373748779296875, 2.478271484375, 2.582794189453125, 2.68731689453125, 2.791839599609375, 2.8963623046875, 3.000885009765625, 3.10540771484375, 3.209930419921875, 3.314453125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 4.0, 11.0, 5.0, 5.0, 6.0, 18.0, 19.0, 21.0, 22.0, 30.0, 24.0, 28.0, 31.0, 29.0, 23.0, 46.0, 38.0, 27.0, 29.0, 40.0, 35.0, 35.0, 43.0, 36.0, 31.0, 45.0, 33.0, 29.0, 18.0, 29.0, 30.0, 23.0, 20.0, 23.0, 13.0, 15.0, 14.0, 11.0, 11.0, 8.0, 6.0, 6.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0], "bins": [-9.2109375, -8.94677734375, -8.6826171875, -8.41845703125, -8.154296875, -7.89013671875, -7.6259765625, -7.36181640625, -7.09765625, -6.83349609375, -6.5693359375, -6.30517578125, -6.041015625, -5.77685546875, -5.5126953125, -5.24853515625, -4.984375, -4.72021484375, -4.4560546875, -4.19189453125, -3.927734375, -3.66357421875, -3.3994140625, -3.13525390625, -2.87109375, -2.60693359375, -2.3427734375, -2.07861328125, -1.814453125, -1.55029296875, -1.2861328125, -1.02197265625, -0.7578125, -0.49365234375, -0.2294921875, 0.03466796875, 0.298828125, 0.56298828125, 0.8271484375, 1.09130859375, 1.35546875, 1.61962890625, 1.8837890625, 2.14794921875, 2.412109375, 2.67626953125, 2.9404296875, 3.20458984375, 3.46875, 3.73291015625, 3.9970703125, 4.26123046875, 4.525390625, 4.78955078125, 5.0537109375, 5.31787109375, 5.58203125, 5.84619140625, 6.1103515625, 6.37451171875, 6.638671875, 6.90283203125, 7.1669921875, 7.43115234375, 7.6953125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 9.0, 4.0, 16.0, 15.0, 22.0, 39.0, 42.0, 85.0, 105.0, 187.0, 258.0, 443.0, 704.0, 1083.0, 1676.0, 2576.0, 4240.0, 7072.0, 12025.0, 20585.0, 36663.0, 66157.0, 124681.0, 259980.0, 243950.0, 118406.0, 63256.0, 35131.0, 19867.0, 11413.0, 6748.0, 4047.0, 2600.0, 1575.0, 1047.0, 600.0, 455.0, 288.0, 177.0, 115.0, 66.0, 52.0, 26.0, 19.0, 15.0, 11.0, 6.0, 7.0, 3.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.8125, -4.66192626953125, -4.5113525390625, -4.36077880859375, -4.210205078125, -4.05963134765625, -3.9090576171875, -3.75848388671875, -3.60791015625, -3.45733642578125, -3.3067626953125, -3.15618896484375, -3.005615234375, -2.85504150390625, -2.7044677734375, -2.55389404296875, -2.4033203125, -2.25274658203125, -2.1021728515625, -1.95159912109375, -1.801025390625, -1.65045166015625, -1.4998779296875, -1.34930419921875, -1.19873046875, -1.04815673828125, -0.8975830078125, -0.74700927734375, -0.596435546875, -0.44586181640625, -0.2952880859375, -0.14471435546875, 0.005859375, 0.15643310546875, 0.3070068359375, 0.45758056640625, 0.608154296875, 0.75872802734375, 0.9093017578125, 1.05987548828125, 1.21044921875, 1.36102294921875, 1.5115966796875, 1.66217041015625, 1.812744140625, 1.96331787109375, 2.1138916015625, 2.26446533203125, 2.4150390625, 2.56561279296875, 2.7161865234375, 2.86676025390625, 3.017333984375, 3.16790771484375, 3.3184814453125, 3.46905517578125, 3.61962890625, 3.77020263671875, 3.9207763671875, 4.07135009765625, 4.221923828125, 4.37249755859375, 4.5230712890625, 4.67364501953125, 4.82421875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 8.0, 6.0, 7.0, 13.0, 10.0, 8.0, 16.0, 18.0, 9.0, 20.0, 23.0, 22.0, 35.0, 41.0, 34.0, 39.0, 38.0, 38.0, 52.0, 46.0, 60.0, 28.0, 40.0, 41.0, 34.0, 33.0, 36.0, 26.0, 33.0, 25.0, 26.0, 24.0, 15.0, 10.0, 19.0, 16.0, 20.0, 7.0, 9.0, 8.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.59375, -5.40582275390625, -5.2178955078125, -5.02996826171875, -4.842041015625, -4.65411376953125, -4.4661865234375, -4.27825927734375, -4.09033203125, -3.90240478515625, -3.7144775390625, -3.52655029296875, -3.338623046875, -3.15069580078125, -2.9627685546875, -2.77484130859375, -2.5869140625, -2.39898681640625, -2.2110595703125, -2.02313232421875, -1.835205078125, -1.64727783203125, -1.4593505859375, -1.27142333984375, -1.08349609375, -0.89556884765625, -0.7076416015625, -0.51971435546875, -0.331787109375, -0.14385986328125, 0.0440673828125, 0.23199462890625, 0.419921875, 0.60784912109375, 0.7957763671875, 0.98370361328125, 1.171630859375, 1.35955810546875, 1.5474853515625, 1.73541259765625, 1.92333984375, 2.11126708984375, 2.2991943359375, 2.48712158203125, 2.675048828125, 2.86297607421875, 3.0509033203125, 3.23883056640625, 3.4267578125, 3.61468505859375, 3.8026123046875, 3.99053955078125, 4.178466796875, 4.36639404296875, 4.5543212890625, 4.74224853515625, 4.93017578125, 5.11810302734375, 5.3060302734375, 5.49395751953125, 5.681884765625, 5.86981201171875, 6.0577392578125, 6.24566650390625, 6.43359375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 12.0, 25.0, 21.0, 41.0, 62.0, 92.0, 133.0, 219.0, 335.0, 548.0, 1046.0, 1884.0, 3550.0, 7335.0, 15973.0, 38816.0, 114181.0, 465517.0, 274356.0, 73175.0, 27466.0, 11777.0, 5561.0, 2865.0, 1460.0, 816.0, 478.0, 288.0, 182.0, 101.0, 81.0, 55.0, 35.0, 24.0, 12.0, 12.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0687255859375, -0.06649494171142578, -0.06426429748535156, -0.062033653259277344, -0.059803009033203125, -0.057572364807128906, -0.05534172058105469, -0.05311107635498047, -0.05088043212890625, -0.04864978790283203, -0.04641914367675781, -0.044188499450683594, -0.041957855224609375, -0.039727210998535156, -0.03749656677246094, -0.03526592254638672, -0.0330352783203125, -0.03080463409423828, -0.028573989868164062, -0.026343345642089844, -0.024112701416015625, -0.021882057189941406, -0.019651412963867188, -0.01742076873779297, -0.01519012451171875, -0.012959480285644531, -0.010728836059570312, -0.008498191833496094, -0.006267547607421875, -0.004036903381347656, -0.0018062591552734375, 0.00042438507080078125, 0.002655029296875, 0.004885673522949219, 0.0071163177490234375, 0.009346961975097656, 0.011577606201171875, 0.013808250427246094, 0.016038894653320312, 0.01826953887939453, 0.02050018310546875, 0.02273082733154297, 0.024961471557617188, 0.027192115783691406, 0.029422760009765625, 0.031653404235839844, 0.03388404846191406, 0.03611469268798828, 0.0383453369140625, 0.04057598114013672, 0.04280662536621094, 0.045037269592285156, 0.047267913818359375, 0.049498558044433594, 0.05172920227050781, 0.05395984649658203, 0.05619049072265625, 0.05842113494873047, 0.06065177917480469, 0.0628824234008789, 0.06511306762695312, 0.06734371185302734, 0.06957435607910156, 0.07180500030517578, 0.07403564453125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 5.0, 6.0, 5.0, 11.0, 17.0, 20.0, 21.0, 20.0, 39.0, 29.0, 28.0, 50.0, 43.0, 65.0, 79.0, 68.0, 86.0, 58.0, 44.0, 50.0, 39.0, 41.0, 36.0, 19.0, 27.0, 14.0, 12.0, 12.0, 10.0, 4.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.6450881958007812e-05, -1.5966594219207764e-05, -1.5482306480407715e-05, -1.4998018741607666e-05, -1.4513731002807617e-05, -1.4029443264007568e-05, -1.354515552520752e-05, -1.306086778640747e-05, -1.2576580047607422e-05, -1.2092292308807373e-05, -1.1608004570007324e-05, -1.1123716831207275e-05, -1.0639429092407227e-05, -1.0155141353607178e-05, -9.670853614807129e-06, -9.18656587600708e-06, -8.702278137207031e-06, -8.217990398406982e-06, -7.733702659606934e-06, -7.249414920806885e-06, -6.765127182006836e-06, -6.280839443206787e-06, -5.796551704406738e-06, -5.3122639656066895e-06, -4.827976226806641e-06, -4.343688488006592e-06, -3.859400749206543e-06, -3.375113010406494e-06, -2.8908252716064453e-06, -2.4065375328063965e-06, -1.9222497940063477e-06, -1.4379620552062988e-06, -9.5367431640625e-07, -4.6938657760620117e-07, 1.4901161193847656e-08, 4.991888999938965e-07, 9.834766387939453e-07, 1.4677643775939941e-06, 1.952052116394043e-06, 2.436339855194092e-06, 2.9206275939941406e-06, 3.4049153327941895e-06, 3.889203071594238e-06, 4.373490810394287e-06, 4.857778549194336e-06, 5.342066287994385e-06, 5.826354026794434e-06, 6.310641765594482e-06, 6.794929504394531e-06, 7.27921724319458e-06, 7.763504981994629e-06, 8.247792720794678e-06, 8.732080459594727e-06, 9.216368198394775e-06, 9.700655937194824e-06, 1.0184943675994873e-05, 1.0669231414794922e-05, 1.115351915359497e-05, 1.163780689239502e-05, 1.2122094631195068e-05, 1.2606382369995117e-05, 1.3090670108795166e-05, 1.3574957847595215e-05, 1.4059245586395264e-05, 1.4543533325195312e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 7.0, 10.0, 20.0, 23.0, 41.0, 36.0, 50.0, 83.0, 118.0, 156.0, 265.0, 369.0, 574.0, 859.0, 1325.0, 2076.0, 3417.0, 5398.0, 9050.0, 15272.0, 27485.0, 52245.0, 110586.0, 263152.0, 297874.0, 126575.0, 58532.0, 30364.0, 16879.0, 9701.0, 5916.0, 3623.0, 2331.0, 1405.0, 911.0, 591.0, 419.0, 242.0, 179.0, 123.0, 86.0, 66.0, 38.0, 23.0, 18.0, 14.0, 10.0, 5.0, 1.0, 7.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.042327880859375, -0.04092073440551758, -0.039513587951660156, -0.038106441497802734, -0.03669929504394531, -0.03529214859008789, -0.03388500213623047, -0.03247785568237305, -0.031070709228515625, -0.029663562774658203, -0.02825641632080078, -0.02684926986694336, -0.025442123413085938, -0.024034976959228516, -0.022627830505371094, -0.021220684051513672, -0.01981353759765625, -0.018406391143798828, -0.016999244689941406, -0.015592098236083984, -0.014184951782226562, -0.01277780532836914, -0.011370658874511719, -0.009963512420654297, -0.008556365966796875, -0.007149219512939453, -0.005742073059082031, -0.004334926605224609, -0.0029277801513671875, -0.0015206336975097656, -0.00011348724365234375, 0.0012936592102050781, 0.0027008056640625, 0.004107952117919922, 0.005515098571777344, 0.006922245025634766, 0.008329391479492188, 0.00973653793334961, 0.011143684387207031, 0.012550830841064453, 0.013957977294921875, 0.015365123748779297, 0.01677227020263672, 0.01817941665649414, 0.019586563110351562, 0.020993709564208984, 0.022400856018066406, 0.023808002471923828, 0.02521514892578125, 0.026622295379638672, 0.028029441833496094, 0.029436588287353516, 0.030843734741210938, 0.03225088119506836, 0.03365802764892578, 0.0350651741027832, 0.036472320556640625, 0.03787946701049805, 0.03928661346435547, 0.04069375991821289, 0.04210090637207031, 0.043508052825927734, 0.044915199279785156, 0.04632234573364258, 0.0477294921875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 7.0, 3.0, 8.0, 8.0, 13.0, 13.0, 10.0, 11.0, 18.0, 20.0, 16.0, 22.0, 37.0, 32.0, 42.0, 63.0, 56.0, 65.0, 70.0, 71.0, 68.0, 54.0, 60.0, 32.0, 32.0, 20.0, 25.0, 18.0, 15.0, 19.0, 13.0, 13.0, 8.0, 6.0, 7.0, 7.0, 3.0, 4.0, 6.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0138397216796875, -0.013415932655334473, -0.012992143630981445, -0.012568354606628418, -0.01214456558227539, -0.011720776557922363, -0.011296987533569336, -0.010873198509216309, -0.010449409484863281, -0.010025620460510254, -0.009601831436157227, -0.0091780424118042, -0.008754253387451172, -0.008330464363098145, -0.007906675338745117, -0.00748288631439209, -0.0070590972900390625, -0.006635308265686035, -0.006211519241333008, -0.0057877302169799805, -0.005363941192626953, -0.004940152168273926, -0.0045163631439208984, -0.004092574119567871, -0.0036687850952148438, -0.0032449960708618164, -0.002821207046508789, -0.0023974180221557617, -0.0019736289978027344, -0.001549839973449707, -0.0011260509490966797, -0.0007022619247436523, -0.000278472900390625, 0.00014531612396240234, 0.0005691051483154297, 0.000992894172668457, 0.0014166831970214844, 0.0018404722213745117, 0.002264261245727539, 0.0026880502700805664, 0.0031118392944335938, 0.003535628318786621, 0.0039594173431396484, 0.004383206367492676, 0.004806995391845703, 0.0052307844161987305, 0.005654573440551758, 0.006078362464904785, 0.0065021514892578125, 0.00692594051361084, 0.007349729537963867, 0.0077735185623168945, 0.008197307586669922, 0.00862109661102295, 0.009044885635375977, 0.009468674659729004, 0.009892463684082031, 0.010316252708435059, 0.010740041732788086, 0.011163830757141113, 0.01158761978149414, 0.012011408805847168, 0.012435197830200195, 0.012858986854553223, 0.01328277587890625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 9.0, 7.0, 7.0, 10.0, 13.0, 20.0, 28.0, 20.0, 28.0, 37.0, 35.0, 46.0, 63.0, 61.0, 64.0, 61.0, 64.0, 61.0, 61.0, 50.0, 53.0, 38.0, 33.0, 19.0, 22.0, 11.0, 16.0, 11.0, 12.0, 4.0, 2.0, 3.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.415369987487793, -9.116798400878906, -8.818225860595703, -8.519654273986816, -8.221081733703613, -7.922509670257568, -7.623937606811523, -7.325366020202637, -7.026793479919434, -6.728221416473389, -6.429649353027344, -6.131077289581299, -5.832505226135254, -5.533933162689209, -5.235361099243164, -4.936789512634277, -4.638217449188232, -4.3396453857421875, -4.041073322296143, -3.7425012588500977, -3.4439291954040527, -3.145357131958008, -2.846785306930542, -2.548213243484497, -2.249641180038452, -1.9510691165924072, -1.6524970531463623, -1.353925108909607, -1.055353045463562, -0.7567809820175171, -0.4582090377807617, -0.1596369743347168, 0.13893508911132812, 0.43750712275505066, 0.7360791563987732, 1.0346511602401733, 1.3332232236862183, 1.6317952871322632, 1.9303672313690186, 2.2289392948150635, 2.5275113582611084, 2.8260834217071533, 3.1246554851531982, 3.423227310180664, 3.721799373626709, 4.020371437072754, 4.318943500518799, 4.617515563964844, 4.916087627410889, 5.214659690856934, 5.5132317543029785, 5.811803817749023, 6.110375881195068, 6.408947944641113, 6.70751953125, 7.006092071533203, 7.30466365814209, 7.603235721588135, 7.90180778503418, 8.200379371643066, 8.49895191192627, 8.797523498535156, 9.09609603881836, 9.394667625427246, 9.69324016571045]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 4.0, 6.0, 10.0, 13.0, 17.0, 24.0, 14.0, 21.0, 33.0, 21.0, 36.0, 22.0, 31.0, 34.0, 35.0, 37.0, 29.0, 27.0, 42.0, 39.0, 33.0, 40.0, 37.0, 34.0, 33.0, 36.0, 30.0, 23.0, 28.0, 32.0, 22.0, 22.0, 16.0, 14.0, 16.0, 13.0, 13.0, 8.0, 7.0, 7.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.27824592590332, -8.024688720703125, -7.771131992340088, -7.517574787139893, -7.264017581939697, -7.01046085357666, -6.756903648376465, -6.5033464431762695, -6.249789237976074, -5.996232032775879, -5.742675304412842, -5.4891180992126465, -5.235560894012451, -4.982004165649414, -4.728446960449219, -4.474889755249023, -4.221333026885986, -3.96777606010437, -3.714218854904175, -3.4606618881225586, -3.2071046829223633, -2.953547716140747, -2.699990749359131, -2.4464335441589355, -2.1928765773773193, -1.9393194913864136, -1.6857624053955078, -1.4322054386138916, -1.1786483526229858, -0.9250912666320801, -0.6715342998504639, -0.4179772138595581, -0.16441965103149414, 0.08913740515708923, 0.3426944613456726, 0.5962514877319336, 0.8498085737228394, 1.1033656597137451, 1.3569226264953613, 1.610479712486267, 1.8640367984771729, 2.117593765258789, 2.3711509704589844, 2.6247079372406006, 2.878264904022217, 3.131822109222412, 3.3853790760040283, 3.6389360427856445, 3.89249324798584, 4.146050453186035, 4.399607181549072, 4.653164386749268, 4.906721591949463, 5.1602783203125, 5.413835525512695, 5.667392730712891, 5.920949935913086, 6.174507141113281, 6.428063869476318, 6.681621074676514, 6.935178279876709, 7.188735008239746, 7.442292213439941, 7.695849418640137, 7.949406147003174]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 9.0, 8.0, 14.0, 7.0, 27.0, 32.0, 66.0, 91.0, 96.0, 144.0, 238.0, 300.0, 503.0, 731.0, 997.0, 1585.0, 2219.0, 3173.0, 4813.0, 7260.0, 10564.0, 15976.0, 23473.0, 35166.0, 53109.0, 79963.0, 116303.0, 151975.0, 156402.0, 123993.0, 85801.0, 57605.0, 38227.0, 25322.0, 16996.0, 11382.0, 7661.0, 5200.0, 3415.0, 2418.0, 1637.0, 1180.0, 760.0, 565.0, 350.0, 239.0, 176.0, 134.0, 79.0, 62.0, 38.0, 24.0, 16.0, 24.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -10.3740234375, -10.029296875, -9.6845703125, -9.33984375, -8.9951171875, -8.650390625, -8.3056640625, -7.9609375, -7.6162109375, -7.271484375, -6.9267578125, -6.58203125, -6.2373046875, -5.892578125, -5.5478515625, -5.203125, -4.8583984375, -4.513671875, -4.1689453125, -3.82421875, -3.4794921875, -3.134765625, -2.7900390625, -2.4453125, -2.1005859375, -1.755859375, -1.4111328125, -1.06640625, -0.7216796875, -0.376953125, -0.0322265625, 0.3125, 0.6572265625, 1.001953125, 1.3466796875, 1.69140625, 2.0361328125, 2.380859375, 2.7255859375, 3.0703125, 3.4150390625, 3.759765625, 4.1044921875, 4.44921875, 4.7939453125, 5.138671875, 5.4833984375, 5.828125, 6.1728515625, 6.517578125, 6.8623046875, 7.20703125, 7.5517578125, 7.896484375, 8.2412109375, 8.5859375, 8.9306640625, 9.275390625, 9.6201171875, 9.96484375, 10.3095703125, 10.654296875, 10.9990234375, 11.34375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 10.0, 13.0, 15.0, 20.0, 16.0, 14.0, 10.0, 21.0, 26.0, 28.0, 28.0, 22.0, 34.0, 37.0, 36.0, 39.0, 34.0, 36.0, 30.0, 48.0, 38.0, 31.0, 31.0, 24.0, 46.0, 27.0, 26.0, 24.0, 40.0, 29.0, 22.0, 21.0, 13.0, 13.0, 14.0, 9.0, 17.0, 14.0, 6.0, 3.0, 5.0, 6.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.578125, -7.34375, -7.109375, -6.875, -6.640625, -6.40625, -6.171875, -5.9375, -5.703125, -5.46875, -5.234375, -5.0, -4.765625, -4.53125, -4.296875, -4.0625, -3.828125, -3.59375, -3.359375, -3.125, -2.890625, -2.65625, -2.421875, -2.1875, -1.953125, -1.71875, -1.484375, -1.25, -1.015625, -0.78125, -0.546875, -0.3125, -0.078125, 0.15625, 0.390625, 0.625, 0.859375, 1.09375, 1.328125, 1.5625, 1.796875, 2.03125, 2.265625, 2.5, 2.734375, 2.96875, 3.203125, 3.4375, 3.671875, 3.90625, 4.140625, 4.375, 4.609375, 4.84375, 5.078125, 5.3125, 5.546875, 5.78125, 6.015625, 6.25, 6.484375, 6.71875, 6.953125, 7.1875, 7.421875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 12.0, 27.0, 39.0, 48.0, 67.0, 109.0, 165.0, 239.0, 392.0, 585.0, 890.0, 1341.0, 2266.0, 3488.0, 5780.0, 9450.0, 15327.0, 25507.0, 43968.0, 73461.0, 120157.0, 176806.0, 194582.0, 145023.0, 91883.0, 54576.0, 32120.0, 19281.0, 11827.0, 7242.0, 4330.0, 2724.0, 1730.0, 1070.0, 697.0, 441.0, 298.0, 203.0, 152.0, 86.0, 57.0, 36.0, 25.0, 16.0, 9.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.84375, -13.4140625, -12.984375, -12.5546875, -12.125, -11.6953125, -11.265625, -10.8359375, -10.40625, -9.9765625, -9.546875, -9.1171875, -8.6875, -8.2578125, -7.828125, -7.3984375, -6.96875, -6.5390625, -6.109375, -5.6796875, -5.25, -4.8203125, -4.390625, -3.9609375, -3.53125, -3.1015625, -2.671875, -2.2421875, -1.8125, -1.3828125, -0.953125, -0.5234375, -0.09375, 0.3359375, 0.765625, 1.1953125, 1.625, 2.0546875, 2.484375, 2.9140625, 3.34375, 3.7734375, 4.203125, 4.6328125, 5.0625, 5.4921875, 5.921875, 6.3515625, 6.78125, 7.2109375, 7.640625, 8.0703125, 8.5, 8.9296875, 9.359375, 9.7890625, 10.21875, 10.6484375, 11.078125, 11.5078125, 11.9375, 12.3671875, 12.796875, 13.2265625, 13.65625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 6.0, 10.0, 11.0, 10.0, 12.0, 19.0, 19.0, 19.0, 25.0, 32.0, 26.0, 35.0, 31.0, 41.0, 19.0, 41.0, 32.0, 44.0, 44.0, 41.0, 46.0, 43.0, 44.0, 28.0, 36.0, 31.0, 36.0, 33.0, 27.0, 24.0, 24.0, 12.0, 20.0, 9.0, 13.0, 4.0, 4.0, 8.0, 6.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.9815673828125, -4.814697265625, -4.6478271484375, -4.48095703125, -4.3140869140625, -4.147216796875, -3.9803466796875, -3.8134765625, -3.6466064453125, -3.479736328125, -3.3128662109375, -3.14599609375, -2.9791259765625, -2.812255859375, -2.6453857421875, -2.478515625, -2.3116455078125, -2.144775390625, -1.9779052734375, -1.81103515625, -1.6441650390625, -1.477294921875, -1.3104248046875, -1.1435546875, -0.9766845703125, -0.809814453125, -0.6429443359375, -0.47607421875, -0.3092041015625, -0.142333984375, 0.0245361328125, 0.19140625, 0.3582763671875, 0.525146484375, 0.6920166015625, 0.85888671875, 1.0257568359375, 1.192626953125, 1.3594970703125, 1.5263671875, 1.6932373046875, 1.860107421875, 2.0269775390625, 2.19384765625, 2.3607177734375, 2.527587890625, 2.6944580078125, 2.861328125, 3.0281982421875, 3.195068359375, 3.3619384765625, 3.52880859375, 3.6956787109375, 3.862548828125, 4.0294189453125, 4.1962890625, 4.3631591796875, 4.530029296875, 4.6968994140625, 4.86376953125, 5.0306396484375, 5.197509765625, 5.3643798828125, 5.53125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 7.0, 4.0, 6.0, 3.0, 14.0, 19.0, 32.0, 44.0, 58.0, 88.0, 142.0, 198.0, 297.0, 449.0, 695.0, 1081.0, 1809.0, 2763.0, 4538.0, 7446.0, 12833.0, 22741.0, 42992.0, 93394.0, 291004.0, 352117.0, 106238.0, 47553.0, 24713.0, 14048.0, 8097.0, 4900.0, 3059.0, 1851.0, 1158.0, 759.0, 482.0, 303.0, 204.0, 139.0, 91.0, 59.0, 40.0, 29.0, 25.0, 7.0, 10.0, 8.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.0390625, -5.85076904296875, -5.6624755859375, -5.47418212890625, -5.285888671875, -5.09759521484375, -4.9093017578125, -4.72100830078125, -4.53271484375, -4.34442138671875, -4.1561279296875, -3.96783447265625, -3.779541015625, -3.59124755859375, -3.4029541015625, -3.21466064453125, -3.0263671875, -2.83807373046875, -2.6497802734375, -2.46148681640625, -2.273193359375, -2.08489990234375, -1.8966064453125, -1.70831298828125, -1.52001953125, -1.33172607421875, -1.1434326171875, -0.95513916015625, -0.766845703125, -0.57855224609375, -0.3902587890625, -0.20196533203125, -0.013671875, 0.17462158203125, 0.3629150390625, 0.55120849609375, 0.739501953125, 0.92779541015625, 1.1160888671875, 1.30438232421875, 1.49267578125, 1.68096923828125, 1.8692626953125, 2.05755615234375, 2.245849609375, 2.43414306640625, 2.6224365234375, 2.81072998046875, 2.9990234375, 3.18731689453125, 3.3756103515625, 3.56390380859375, 3.752197265625, 3.94049072265625, 4.1287841796875, 4.31707763671875, 4.50537109375, 4.69366455078125, 4.8819580078125, 5.07025146484375, 5.258544921875, 5.44683837890625, 5.6351318359375, 5.82342529296875, 6.01171875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 10.0, 6.0, 5.0, 9.0, 19.0, 17.0, 30.0, 40.0, 56.0, 48.0, 81.0, 112.0, 118.0, 103.0, 95.0, 52.0, 47.0, 27.0, 22.0, 25.0, 17.0, 16.0, 12.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.00040841102600097656, -0.00039785727858543396, -0.00038730353116989136, -0.00037674978375434875, -0.00036619603633880615, -0.00035564228892326355, -0.00034508854150772095, -0.00033453479409217834, -0.00032398104667663574, -0.00031342729926109314, -0.00030287355184555054, -0.00029231980443000793, -0.00028176605701446533, -0.00027121230959892273, -0.0002606585621833801, -0.0002501048147678375, -0.00023955106735229492, -0.00022899731993675232, -0.00021844357252120972, -0.00020788982510566711, -0.0001973360776901245, -0.0001867823302745819, -0.0001762285828590393, -0.0001656748354434967, -0.0001551210880279541, -0.0001445673406124115, -0.0001340135931968689, -0.0001234598457813263, -0.00011290609836578369, -0.00010235235095024109, -9.179860353469849e-05, -8.124485611915588e-05, -7.069110870361328e-05, -6.013736128807068e-05, -4.9583613872528076e-05, -3.9029866456985474e-05, -2.847611904144287e-05, -1.792237162590027e-05, -7.368624210357666e-06, 3.1851232051849365e-06, 1.3738870620727539e-05, 2.429261803627014e-05, 3.4846365451812744e-05, 4.540011286735535e-05, 5.595386028289795e-05, 6.650760769844055e-05, 7.706135511398315e-05, 8.761510252952576e-05, 9.816884994506836e-05, 0.00010872259736061096, 0.00011927634477615356, 0.00012983009219169617, 0.00014038383960723877, 0.00015093758702278137, 0.00016149133443832397, 0.00017204508185386658, 0.00018259882926940918, 0.00019315257668495178, 0.00020370632410049438, 0.000214260071516037, 0.0002248138189315796, 0.0002353675663471222, 0.0002459213137626648, 0.0002564750611782074, 0.00026702880859375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 12.0, 27.0, 39.0, 40.0, 68.0, 99.0, 117.0, 165.0, 220.0, 320.0, 475.0, 672.0, 1035.0, 1533.0, 2407.0, 3807.0, 6028.0, 9937.0, 16951.0, 30147.0, 60186.0, 151420.0, 437100.0, 178522.0, 67272.0, 32915.0, 18218.0, 10535.0, 6494.0, 4011.0, 2636.0, 1586.0, 1121.0, 740.0, 516.0, 324.0, 238.0, 182.0, 127.0, 81.0, 71.0, 50.0, 28.0, 24.0, 18.0, 7.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.60723876953125, -5.4176025390625, -5.22796630859375, -5.038330078125, -4.84869384765625, -4.6590576171875, -4.46942138671875, -4.27978515625, -4.09014892578125, -3.9005126953125, -3.71087646484375, -3.521240234375, -3.33160400390625, -3.1419677734375, -2.95233154296875, -2.7626953125, -2.57305908203125, -2.3834228515625, -2.19378662109375, -2.004150390625, -1.81451416015625, -1.6248779296875, -1.43524169921875, -1.24560546875, -1.05596923828125, -0.8663330078125, -0.67669677734375, -0.487060546875, -0.29742431640625, -0.1077880859375, 0.08184814453125, 0.271484375, 0.46112060546875, 0.6507568359375, 0.84039306640625, 1.030029296875, 1.21966552734375, 1.4093017578125, 1.59893798828125, 1.78857421875, 1.97821044921875, 2.1678466796875, 2.35748291015625, 2.547119140625, 2.73675537109375, 2.9263916015625, 3.11602783203125, 3.3056640625, 3.49530029296875, 3.6849365234375, 3.87457275390625, 4.064208984375, 4.25384521484375, 4.4434814453125, 4.63311767578125, 4.82275390625, 5.01239013671875, 5.2020263671875, 5.39166259765625, 5.581298828125, 5.77093505859375, 5.9605712890625, 6.15020751953125, 6.33984375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 7.0, 9.0, 10.0, 12.0, 18.0, 18.0, 11.0, 23.0, 22.0, 27.0, 40.0, 33.0, 52.0, 78.0, 86.0, 91.0, 70.0, 65.0, 69.0, 47.0, 37.0, 31.0, 33.0, 17.0, 15.0, 18.0, 20.0, 6.0, 6.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.89453125, -1.832183837890625, -1.76983642578125, -1.707489013671875, -1.6451416015625, -1.582794189453125, -1.52044677734375, -1.458099365234375, -1.395751953125, -1.333404541015625, -1.27105712890625, -1.208709716796875, -1.1463623046875, -1.084014892578125, -1.02166748046875, -0.959320068359375, -0.89697265625, -0.834625244140625, -0.77227783203125, -0.709930419921875, -0.6475830078125, -0.585235595703125, -0.52288818359375, -0.460540771484375, -0.398193359375, -0.335845947265625, -0.27349853515625, -0.211151123046875, -0.1488037109375, -0.086456298828125, -0.02410888671875, 0.038238525390625, 0.1005859375, 0.162933349609375, 0.22528076171875, 0.287628173828125, 0.3499755859375, 0.412322998046875, 0.47467041015625, 0.537017822265625, 0.599365234375, 0.661712646484375, 0.72406005859375, 0.786407470703125, 0.8487548828125, 0.911102294921875, 0.97344970703125, 1.035797119140625, 1.09814453125, 1.160491943359375, 1.22283935546875, 1.285186767578125, 1.3475341796875, 1.409881591796875, 1.47222900390625, 1.534576416015625, 1.596923828125, 1.659271240234375, 1.72161865234375, 1.783966064453125, 1.8463134765625, 1.908660888671875, 1.97100830078125, 2.033355712890625, 2.095703125]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 8.0, 12.0, 8.0, 22.0, 21.0, 30.0, 33.0, 33.0, 39.0, 60.0, 69.0, 76.0, 76.0, 82.0, 68.0, 77.0, 48.0, 38.0, 38.0, 22.0, 25.0, 18.0, 12.0, 12.0, 12.0, 2.0, 9.0, 7.0, 9.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.113502502441406, -9.786001205444336, -9.458500862121582, -9.130999565124512, -8.803498268127441, -8.475997924804688, -8.148496627807617, -7.820995330810547, -7.493494510650635, -7.165993690490723, -6.838492393493652, -6.51099157333374, -6.183490753173828, -5.855989456176758, -5.528488636016846, -5.200987815856934, -4.873486518859863, -4.545985698699951, -4.218484401702881, -3.8909835815429688, -3.5634825229644775, -3.2359814643859863, -2.908480644226074, -2.580979585647583, -2.253478527069092, -1.9259774684906006, -1.598476529121399, -1.2709755897521973, -0.943474531173706, -0.6159734725952148, -0.2884725332260132, 0.03902840614318848, 0.3665304183959961, 0.6940314173698425, 1.021532416343689, 1.3490333557128906, 1.6765344142913818, 2.004035472869873, 2.331536293029785, 2.6590373516082764, 2.9865384101867676, 3.314039468765259, 3.64154052734375, 3.969041347503662, 4.296542167663574, 4.6240434646606445, 4.951544284820557, 5.279045104980469, 5.606546401977539, 5.934047222137451, 6.2615485191345215, 6.589049339294434, 6.916550636291504, 7.244051456451416, 7.571552276611328, 7.899053573608398, 8.226554870605469, 8.554056167602539, 8.881556510925293, 9.209057807922363, 9.536559104919434, 9.864059448242188, 10.191560745239258, 10.519062042236328, 10.846562385559082]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 1.0, 1.0, 8.0, 12.0, 5.0, 12.0, 12.0, 13.0, 17.0, 14.0, 25.0, 26.0, 22.0, 36.0, 28.0, 22.0, 38.0, 33.0, 31.0, 37.0, 36.0, 46.0, 41.0, 37.0, 38.0, 33.0, 37.0, 33.0, 31.0, 36.0, 20.0, 25.0, 34.0, 25.0, 17.0, 21.0, 21.0, 5.0, 6.0, 12.0, 12.0, 11.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-8.707417488098145, -8.438820838928223, -8.170225143432617, -7.901628494262695, -7.633031845092773, -7.36443567276001, -7.095839500427246, -6.827242851257324, -6.558646202087402, -6.290050029754639, -6.021453380584717, -5.752857208251953, -5.484260559082031, -5.215664386749268, -4.947068214416504, -4.678471565246582, -4.409875392913818, -4.141279220581055, -3.872682571411133, -3.604086399078369, -3.3354897499084473, -3.0668935775756836, -2.798297166824341, -2.529700756072998, -2.2611043453216553, -1.9925079345703125, -1.7239115238189697, -1.4553152322769165, -1.1867188215255737, -0.918122410774231, -0.6495261192321777, -0.38092970848083496, -0.11233329772949219, 0.1562630832195282, 0.4248594641685486, 0.6934558153152466, 0.9620522260665894, 1.2306486368179321, 1.4992449283599854, 1.7678413391113281, 2.036437749862671, 2.3050341606140137, 2.5736305713653564, 2.842226982116699, 3.110823154449463, 3.3794198036193848, 3.6480159759521484, 3.916612386703491, 4.185208797454834, 4.453804969787598, 4.7224016189575195, 4.990997791290283, 5.259594440460205, 5.528190612792969, 5.796787261962891, 6.065383434295654, 6.333979606628418, 6.602575778961182, 6.8711724281311035, 7.139768600463867, 7.408365249633789, 7.676961421966553, 7.945557594299316, 8.214154243469238, 8.48275089263916]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 11.0, 9.0, 20.0, 33.0, 46.0, 65.0, 117.0, 170.0, 314.0, 495.0, 842.0, 1516.0, 2818.0, 5258.0, 9902.0, 19654.0, 39102.0, 79592.0, 173563.0, 468321.0, 1377439.0, 1287620.0, 414042.0, 159702.0, 74092.0, 37187.0, 19242.0, 10226.0, 5677.0, 3060.0, 1716.0, 1008.0, 572.0, 338.0, 190.0, 123.0, 89.0, 40.0, 23.0, 18.0, 12.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-17.484375, -17.01123046875, -16.5380859375, -16.06494140625, -15.591796875, -15.11865234375, -14.6455078125, -14.17236328125, -13.69921875, -13.22607421875, -12.7529296875, -12.27978515625, -11.806640625, -11.33349609375, -10.8603515625, -10.38720703125, -9.9140625, -9.44091796875, -8.9677734375, -8.49462890625, -8.021484375, -7.54833984375, -7.0751953125, -6.60205078125, -6.12890625, -5.65576171875, -5.1826171875, -4.70947265625, -4.236328125, -3.76318359375, -3.2900390625, -2.81689453125, -2.34375, -1.87060546875, -1.3974609375, -0.92431640625, -0.451171875, 0.02197265625, 0.4951171875, 0.96826171875, 1.44140625, 1.91455078125, 2.3876953125, 2.86083984375, 3.333984375, 3.80712890625, 4.2802734375, 4.75341796875, 5.2265625, 5.69970703125, 6.1728515625, 6.64599609375, 7.119140625, 7.59228515625, 8.0654296875, 8.53857421875, 9.01171875, 9.48486328125, 9.9580078125, 10.43115234375, 10.904296875, 11.37744140625, 11.8505859375, 12.32373046875, 12.796875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 8.0, 9.0, 7.0, 13.0, 19.0, 13.0, 12.0, 20.0, 25.0, 31.0, 34.0, 35.0, 22.0, 34.0, 37.0, 39.0, 33.0, 36.0, 37.0, 56.0, 45.0, 34.0, 36.0, 32.0, 47.0, 32.0, 32.0, 36.0, 24.0, 29.0, 16.0, 12.0, 22.0, 11.0, 8.0, 9.0, 9.0, 7.0, 11.0, 4.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-7.41015625, -7.18011474609375, -6.9500732421875, -6.72003173828125, -6.489990234375, -6.25994873046875, -6.0299072265625, -5.79986572265625, -5.56982421875, -5.33978271484375, -5.1097412109375, -4.87969970703125, -4.649658203125, -4.41961669921875, -4.1895751953125, -3.95953369140625, -3.7294921875, -3.49945068359375, -3.2694091796875, -3.03936767578125, -2.809326171875, -2.57928466796875, -2.3492431640625, -2.11920166015625, -1.88916015625, -1.65911865234375, -1.4290771484375, -1.19903564453125, -0.968994140625, -0.73895263671875, -0.5089111328125, -0.27886962890625, -0.048828125, 0.18121337890625, 0.4112548828125, 0.64129638671875, 0.871337890625, 1.10137939453125, 1.3314208984375, 1.56146240234375, 1.79150390625, 2.02154541015625, 2.2515869140625, 2.48162841796875, 2.711669921875, 2.94171142578125, 3.1717529296875, 3.40179443359375, 3.6318359375, 3.86187744140625, 4.0919189453125, 4.32196044921875, 4.552001953125, 4.78204345703125, 5.0120849609375, 5.24212646484375, 5.47216796875, 5.70220947265625, 5.9322509765625, 6.16229248046875, 6.392333984375, 6.62237548828125, 6.8524169921875, 7.08245849609375, 7.3125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 9.0, 11.0, 14.0, 21.0, 29.0, 46.0, 78.0, 98.0, 176.0, 249.0, 344.0, 548.0, 793.0, 1254.0, 1908.0, 2853.0, 4750.0, 7403.0, 12412.0, 19974.0, 33909.0, 58471.0, 104217.0, 192974.0, 370690.0, 724646.0, 1106036.0, 730562.0, 373508.0, 195060.0, 104817.0, 58753.0, 34025.0, 20137.0, 12483.0, 7555.0, 4847.0, 2983.0, 1839.0, 1252.0, 850.0, 579.0, 373.0, 236.0, 181.0, 108.0, 78.0, 45.0, 34.0, 28.0, 11.0, 12.0, 9.0, 7.0, 1.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.2459716796875, -8.921630859375, -8.5972900390625, -8.27294921875, -7.9486083984375, -7.624267578125, -7.2999267578125, -6.9755859375, -6.6512451171875, -6.326904296875, -6.0025634765625, -5.67822265625, -5.3538818359375, -5.029541015625, -4.7052001953125, -4.380859375, -4.0565185546875, -3.732177734375, -3.4078369140625, -3.08349609375, -2.7591552734375, -2.434814453125, -2.1104736328125, -1.7861328125, -1.4617919921875, -1.137451171875, -0.8131103515625, -0.48876953125, -0.1644287109375, 0.159912109375, 0.4842529296875, 0.80859375, 1.1329345703125, 1.457275390625, 1.7816162109375, 2.10595703125, 2.4302978515625, 2.754638671875, 3.0789794921875, 3.4033203125, 3.7276611328125, 4.052001953125, 4.3763427734375, 4.70068359375, 5.0250244140625, 5.349365234375, 5.6737060546875, 5.998046875, 6.3223876953125, 6.646728515625, 6.9710693359375, 7.29541015625, 7.6197509765625, 7.944091796875, 8.2684326171875, 8.5927734375, 8.9171142578125, 9.241455078125, 9.5657958984375, 9.89013671875, 10.2144775390625, 10.538818359375, 10.8631591796875, 11.1875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 3.0, 6.0, 12.0, 21.0, 22.0, 24.0, 36.0, 44.0, 50.0, 47.0, 65.0, 88.0, 112.0, 115.0, 168.0, 161.0, 225.0, 234.0, 251.0, 278.0, 284.0, 245.0, 263.0, 219.0, 211.0, 151.0, 130.0, 115.0, 85.0, 63.0, 80.0, 51.0, 35.0, 37.0, 23.0, 26.0, 25.0, 14.0, 10.0, 3.0, 4.0, 9.0, 10.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8125, -3.6898193359375, -3.567138671875, -3.4444580078125, -3.32177734375, -3.1990966796875, -3.076416015625, -2.9537353515625, -2.8310546875, -2.7083740234375, -2.585693359375, -2.4630126953125, -2.34033203125, -2.2176513671875, -2.094970703125, -1.9722900390625, -1.849609375, -1.7269287109375, -1.604248046875, -1.4815673828125, -1.35888671875, -1.2362060546875, -1.113525390625, -0.9908447265625, -0.8681640625, -0.7454833984375, -0.622802734375, -0.5001220703125, -0.37744140625, -0.2547607421875, -0.132080078125, -0.0093994140625, 0.11328125, 0.2359619140625, 0.358642578125, 0.4813232421875, 0.60400390625, 0.7266845703125, 0.849365234375, 0.9720458984375, 1.0947265625, 1.2174072265625, 1.340087890625, 1.4627685546875, 1.58544921875, 1.7081298828125, 1.830810546875, 1.9534912109375, 2.076171875, 2.1988525390625, 2.321533203125, 2.4442138671875, 2.56689453125, 2.6895751953125, 2.812255859375, 2.9349365234375, 3.0576171875, 3.1802978515625, 3.302978515625, 3.4256591796875, 3.54833984375, 3.6710205078125, 3.793701171875, 3.9163818359375, 4.0390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 5.0, 8.0, 8.0, 12.0, 15.0, 15.0, 22.0, 26.0, 38.0, 43.0, 59.0, 75.0, 81.0, 66.0, 82.0, 86.0, 64.0, 67.0, 48.0, 26.0, 34.0, 17.0, 23.0, 24.0, 10.0, 6.0, 8.0, 4.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.445117950439453, -8.123140335083008, -7.8011627197265625, -7.479185104370117, -7.157207489013672, -6.835229873657227, -6.5132527351379395, -6.191275119781494, -5.869297504425049, -5.5473198890686035, -5.225342273712158, -4.903364658355713, -4.581387519836426, -4.2594099044799805, -3.937432289123535, -3.61545467376709, -3.2934770584106445, -2.971499443054199, -2.649521827697754, -2.3275444507598877, -2.0055668354034424, -1.683589220046997, -1.3616117238998413, -1.0396342277526855, -0.7176566123962402, -0.3956790566444397, -0.07370150089263916, 0.24827605485916138, 0.5702536106109619, 0.8922312259674072, 1.214208722114563, 1.5361862182617188, 1.8581628799438477, 2.180140495300293, 2.5021181106567383, 2.8240954875946045, 3.14607310295105, 3.468050718307495, 3.7900280952453613, 4.112005710601807, 4.433983325958252, 4.755960941314697, 5.077938556671143, 5.399916172027588, 5.721893310546875, 6.04387092590332, 6.365848541259766, 6.687826156616211, 7.009803771972656, 7.331781387329102, 7.653759002685547, 7.975736618041992, 8.297714233398438, 8.619691848754883, 8.941669464111328, 9.263647079467773, 9.585624694824219, 9.907602310180664, 10.22957992553711, 10.551557540893555, 10.87353515625, 11.195512771606445, 11.51749038696289, 11.839468002319336, 12.161444664001465]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 11.0, 11.0, 10.0, 20.0, 19.0, 18.0, 33.0, 20.0, 20.0, 21.0, 35.0, 32.0, 28.0, 36.0, 27.0, 37.0, 45.0, 33.0, 50.0, 35.0, 48.0, 47.0, 38.0, 26.0, 38.0, 26.0, 37.0, 29.0, 21.0, 20.0, 21.0, 16.0, 16.0, 9.0, 14.0, 3.0, 13.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-9.554946899414062, -9.291632652282715, -9.028319358825684, -8.765005111694336, -8.501691818237305, -8.238377571105957, -7.975064277648926, -7.711750030517578, -7.448436737060547, -7.185122966766357, -6.921809196472168, -6.6584954261779785, -6.395181655883789, -6.1318678855896, -5.86855411529541, -5.6052398681640625, -5.341926097869873, -5.078612327575684, -4.815298557281494, -4.551984786987305, -4.288671016693115, -4.025357246398926, -3.7620432376861572, -3.4987294673919678, -3.2354156970977783, -2.972101926803589, -2.7087881565093994, -2.445474147796631, -2.1821603775024414, -1.9188467264175415, -1.6555328369140625, -1.392219066619873, -1.1289057731628418, -0.8655920028686523, -0.6022781729698181, -0.3389643430709839, -0.07565057277679443, 0.18766319751739502, 0.450977087020874, 0.7142908573150635, 0.9776046276092529, 1.2409183979034424, 1.5042321681976318, 1.7675460577011108, 2.03085994720459, 2.2941737174987793, 2.5574874877929688, 2.820801258087158, 3.0841150283813477, 3.347428798675537, 3.6107425689697266, 3.874056339263916, 4.1373701095581055, 4.400683879852295, 4.663997650146484, 4.927311897277832, 5.190625190734863, 5.453938961029053, 5.717252731323242, 5.980566501617432, 6.243880271911621, 6.5071940422058105, 6.7705078125, 7.033822059631348, 7.297135829925537]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 10.0, 7.0, 18.0, 24.0, 45.0, 52.0, 65.0, 121.0, 140.0, 262.0, 377.0, 599.0, 875.0, 1348.0, 2128.0, 3262.0, 5177.0, 8020.0, 12682.0, 20317.0, 32748.0, 52330.0, 81922.0, 128933.0, 196162.0, 181725.0, 118580.0, 74197.0, 46820.0, 29184.0, 18541.0, 11544.0, 7294.0, 4542.0, 2996.0, 1863.0, 1254.0, 829.0, 526.0, 357.0, 215.0, 165.0, 104.0, 63.0, 42.0, 33.0, 22.0, 8.0, 9.0, 7.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.375, -3.2657470703125, -3.156494140625, -3.0472412109375, -2.93798828125, -2.8287353515625, -2.719482421875, -2.6102294921875, -2.5009765625, -2.3917236328125, -2.282470703125, -2.1732177734375, -2.06396484375, -1.9547119140625, -1.845458984375, -1.7362060546875, -1.626953125, -1.5177001953125, -1.408447265625, -1.2991943359375, -1.18994140625, -1.0806884765625, -0.971435546875, -0.8621826171875, -0.7529296875, -0.6436767578125, -0.534423828125, -0.4251708984375, -0.31591796875, -0.2066650390625, -0.097412109375, 0.0118408203125, 0.12109375, 0.2303466796875, 0.339599609375, 0.4488525390625, 0.55810546875, 0.6673583984375, 0.776611328125, 0.8858642578125, 0.9951171875, 1.1043701171875, 1.213623046875, 1.3228759765625, 1.43212890625, 1.5413818359375, 1.650634765625, 1.7598876953125, 1.869140625, 1.9783935546875, 2.087646484375, 2.1968994140625, 2.30615234375, 2.4154052734375, 2.524658203125, 2.6339111328125, 2.7431640625, 2.8524169921875, 2.961669921875, 3.0709228515625, 3.18017578125, 3.2894287109375, 3.398681640625, 3.5079345703125, 3.6171875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 7.0, 11.0, 10.0, 12.0, 17.0, 24.0, 24.0, 21.0, 28.0, 24.0, 33.0, 31.0, 27.0, 45.0, 44.0, 37.0, 30.0, 42.0, 46.0, 45.0, 44.0, 36.0, 36.0, 31.0, 38.0, 38.0, 26.0, 22.0, 29.0, 19.0, 22.0, 23.0, 14.0, 13.0, 7.0, 7.0, 6.0, 4.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.6953125, -9.41943359375, -9.1435546875, -8.86767578125, -8.591796875, -8.31591796875, -8.0400390625, -7.76416015625, -7.48828125, -7.21240234375, -6.9365234375, -6.66064453125, -6.384765625, -6.10888671875, -5.8330078125, -5.55712890625, -5.28125, -5.00537109375, -4.7294921875, -4.45361328125, -4.177734375, -3.90185546875, -3.6259765625, -3.35009765625, -3.07421875, -2.79833984375, -2.5224609375, -2.24658203125, -1.970703125, -1.69482421875, -1.4189453125, -1.14306640625, -0.8671875, -0.59130859375, -0.3154296875, -0.03955078125, 0.236328125, 0.51220703125, 0.7880859375, 1.06396484375, 1.33984375, 1.61572265625, 1.8916015625, 2.16748046875, 2.443359375, 2.71923828125, 2.9951171875, 3.27099609375, 3.546875, 3.82275390625, 4.0986328125, 4.37451171875, 4.650390625, 4.92626953125, 5.2021484375, 5.47802734375, 5.75390625, 6.02978515625, 6.3056640625, 6.58154296875, 6.857421875, 7.13330078125, 7.4091796875, 7.68505859375, 7.9609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 20.0, 21.0, 25.0, 40.0, 65.0, 73.0, 167.0, 287.0, 486.0, 770.0, 1339.0, 2361.0, 4168.0, 7603.0, 13820.0, 26788.0, 53413.0, 111860.0, 253872.0, 309624.0, 131641.0, 62657.0, 31191.0, 16475.0, 8564.0, 4752.0, 2720.0, 1495.0, 933.0, 527.0, 303.0, 183.0, 112.0, 69.0, 40.0, 23.0, 16.0, 18.0, 9.0, 5.0, 4.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.53125, -5.36419677734375, -5.1971435546875, -5.03009033203125, -4.863037109375, -4.69598388671875, -4.5289306640625, -4.36187744140625, -4.19482421875, -4.02777099609375, -3.8607177734375, -3.69366455078125, -3.526611328125, -3.35955810546875, -3.1925048828125, -3.02545166015625, -2.8583984375, -2.69134521484375, -2.5242919921875, -2.35723876953125, -2.190185546875, -2.02313232421875, -1.8560791015625, -1.68902587890625, -1.52197265625, -1.35491943359375, -1.1878662109375, -1.02081298828125, -0.853759765625, -0.68670654296875, -0.5196533203125, -0.35260009765625, -0.185546875, -0.01849365234375, 0.1485595703125, 0.31561279296875, 0.482666015625, 0.64971923828125, 0.8167724609375, 0.98382568359375, 1.15087890625, 1.31793212890625, 1.4849853515625, 1.65203857421875, 1.819091796875, 1.98614501953125, 2.1531982421875, 2.32025146484375, 2.4873046875, 2.65435791015625, 2.8214111328125, 2.98846435546875, 3.155517578125, 3.32257080078125, 3.4896240234375, 3.65667724609375, 3.82373046875, 3.99078369140625, 4.1578369140625, 4.32489013671875, 4.491943359375, 4.65899658203125, 4.8260498046875, 4.99310302734375, 5.16015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 5.0, 2.0, 9.0, 5.0, 10.0, 13.0, 10.0, 15.0, 14.0, 20.0, 11.0, 23.0, 28.0, 32.0, 32.0, 30.0, 39.0, 34.0, 41.0, 37.0, 32.0, 48.0, 43.0, 47.0, 39.0, 44.0, 28.0, 31.0, 32.0, 20.0, 33.0, 25.0, 21.0, 20.0, 19.0, 19.0, 19.0, 11.0, 9.0, 10.0, 13.0, 4.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.75390625, -5.5858154296875, -5.417724609375, -5.2496337890625, -5.08154296875, -4.9134521484375, -4.745361328125, -4.5772705078125, -4.4091796875, -4.2410888671875, -4.072998046875, -3.9049072265625, -3.73681640625, -3.5687255859375, -3.400634765625, -3.2325439453125, -3.064453125, -2.8963623046875, -2.728271484375, -2.5601806640625, -2.39208984375, -2.2239990234375, -2.055908203125, -1.8878173828125, -1.7197265625, -1.5516357421875, -1.383544921875, -1.2154541015625, -1.04736328125, -0.8792724609375, -0.711181640625, -0.5430908203125, -0.375, -0.2069091796875, -0.038818359375, 0.1292724609375, 0.29736328125, 0.4654541015625, 0.633544921875, 0.8016357421875, 0.9697265625, 1.1378173828125, 1.305908203125, 1.4739990234375, 1.64208984375, 1.8101806640625, 1.978271484375, 2.1463623046875, 2.314453125, 2.4825439453125, 2.650634765625, 2.8187255859375, 2.98681640625, 3.1549072265625, 3.322998046875, 3.4910888671875, 3.6591796875, 3.8272705078125, 3.995361328125, 4.1634521484375, 4.33154296875, 4.4996337890625, 4.667724609375, 4.8358154296875, 5.00390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 8.0, 10.0, 20.0, 32.0, 35.0, 46.0, 92.0, 158.0, 241.0, 491.0, 1012.0, 2210.0, 5745.0, 18613.0, 78034.0, 546464.0, 322998.0, 51184.0, 13391.0, 4272.0, 1703.0, 793.0, 391.0, 228.0, 130.0, 93.0, 41.0, 32.0, 27.0, 10.0, 15.0, 10.0, 7.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0726318359375, -0.07002544403076172, -0.06741905212402344, -0.06481266021728516, -0.062206268310546875, -0.059599876403808594, -0.05699348449707031, -0.05438709259033203, -0.05178070068359375, -0.04917430877685547, -0.04656791687011719, -0.043961524963378906, -0.041355133056640625, -0.038748741149902344, -0.03614234924316406, -0.03353595733642578, -0.0309295654296875, -0.02832317352294922, -0.025716781616210938, -0.023110389709472656, -0.020503997802734375, -0.017897605895996094, -0.015291213989257812, -0.012684822082519531, -0.01007843017578125, -0.007472038269042969, -0.0048656463623046875, -0.0022592544555664062, 0.000347137451171875, 0.0029535293579101562, 0.0055599212646484375, 0.008166313171386719, 0.010772705078125, 0.013379096984863281, 0.015985488891601562, 0.018591880798339844, 0.021198272705078125, 0.023804664611816406, 0.026411056518554688, 0.02901744842529297, 0.03162384033203125, 0.03423023223876953, 0.03683662414550781, 0.039443016052246094, 0.042049407958984375, 0.044655799865722656, 0.04726219177246094, 0.04986858367919922, 0.0524749755859375, 0.05508136749267578, 0.05768775939941406, 0.060294151306152344, 0.06290054321289062, 0.0655069351196289, 0.06811332702636719, 0.07071971893310547, 0.07332611083984375, 0.07593250274658203, 0.07853889465332031, 0.0811452865600586, 0.08375167846679688, 0.08635807037353516, 0.08896446228027344, 0.09157085418701172, 0.09417724609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 7.0, 2.0, 4.0, 7.0, 10.0, 15.0, 17.0, 23.0, 18.0, 33.0, 36.0, 43.0, 53.0, 69.0, 76.0, 67.0, 81.0, 82.0, 44.0, 61.0, 32.0, 43.0, 34.0, 28.0, 26.0, 22.0, 12.0, 7.0, 12.0, 2.0, 6.0, 5.0, 8.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3947486877441406e-05, -1.34957954287529e-05, -1.3044103980064392e-05, -1.2592412531375885e-05, -1.2140721082687378e-05, -1.1689029633998871e-05, -1.1237338185310364e-05, -1.0785646736621857e-05, -1.033395528793335e-05, -9.882263839244843e-06, -9.430572390556335e-06, -8.978880941867828e-06, -8.527189493179321e-06, -8.075498044490814e-06, -7.623806595802307e-06, -7.1721151471138e-06, -6.720423698425293e-06, -6.268732249736786e-06, -5.817040801048279e-06, -5.365349352359772e-06, -4.913657903671265e-06, -4.4619664549827576e-06, -4.0102750062942505e-06, -3.5585835576057434e-06, -3.1068921089172363e-06, -2.6552006602287292e-06, -2.203509211540222e-06, -1.751817762851715e-06, -1.300126314163208e-06, -8.484348654747009e-07, -3.9674341678619385e-07, 5.494803190231323e-08, 5.066394805908203e-07, 9.583309292793274e-07, 1.4100223779678345e-06, 1.8617138266563416e-06, 2.3134052753448486e-06, 2.7650967240333557e-06, 3.216788172721863e-06, 3.66847962141037e-06, 4.120171070098877e-06, 4.571862518787384e-06, 5.023553967475891e-06, 5.475245416164398e-06, 5.926936864852905e-06, 6.378628313541412e-06, 6.8303197622299194e-06, 7.2820112109184265e-06, 7.733702659606934e-06, 8.18539410829544e-06, 8.637085556983948e-06, 9.088777005672455e-06, 9.540468454360962e-06, 9.992159903049469e-06, 1.0443851351737976e-05, 1.0895542800426483e-05, 1.134723424911499e-05, 1.1798925697803497e-05, 1.2250617146492004e-05, 1.2702308595180511e-05, 1.3154000043869019e-05, 1.3605691492557526e-05, 1.4057382941246033e-05, 1.450907438993454e-05, 1.4960765838623047e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 16.0, 6.0, 17.0, 14.0, 28.0, 42.0, 58.0, 79.0, 118.0, 162.0, 173.0, 282.0, 393.0, 613.0, 839.0, 1390.0, 2157.0, 3535.0, 6089.0, 10782.0, 20236.0, 39262.0, 86635.0, 217567.0, 356179.0, 162899.0, 67450.0, 31920.0, 16544.0, 9026.0, 5268.0, 3087.0, 1870.0, 1286.0, 783.0, 527.0, 315.0, 260.0, 191.0, 131.0, 87.0, 64.0, 50.0, 42.0, 29.0, 24.0, 6.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.038299560546875, -0.037077903747558594, -0.03585624694824219, -0.03463459014892578, -0.033412933349609375, -0.03219127655029297, -0.030969619750976562, -0.029747962951660156, -0.02852630615234375, -0.027304649353027344, -0.026082992553710938, -0.02486133575439453, -0.023639678955078125, -0.02241802215576172, -0.021196365356445312, -0.019974708557128906, -0.0187530517578125, -0.017531394958496094, -0.016309738159179688, -0.015088081359863281, -0.013866424560546875, -0.012644767761230469, -0.011423110961914062, -0.010201454162597656, -0.00897979736328125, -0.007758140563964844, -0.0065364837646484375, -0.005314826965332031, -0.004093170166015625, -0.0028715133666992188, -0.0016498565673828125, -0.00042819976806640625, 0.00079345703125, 0.0020151138305664062, 0.0032367706298828125, 0.004458427429199219, 0.005680084228515625, 0.006901741027832031, 0.008123397827148438, 0.009345054626464844, 0.01056671142578125, 0.011788368225097656, 0.013010025024414062, 0.014231681823730469, 0.015453338623046875, 0.01667499542236328, 0.017896652221679688, 0.019118309020996094, 0.0203399658203125, 0.021561622619628906, 0.022783279418945312, 0.02400493621826172, 0.025226593017578125, 0.02644824981689453, 0.027669906616210938, 0.028891563415527344, 0.03011322021484375, 0.031334877014160156, 0.03255653381347656, 0.03377819061279297, 0.034999847412109375, 0.03622150421142578, 0.03744316101074219, 0.038664817810058594, 0.039886474609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 11.0, 8.0, 18.0, 24.0, 34.0, 47.0, 75.0, 80.0, 132.0, 138.0, 103.0, 99.0, 61.0, 46.0, 33.0, 17.0, 14.0, 17.0, 6.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017608642578125, -0.01714909076690674, -0.016689538955688477, -0.016229987144470215, -0.015770435333251953, -0.015310883522033691, -0.01485133171081543, -0.014391779899597168, -0.013932228088378906, -0.013472676277160645, -0.013013124465942383, -0.012553572654724121, -0.01209402084350586, -0.011634469032287598, -0.011174917221069336, -0.010715365409851074, -0.010255813598632812, -0.00979626178741455, -0.009336709976196289, -0.008877158164978027, -0.008417606353759766, -0.007958054542541504, -0.007498502731323242, -0.0070389509201049805, -0.006579399108886719, -0.006119847297668457, -0.005660295486450195, -0.005200743675231934, -0.004741191864013672, -0.00428164005279541, -0.0038220882415771484, -0.0033625364303588867, -0.002902984619140625, -0.0024434328079223633, -0.0019838809967041016, -0.0015243291854858398, -0.0010647773742675781, -0.0006052255630493164, -0.0001456737518310547, 0.00031387805938720703, 0.0007734298706054688, 0.0012329816818237305, 0.0016925334930419922, 0.002152085304260254, 0.0026116371154785156, 0.0030711889266967773, 0.003530740737915039, 0.003990292549133301, 0.0044498443603515625, 0.004909396171569824, 0.005368947982788086, 0.005828499794006348, 0.006288051605224609, 0.006747603416442871, 0.007207155227661133, 0.0076667070388793945, 0.008126258850097656, 0.008585810661315918, 0.00904536247253418, 0.009504914283752441, 0.009964466094970703, 0.010424017906188965, 0.010883569717407227, 0.011343121528625488, 0.01180267333984375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 6.0, 16.0, 14.0, 17.0, 26.0, 22.0, 49.0, 45.0, 70.0, 78.0, 77.0, 76.0, 90.0, 70.0, 69.0, 58.0, 39.0, 32.0, 28.0, 12.0, 28.0, 12.0, 10.0, 7.0, 7.0, 3.0, 4.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.41744327545166, -8.091218948364258, -7.764993667602539, -7.4387688636779785, -7.112544059753418, -6.786319732666016, -6.460094928741455, -6.1338701248168945, -5.807645320892334, -5.481420516967773, -5.155195713043213, -4.828970909118652, -4.50274658203125, -4.176521301269531, -3.850296974182129, -3.5240721702575684, -3.197847366333008, -2.8716225624084473, -2.5453977584838867, -2.2191731929779053, -1.8929483890533447, -1.5667235851287842, -1.2404989004135132, -0.9142742156982422, -0.5880494117736816, -0.26182466745376587, 0.0644000768661499, 0.3906248211860657, 0.7168495655059814, 1.043074369430542, 1.369299054145813, 1.695523738861084, 2.0217485427856445, 2.347973346710205, 2.6741981506347656, 3.000422716140747, 3.3266475200653076, 3.652872323989868, 3.9790968894958496, 4.30532169342041, 4.631546497344971, 4.957771301269531, 5.283996105194092, 5.610220909118652, 5.936445236206055, 6.262670516967773, 6.588894844055176, 6.915119647979736, 7.241344451904297, 7.567569255828857, 7.893794059753418, 8.22001838684082, 8.546243667602539, 8.872467994689941, 9.19869327545166, 9.524917602539062, 9.851142883300781, 10.177367210388184, 10.503592491149902, 10.829816818237305, 11.156042098999023, 11.482266426086426, 11.808491706848145, 12.134716033935547, 12.46094036102295]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 11.0, 11.0, 10.0, 19.0, 21.0, 14.0, 33.0, 23.0, 21.0, 20.0, 34.0, 32.0, 28.0, 36.0, 28.0, 38.0, 42.0, 35.0, 48.0, 36.0, 46.0, 52.0, 36.0, 25.0, 37.0, 28.0, 37.0, 28.0, 22.0, 17.0, 23.0, 18.0, 14.0, 9.0, 14.0, 4.0, 12.0, 7.0, 7.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-9.485343933105469, -9.223915100097656, -8.962486267089844, -8.701057434082031, -8.439628601074219, -8.178199768066406, -7.916771411895752, -7.6553425788879395, -7.393913745880127, -7.1324849128723145, -6.871056079864502, -6.6096272468566895, -6.348198890686035, -6.086770057678223, -5.82534122467041, -5.563912391662598, -5.302483558654785, -5.041054725646973, -4.77962589263916, -4.518197059631348, -4.256768226623535, -3.9953396320343018, -3.7339110374450684, -3.472482204437256, -3.2110533714294434, -2.949624538421631, -2.6881957054138184, -2.426767110824585, -2.1653382778167725, -1.90390944480896, -1.642480731010437, -1.381052017211914, -1.1196231842041016, -0.8581944108009338, -0.5967656373977661, -0.3353368639945984, -0.07390809059143066, 0.18752074241638184, 0.4489494562149048, 0.7103781700134277, 0.9718070030212402, 1.2332358360290527, 1.4946645498275757, 1.7560932636260986, 2.017522096633911, 2.2789509296417236, 2.540379524230957, 2.8018083572387695, 3.063237190246582, 3.3246660232543945, 3.586094856262207, 3.8475234508514404, 4.108952522277832, 4.3703813552856445, 4.631809711456299, 4.893238544464111, 5.154667377471924, 5.416096210479736, 5.677525043487549, 5.938953876495361, 6.200382232666016, 6.461811065673828, 6.723239898681641, 6.984668731689453, 7.246097564697266]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 5.0, 7.0, 10.0, 22.0, 22.0, 46.0, 49.0, 63.0, 129.0, 213.0, 285.0, 424.0, 638.0, 965.0, 1461.0, 2452.0, 3881.0, 5968.0, 9808.0, 16267.0, 26882.0, 44797.0, 73374.0, 116407.0, 166760.0, 184326.0, 145228.0, 96355.0, 59276.0, 36062.0, 21538.0, 13167.0, 7980.0, 4993.0, 3129.0, 1943.0, 1232.0, 811.0, 531.0, 369.0, 222.0, 155.0, 97.0, 60.0, 64.0, 33.0, 22.0, 11.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0], "bins": [-13.375, -12.98486328125, -12.5947265625, -12.20458984375, -11.814453125, -11.42431640625, -11.0341796875, -10.64404296875, -10.25390625, -9.86376953125, -9.4736328125, -9.08349609375, -8.693359375, -8.30322265625, -7.9130859375, -7.52294921875, -7.1328125, -6.74267578125, -6.3525390625, -5.96240234375, -5.572265625, -5.18212890625, -4.7919921875, -4.40185546875, -4.01171875, -3.62158203125, -3.2314453125, -2.84130859375, -2.451171875, -2.06103515625, -1.6708984375, -1.28076171875, -0.890625, -0.50048828125, -0.1103515625, 0.27978515625, 0.669921875, 1.06005859375, 1.4501953125, 1.84033203125, 2.23046875, 2.62060546875, 3.0107421875, 3.40087890625, 3.791015625, 4.18115234375, 4.5712890625, 4.96142578125, 5.3515625, 5.74169921875, 6.1318359375, 6.52197265625, 6.912109375, 7.30224609375, 7.6923828125, 8.08251953125, 8.47265625, 8.86279296875, 9.2529296875, 9.64306640625, 10.033203125, 10.42333984375, 10.8134765625, 11.20361328125, 11.59375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 11.0, 19.0, 8.0, 17.0, 14.0, 22.0, 16.0, 21.0, 24.0, 25.0, 32.0, 21.0, 37.0, 34.0, 29.0, 45.0, 41.0, 33.0, 49.0, 32.0, 57.0, 41.0, 35.0, 33.0, 24.0, 29.0, 31.0, 32.0, 25.0, 18.0, 29.0, 20.0, 10.0, 14.0, 9.0, 6.0, 10.0, 11.0, 5.0, 6.0, 5.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-7.90625, -7.669921875, -7.43359375, -7.197265625, -6.9609375, -6.724609375, -6.48828125, -6.251953125, -6.015625, -5.779296875, -5.54296875, -5.306640625, -5.0703125, -4.833984375, -4.59765625, -4.361328125, -4.125, -3.888671875, -3.65234375, -3.416015625, -3.1796875, -2.943359375, -2.70703125, -2.470703125, -2.234375, -1.998046875, -1.76171875, -1.525390625, -1.2890625, -1.052734375, -0.81640625, -0.580078125, -0.34375, -0.107421875, 0.12890625, 0.365234375, 0.6015625, 0.837890625, 1.07421875, 1.310546875, 1.546875, 1.783203125, 2.01953125, 2.255859375, 2.4921875, 2.728515625, 2.96484375, 3.201171875, 3.4375, 3.673828125, 3.91015625, 4.146484375, 4.3828125, 4.619140625, 4.85546875, 5.091796875, 5.328125, 5.564453125, 5.80078125, 6.037109375, 6.2734375, 6.509765625, 6.74609375, 6.982421875, 7.21875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 16.0, 16.0, 34.0, 28.0, 49.0, 86.0, 128.0, 246.0, 400.0, 599.0, 1041.0, 1684.0, 2615.0, 4464.0, 7488.0, 12337.0, 20898.0, 35188.0, 61201.0, 103443.0, 164228.0, 205385.0, 167747.0, 107000.0, 62572.0, 36255.0, 21326.0, 12700.0, 7699.0, 4429.0, 2821.0, 1707.0, 1035.0, 656.0, 371.0, 231.0, 149.0, 112.0, 55.0, 40.0, 25.0, 19.0, 18.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.984375, -13.5672607421875, -13.150146484375, -12.7330322265625, -12.31591796875, -11.8988037109375, -11.481689453125, -11.0645751953125, -10.6474609375, -10.2303466796875, -9.813232421875, -9.3961181640625, -8.97900390625, -8.5618896484375, -8.144775390625, -7.7276611328125, -7.310546875, -6.8934326171875, -6.476318359375, -6.0592041015625, -5.64208984375, -5.2249755859375, -4.807861328125, -4.3907470703125, -3.9736328125, -3.5565185546875, -3.139404296875, -2.7222900390625, -2.30517578125, -1.8880615234375, -1.470947265625, -1.0538330078125, -0.63671875, -0.2196044921875, 0.197509765625, 0.6146240234375, 1.03173828125, 1.4488525390625, 1.865966796875, 2.2830810546875, 2.7001953125, 3.1173095703125, 3.534423828125, 3.9515380859375, 4.36865234375, 4.7857666015625, 5.202880859375, 5.6199951171875, 6.037109375, 6.4542236328125, 6.871337890625, 7.2884521484375, 7.70556640625, 8.1226806640625, 8.539794921875, 8.9569091796875, 9.3740234375, 9.7911376953125, 10.208251953125, 10.6253662109375, 11.04248046875, 11.4595947265625, 11.876708984375, 12.2938232421875, 12.7109375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 4.0, 9.0, 6.0, 13.0, 10.0, 13.0, 16.0, 20.0, 20.0, 27.0, 21.0, 30.0, 47.0, 39.0, 30.0, 29.0, 44.0, 38.0, 45.0, 30.0, 37.0, 39.0, 43.0, 35.0, 26.0, 43.0, 30.0, 35.0, 29.0, 17.0, 18.0, 22.0, 18.0, 14.0, 15.0, 12.0, 12.0, 3.0, 4.0, 11.0, 10.0, 11.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0], "bins": [-4.86328125, -4.7139892578125, -4.564697265625, -4.4154052734375, -4.26611328125, -4.1168212890625, -3.967529296875, -3.8182373046875, -3.6689453125, -3.5196533203125, -3.370361328125, -3.2210693359375, -3.07177734375, -2.9224853515625, -2.773193359375, -2.6239013671875, -2.474609375, -2.3253173828125, -2.176025390625, -2.0267333984375, -1.87744140625, -1.7281494140625, -1.578857421875, -1.4295654296875, -1.2802734375, -1.1309814453125, -0.981689453125, -0.8323974609375, -0.68310546875, -0.5338134765625, -0.384521484375, -0.2352294921875, -0.0859375, 0.0633544921875, 0.212646484375, 0.3619384765625, 0.51123046875, 0.6605224609375, 0.809814453125, 0.9591064453125, 1.1083984375, 1.2576904296875, 1.406982421875, 1.5562744140625, 1.70556640625, 1.8548583984375, 2.004150390625, 2.1534423828125, 2.302734375, 2.4520263671875, 2.601318359375, 2.7506103515625, 2.89990234375, 3.0491943359375, 3.198486328125, 3.3477783203125, 3.4970703125, 3.6463623046875, 3.795654296875, 3.9449462890625, 4.09423828125, 4.2435302734375, 4.392822265625, 4.5421142578125, 4.69140625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 5.0, 3.0, 9.0, 9.0, 12.0, 14.0, 24.0, 23.0, 51.0, 49.0, 68.0, 94.0, 145.0, 194.0, 301.0, 389.0, 558.0, 849.0, 1196.0, 1897.0, 2754.0, 4195.0, 6758.0, 11328.0, 20919.0, 42279.0, 102035.0, 360769.0, 312029.0, 91991.0, 38765.0, 19524.0, 10887.0, 6318.0, 3980.0, 2522.0, 1715.0, 1142.0, 798.0, 577.0, 381.0, 279.0, 206.0, 161.0, 116.0, 69.0, 49.0, 41.0, 25.0, 22.0, 11.0, 3.0, 7.0, 6.0, 6.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.01953125, -5.82501220703125, -5.6304931640625, -5.43597412109375, -5.241455078125, -5.04693603515625, -4.8524169921875, -4.65789794921875, -4.46337890625, -4.26885986328125, -4.0743408203125, -3.87982177734375, -3.685302734375, -3.49078369140625, -3.2962646484375, -3.10174560546875, -2.9072265625, -2.71270751953125, -2.5181884765625, -2.32366943359375, -2.129150390625, -1.93463134765625, -1.7401123046875, -1.54559326171875, -1.35107421875, -1.15655517578125, -0.9620361328125, -0.76751708984375, -0.572998046875, -0.37847900390625, -0.1839599609375, 0.01055908203125, 0.205078125, 0.39959716796875, 0.5941162109375, 0.78863525390625, 0.983154296875, 1.17767333984375, 1.3721923828125, 1.56671142578125, 1.76123046875, 1.95574951171875, 2.1502685546875, 2.34478759765625, 2.539306640625, 2.73382568359375, 2.9283447265625, 3.12286376953125, 3.3173828125, 3.51190185546875, 3.7064208984375, 3.90093994140625, 4.095458984375, 4.28997802734375, 4.4844970703125, 4.67901611328125, 4.87353515625, 5.06805419921875, 5.2625732421875, 5.45709228515625, 5.651611328125, 5.84613037109375, 6.0406494140625, 6.23516845703125, 6.4296875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 8.0, 8.0, 13.0, 22.0, 19.0, 18.0, 40.0, 43.0, 80.0, 92.0, 91.0, 135.0, 104.0, 84.0, 54.0, 42.0, 28.0, 23.0, 17.0, 18.0, 9.0, 9.0, 15.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003330707550048828, -0.00032309070229530334, -0.0003131106495857239, -0.0003031305968761444, -0.00029315054416656494, -0.0002831704914569855, -0.000273190438747406, -0.00026321038603782654, -0.00025323033332824707, -0.0002432502806186676, -0.00023327022790908813, -0.00022329017519950867, -0.0002133101224899292, -0.00020333006978034973, -0.00019335001707077026, -0.0001833699643611908, -0.00017338991165161133, -0.00016340985894203186, -0.0001534298062324524, -0.00014344975352287292, -0.00013346970081329346, -0.000123489648103714, -0.00011350959539413452, -0.00010352954268455505, -9.354948997497559e-05, -8.356943726539612e-05, -7.358938455581665e-05, -6.360933184623718e-05, -5.3629279136657715e-05, -4.364922642707825e-05, -3.366917371749878e-05, -2.368912100791931e-05, -1.3709068298339844e-05, -3.729015588760376e-06, 6.251037120819092e-06, 1.623108983039856e-05, 2.6211142539978027e-05, 3.6191195249557495e-05, 4.617124795913696e-05, 5.615130066871643e-05, 6.61313533782959e-05, 7.611140608787537e-05, 8.609145879745483e-05, 9.60715115070343e-05, 0.00010605156421661377, 0.00011603161692619324, 0.0001260116696357727, 0.00013599172234535217, 0.00014597177505493164, 0.0001559518277645111, 0.00016593188047409058, 0.00017591193318367004, 0.0001858919858932495, 0.00019587203860282898, 0.00020585209131240845, 0.00021583214402198792, 0.00022581219673156738, 0.00023579224944114685, 0.0002457723021507263, 0.0002557523548603058, 0.00026573240756988525, 0.0002757124602794647, 0.0002856925129890442, 0.00029567256569862366, 0.0003056526184082031]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 6.0, 10.0, 21.0, 25.0, 20.0, 40.0, 48.0, 76.0, 107.0, 153.0, 234.0, 350.0, 574.0, 959.0, 1670.0, 2963.0, 5489.0, 11365.0, 25301.0, 68185.0, 264612.0, 489820.0, 108639.0, 36516.0, 15099.0, 7344.0, 3643.0, 2065.0, 1145.0, 753.0, 453.0, 265.0, 177.0, 131.0, 69.0, 53.0, 52.0, 31.0, 27.0, 11.0, 15.0, 5.0, 13.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-8.296875, -8.04693603515625, -7.7969970703125, -7.54705810546875, -7.297119140625, -7.04718017578125, -6.7972412109375, -6.54730224609375, -6.29736328125, -6.04742431640625, -5.7974853515625, -5.54754638671875, -5.297607421875, -5.04766845703125, -4.7977294921875, -4.54779052734375, -4.2978515625, -4.04791259765625, -3.7979736328125, -3.54803466796875, -3.298095703125, -3.04815673828125, -2.7982177734375, -2.54827880859375, -2.29833984375, -2.04840087890625, -1.7984619140625, -1.54852294921875, -1.298583984375, -1.04864501953125, -0.7987060546875, -0.54876708984375, -0.298828125, -0.04888916015625, 0.2010498046875, 0.45098876953125, 0.700927734375, 0.95086669921875, 1.2008056640625, 1.45074462890625, 1.70068359375, 1.95062255859375, 2.2005615234375, 2.45050048828125, 2.700439453125, 2.95037841796875, 3.2003173828125, 3.45025634765625, 3.7001953125, 3.95013427734375, 4.2000732421875, 4.45001220703125, 4.699951171875, 4.94989013671875, 5.1998291015625, 5.44976806640625, 5.69970703125, 5.94964599609375, 6.1995849609375, 6.44952392578125, 6.699462890625, 6.94940185546875, 7.1993408203125, 7.44927978515625, 7.69921875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 9.0, 1.0, 3.0, 7.0, 7.0, 8.0, 17.0, 26.0, 22.0, 29.0, 48.0, 76.0, 82.0, 125.0, 113.0, 108.0, 82.0, 76.0, 45.0, 33.0, 26.0, 19.0, 11.0, 11.0, 5.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.724609375, -2.643341064453125, -2.56207275390625, -2.480804443359375, -2.3995361328125, -2.318267822265625, -2.23699951171875, -2.155731201171875, -2.074462890625, -1.993194580078125, -1.91192626953125, -1.830657958984375, -1.7493896484375, -1.668121337890625, -1.58685302734375, -1.505584716796875, -1.42431640625, -1.343048095703125, -1.26177978515625, -1.180511474609375, -1.0992431640625, -1.017974853515625, -0.93670654296875, -0.855438232421875, -0.774169921875, -0.692901611328125, -0.61163330078125, -0.530364990234375, -0.4490966796875, -0.367828369140625, -0.28656005859375, -0.205291748046875, -0.1240234375, -0.042755126953125, 0.03851318359375, 0.119781494140625, 0.2010498046875, 0.282318115234375, 0.36358642578125, 0.444854736328125, 0.526123046875, 0.607391357421875, 0.68865966796875, 0.769927978515625, 0.8511962890625, 0.932464599609375, 1.01373291015625, 1.095001220703125, 1.17626953125, 1.257537841796875, 1.33880615234375, 1.420074462890625, 1.5013427734375, 1.582611083984375, 1.66387939453125, 1.745147705078125, 1.826416015625, 1.907684326171875, 1.98895263671875, 2.070220947265625, 2.1514892578125, 2.232757568359375, 2.31402587890625, 2.395294189453125, 2.4765625]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 7.0, 8.0, 11.0, 9.0, 25.0, 25.0, 28.0, 40.0, 46.0, 56.0, 54.0, 78.0, 71.0, 76.0, 77.0, 69.0, 55.0, 46.0, 36.0, 43.0, 27.0, 20.0, 15.0, 15.0, 13.0, 4.0, 9.0, 4.0, 5.0, 2.0, 4.0, 4.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.962874412536621, -8.657495498657227, -8.352117538452148, -8.046738624572754, -7.741360664367676, -7.435981750488281, -7.130603313446045, -6.825224876403809, -6.519846439361572, -6.214468002319336, -5.9090895652771, -5.603711128234863, -5.298332214355469, -4.992954254150391, -4.687575340270996, -4.38219690322876, -4.076818466186523, -3.771440029144287, -3.466061592102051, -3.1606829166412354, -2.855304479598999, -2.5499260425567627, -2.2445473670959473, -1.939168930053711, -1.6337904930114746, -1.3284120559692383, -1.0230334997177124, -0.7176550030708313, -0.4122765064239502, -0.10689806938171387, 0.198480486869812, 0.5038590431213379, 0.8092374801635742, 1.1146159172058105, 1.4199944734573364, 1.7253730297088623, 2.0307514667510986, 2.336129903793335, 2.6415085792541504, 2.9468870162963867, 3.252265453338623, 3.5576438903808594, 3.8630223274230957, 4.168400764465332, 4.473779678344727, 4.779157638549805, 5.084536552429199, 5.3899149894714355, 5.695293426513672, 6.000671863555908, 6.3060503005981445, 6.611428737640381, 6.916807174682617, 7.222186088562012, 7.527564525604248, 7.832942962646484, 8.138320922851562, 8.443699836730957, 8.749077796936035, 9.05445671081543, 9.359834671020508, 9.665213584899902, 9.97059154510498, 10.275970458984375, 10.58134937286377]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 4.0, 14.0, 19.0, 21.0, 16.0, 12.0, 27.0, 29.0, 20.0, 32.0, 26.0, 41.0, 32.0, 44.0, 48.0, 47.0, 38.0, 39.0, 44.0, 42.0, 47.0, 48.0, 36.0, 37.0, 28.0, 29.0, 33.0, 22.0, 21.0, 29.0, 17.0, 12.0, 8.0, 13.0, 9.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-11.897977828979492, -11.596817970275879, -11.295658111572266, -10.994498252868652, -10.693338394165039, -10.392178535461426, -10.091018676757812, -9.7898588180542, -9.488698959350586, -9.187539100646973, -8.88637924194336, -8.585219383239746, -8.284059524536133, -7.9828996658325195, -7.681739807128906, -7.380579948425293, -7.0794196128845215, -6.778259754180908, -6.477099895477295, -6.175940036773682, -5.874780178070068, -5.573620319366455, -5.272459983825684, -4.97130012512207, -4.670140266418457, -4.368980407714844, -4.0678205490112305, -3.766660690307617, -3.465500831604004, -3.1643409729003906, -2.8631808757781982, -2.562021017074585, -2.260861396789551, -1.9597015380859375, -1.6585416793823242, -1.3573817014694214, -1.056221842765808, -0.7550619840621948, -0.453902006149292, -0.1527421474456787, 0.14841771125793457, 0.44957759976387024, 0.7507374882698059, 1.051897406578064, 1.3530572652816772, 1.6542171239852905, 1.9553771018981934, 2.2565369606018066, 2.55769681930542, 2.858856678009033, 3.1600165367126465, 3.4611763954162598, 3.762336254119873, 4.063496112823486, 4.364656448364258, 4.665816307067871, 4.966976165771484, 5.268136024475098, 5.569295883178711, 5.870455741882324, 6.1716156005859375, 6.472775459289551, 6.773935317993164, 7.075095176696777, 7.376255035400391]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 7.0, 11.0, 9.0, 18.0, 34.0, 43.0, 59.0, 76.0, 132.0, 155.0, 241.0, 391.0, 550.0, 810.0, 1335.0, 2061.0, 3272.0, 5439.0, 8863.0, 14730.0, 25153.0, 43810.0, 79385.0, 156182.0, 363688.0, 955672.0, 1343676.0, 660073.0, 254953.0, 120536.0, 64316.0, 35945.0, 20869.0, 12336.0, 7299.0, 4647.0, 2755.0, 1723.0, 1098.0, 699.0, 458.0, 247.0, 170.0, 131.0, 75.0, 47.0, 46.0, 24.0, 15.0, 11.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-12.3203125, -11.961181640625, -11.60205078125, -11.242919921875, -10.8837890625, -10.524658203125, -10.16552734375, -9.806396484375, -9.447265625, -9.088134765625, -8.72900390625, -8.369873046875, -8.0107421875, -7.651611328125, -7.29248046875, -6.933349609375, -6.57421875, -6.215087890625, -5.85595703125, -5.496826171875, -5.1376953125, -4.778564453125, -4.41943359375, -4.060302734375, -3.701171875, -3.342041015625, -2.98291015625, -2.623779296875, -2.2646484375, -1.905517578125, -1.54638671875, -1.187255859375, -0.828125, -0.468994140625, -0.10986328125, 0.249267578125, 0.6083984375, 0.967529296875, 1.32666015625, 1.685791015625, 2.044921875, 2.404052734375, 2.76318359375, 3.122314453125, 3.4814453125, 3.840576171875, 4.19970703125, 4.558837890625, 4.91796875, 5.277099609375, 5.63623046875, 5.995361328125, 6.3544921875, 6.713623046875, 7.07275390625, 7.431884765625, 7.791015625, 8.150146484375, 8.50927734375, 8.868408203125, 9.2275390625, 9.586669921875, 9.94580078125, 10.304931640625, 10.6640625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 10.0, 10.0, 10.0, 15.0, 20.0, 31.0, 25.0, 28.0, 32.0, 34.0, 39.0, 41.0, 43.0, 54.0, 49.0, 55.0, 34.0, 55.0, 43.0, 49.0, 50.0, 40.0, 26.0, 34.0, 32.0, 28.0, 18.0, 23.0, 21.0, 11.0, 10.0, 9.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.96875, -9.70599365234375, -9.4432373046875, -9.18048095703125, -8.917724609375, -8.65496826171875, -8.3922119140625, -8.12945556640625, -7.86669921875, -7.60394287109375, -7.3411865234375, -7.07843017578125, -6.815673828125, -6.55291748046875, -6.2901611328125, -6.02740478515625, -5.7646484375, -5.50189208984375, -5.2391357421875, -4.97637939453125, -4.713623046875, -4.45086669921875, -4.1881103515625, -3.92535400390625, -3.66259765625, -3.39984130859375, -3.1370849609375, -2.87432861328125, -2.611572265625, -2.34881591796875, -2.0860595703125, -1.82330322265625, -1.560546875, -1.29779052734375, -1.0350341796875, -0.77227783203125, -0.509521484375, -0.24676513671875, 0.0159912109375, 0.27874755859375, 0.54150390625, 0.80426025390625, 1.0670166015625, 1.32977294921875, 1.592529296875, 1.85528564453125, 2.1180419921875, 2.38079833984375, 2.6435546875, 2.90631103515625, 3.1690673828125, 3.43182373046875, 3.694580078125, 3.95733642578125, 4.2200927734375, 4.48284912109375, 4.74560546875, 5.00836181640625, 5.2711181640625, 5.53387451171875, 5.796630859375, 6.05938720703125, 6.3221435546875, 6.58489990234375, 6.84765625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 9.0, 12.0, 16.0, 23.0, 40.0, 67.0, 108.0, 138.0, 225.0, 307.0, 502.0, 717.0, 1168.0, 1736.0, 2797.0, 4406.0, 7130.0, 11818.0, 19993.0, 34572.0, 62127.0, 115619.0, 222883.0, 448868.0, 914359.0, 1124003.0, 594979.0, 292055.0, 148210.0, 78527.0, 43272.0, 25008.0, 14820.0, 8751.0, 5363.0, 3449.0, 2178.0, 1366.0, 885.0, 616.0, 394.0, 270.0, 172.0, 114.0, 87.0, 48.0, 33.0, 19.0, 16.0, 14.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.234375, -9.91650390625, -9.5986328125, -9.28076171875, -8.962890625, -8.64501953125, -8.3271484375, -8.00927734375, -7.69140625, -7.37353515625, -7.0556640625, -6.73779296875, -6.419921875, -6.10205078125, -5.7841796875, -5.46630859375, -5.1484375, -4.83056640625, -4.5126953125, -4.19482421875, -3.876953125, -3.55908203125, -3.2412109375, -2.92333984375, -2.60546875, -2.28759765625, -1.9697265625, -1.65185546875, -1.333984375, -1.01611328125, -0.6982421875, -0.38037109375, -0.0625, 0.25537109375, 0.5732421875, 0.89111328125, 1.208984375, 1.52685546875, 1.8447265625, 2.16259765625, 2.48046875, 2.79833984375, 3.1162109375, 3.43408203125, 3.751953125, 4.06982421875, 4.3876953125, 4.70556640625, 5.0234375, 5.34130859375, 5.6591796875, 5.97705078125, 6.294921875, 6.61279296875, 6.9306640625, 7.24853515625, 7.56640625, 7.88427734375, 8.2021484375, 8.52001953125, 8.837890625, 9.15576171875, 9.4736328125, 9.79150390625, 10.109375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 11.0, 8.0, 13.0, 22.0, 20.0, 23.0, 39.0, 40.0, 48.0, 61.0, 93.0, 100.0, 111.0, 136.0, 185.0, 196.0, 240.0, 286.0, 313.0, 309.0, 303.0, 246.0, 222.0, 202.0, 161.0, 133.0, 105.0, 78.0, 73.0, 67.0, 47.0, 39.0, 35.0, 18.0, 18.0, 16.0, 13.0, 9.0, 6.0, 7.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.6328125, -3.5120849609375, -3.391357421875, -3.2706298828125, -3.14990234375, -3.0291748046875, -2.908447265625, -2.7877197265625, -2.6669921875, -2.5462646484375, -2.425537109375, -2.3048095703125, -2.18408203125, -2.0633544921875, -1.942626953125, -1.8218994140625, -1.701171875, -1.5804443359375, -1.459716796875, -1.3389892578125, -1.21826171875, -1.0975341796875, -0.976806640625, -0.8560791015625, -0.7353515625, -0.6146240234375, -0.493896484375, -0.3731689453125, -0.25244140625, -0.1317138671875, -0.010986328125, 0.1097412109375, 0.23046875, 0.3511962890625, 0.471923828125, 0.5926513671875, 0.71337890625, 0.8341064453125, 0.954833984375, 1.0755615234375, 1.1962890625, 1.3170166015625, 1.437744140625, 1.5584716796875, 1.67919921875, 1.7999267578125, 1.920654296875, 2.0413818359375, 2.162109375, 2.2828369140625, 2.403564453125, 2.5242919921875, 2.64501953125, 2.7657470703125, 2.886474609375, 3.0072021484375, 3.1279296875, 3.2486572265625, 3.369384765625, 3.4901123046875, 3.61083984375, 3.7315673828125, 3.852294921875, 3.9730224609375, 4.09375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 10.0, 9.0, 10.0, 8.0, 13.0, 19.0, 18.0, 29.0, 27.0, 42.0, 48.0, 90.0, 83.0, 88.0, 75.0, 90.0, 62.0, 50.0, 38.0, 41.0, 34.0, 23.0, 16.0, 19.0, 12.0, 12.0, 8.0, 8.0, 1.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.096809387207031, -7.787352561950684, -7.477895736694336, -7.1684393882751465, -6.858982563018799, -6.549525737762451, -6.240069389343262, -5.930612564086914, -5.621155738830566, -5.311698913574219, -5.002242088317871, -4.692785739898682, -4.383328914642334, -4.073872089385986, -3.7644155025482178, -3.454958915710449, -3.1455020904541016, -2.836045265197754, -2.5265886783599854, -2.217132091522217, -1.9076752662658691, -1.598218560218811, -1.288761854171753, -0.9793052673339844, -0.6698484420776367, -0.3603917360305786, -0.05093502998352051, 0.2585216760635376, 0.5679783821105957, 0.8774350881576538, 1.186891794204712, 1.4963483810424805, 1.8058042526245117, 2.1152610778808594, 2.424717664718628, 2.7341742515563965, 3.043631076812744, 3.353087902069092, 3.6625444889068604, 3.972001075744629, 4.281457901000977, 4.590914726257324, 4.900371551513672, 5.209827899932861, 5.519284725189209, 5.828741550445557, 6.138197898864746, 6.447654724121094, 6.757111549377441, 7.066568374633789, 7.376025199890137, 7.685481548309326, 7.994938373565674, 8.304394721984863, 8.613851547241211, 8.923308372497559, 9.232765197753906, 9.542222023010254, 9.851678848266602, 10.16113567352295, 10.470592498779297, 10.780048370361328, 11.089505195617676, 11.398962020874023, 11.708418846130371]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 11.0, 3.0, 6.0, 8.0, 7.0, 16.0, 24.0, 20.0, 20.0, 20.0, 24.0, 23.0, 31.0, 27.0, 32.0, 33.0, 40.0, 37.0, 46.0, 54.0, 46.0, 41.0, 57.0, 43.0, 37.0, 45.0, 34.0, 36.0, 32.0, 24.0, 17.0, 11.0, 20.0, 14.0, 23.0, 11.0, 10.0, 8.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.441136360168457, -10.168608665466309, -9.89608097076416, -9.623553276062012, -9.351024627685547, -9.078496932983398, -8.80596923828125, -8.533441543579102, -8.260913848876953, -7.988386154174805, -7.715858459472656, -7.44333028793335, -7.170802593231201, -6.898274898529053, -6.625746726989746, -6.353219032287598, -6.080691337585449, -5.808163642883301, -5.535635948181152, -5.263107776641846, -4.990580081939697, -4.718052387237549, -4.445524215698242, -4.172996520996094, -3.9004688262939453, -3.627941131591797, -3.3554131984710693, -3.082885265350342, -2.8103575706481934, -2.537829875946045, -2.2653019428253174, -1.9927741289138794, -1.7202467918395996, -1.4477189779281616, -1.1751911640167236, -0.9026633501052856, -0.6301355361938477, -0.35760772228240967, -0.08507990837097168, 0.1874479055404663, 0.4599757194519043, 0.7325035333633423, 1.0050313472747803, 1.2775591611862183, 1.5500869750976562, 1.8226147890090942, 2.0951426029205322, 2.3676705360412598, 2.640198230743408, 2.9127259254455566, 3.185253858566284, 3.4577817916870117, 3.73030948638916, 4.002837181091309, 4.275364875793457, 4.547893047332764, 4.820420742034912, 5.0929484367370605, 5.365476608276367, 5.638004302978516, 5.910531997680664, 6.1830596923828125, 6.455587387084961, 6.728115558624268, 7.000643253326416]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 4.0, 7.0, 28.0, 35.0, 39.0, 48.0, 69.0, 104.0, 125.0, 200.0, 333.0, 442.0, 651.0, 977.0, 1422.0, 2148.0, 3372.0, 5007.0, 7533.0, 11481.0, 17560.0, 26980.0, 42259.0, 66819.0, 105222.0, 164612.0, 205257.0, 138915.0, 88227.0, 55966.0, 35948.0, 22855.0, 15062.0, 9721.0, 6410.0, 4132.0, 2752.0, 1948.0, 1206.0, 828.0, 588.0, 384.0, 252.0, 177.0, 136.0, 95.0, 62.0, 47.0, 31.0, 27.0, 11.0, 7.0, 11.0, 7.0, 5.0, 5.0, 1.0, 4.0], "bins": [-3.06640625, -2.97149658203125, -2.8765869140625, -2.78167724609375, -2.686767578125, -2.59185791015625, -2.4969482421875, -2.40203857421875, -2.30712890625, -2.21221923828125, -2.1173095703125, -2.02239990234375, -1.927490234375, -1.83258056640625, -1.7376708984375, -1.64276123046875, -1.5478515625, -1.45294189453125, -1.3580322265625, -1.26312255859375, -1.168212890625, -1.07330322265625, -0.9783935546875, -0.88348388671875, -0.78857421875, -0.69366455078125, -0.5987548828125, -0.50384521484375, -0.408935546875, -0.31402587890625, -0.2191162109375, -0.12420654296875, -0.029296875, 0.06561279296875, 0.1605224609375, 0.25543212890625, 0.350341796875, 0.44525146484375, 0.5401611328125, 0.63507080078125, 0.72998046875, 0.82489013671875, 0.9197998046875, 1.01470947265625, 1.109619140625, 1.20452880859375, 1.2994384765625, 1.39434814453125, 1.4892578125, 1.58416748046875, 1.6790771484375, 1.77398681640625, 1.868896484375, 1.96380615234375, 2.0587158203125, 2.15362548828125, 2.24853515625, 2.34344482421875, 2.4383544921875, 2.53326416015625, 2.628173828125, 2.72308349609375, 2.8179931640625, 2.91290283203125, 3.0078125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 1.0, 4.0, 11.0, 7.0, 13.0, 10.0, 22.0, 15.0, 18.0, 28.0, 15.0, 19.0, 34.0, 28.0, 33.0, 28.0, 33.0, 50.0, 48.0, 42.0, 43.0, 40.0, 41.0, 45.0, 44.0, 41.0, 50.0, 31.0, 28.0, 32.0, 26.0, 15.0, 23.0, 8.0, 15.0, 15.0, 17.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.890625, -9.621337890625, -9.35205078125, -9.082763671875, -8.8134765625, -8.544189453125, -8.27490234375, -8.005615234375, -7.736328125, -7.467041015625, -7.19775390625, -6.928466796875, -6.6591796875, -6.389892578125, -6.12060546875, -5.851318359375, -5.58203125, -5.312744140625, -5.04345703125, -4.774169921875, -4.5048828125, -4.235595703125, -3.96630859375, -3.697021484375, -3.427734375, -3.158447265625, -2.88916015625, -2.619873046875, -2.3505859375, -2.081298828125, -1.81201171875, -1.542724609375, -1.2734375, -1.004150390625, -0.73486328125, -0.465576171875, -0.1962890625, 0.072998046875, 0.34228515625, 0.611572265625, 0.880859375, 1.150146484375, 1.41943359375, 1.688720703125, 1.9580078125, 2.227294921875, 2.49658203125, 2.765869140625, 3.03515625, 3.304443359375, 3.57373046875, 3.843017578125, 4.1123046875, 4.381591796875, 4.65087890625, 4.920166015625, 5.189453125, 5.458740234375, 5.72802734375, 5.997314453125, 6.2666015625, 6.535888671875, 6.80517578125, 7.074462890625, 7.34375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 21.0, 17.0, 31.0, 42.0, 67.0, 136.0, 191.0, 299.0, 454.0, 669.0, 1080.0, 1799.0, 2929.0, 4820.0, 8598.0, 15236.0, 28061.0, 53990.0, 106728.0, 225365.0, 302557.0, 142631.0, 70572.0, 36407.0, 19573.0, 10691.0, 6210.0, 3523.0, 2151.0, 1344.0, 823.0, 517.0, 353.0, 216.0, 140.0, 98.0, 64.0, 42.0, 34.0, 17.0, 10.0, 13.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-4.359375, -4.2239990234375, -4.088623046875, -3.9532470703125, -3.81787109375, -3.6824951171875, -3.547119140625, -3.4117431640625, -3.2763671875, -3.1409912109375, -3.005615234375, -2.8702392578125, -2.73486328125, -2.5994873046875, -2.464111328125, -2.3287353515625, -2.193359375, -2.0579833984375, -1.922607421875, -1.7872314453125, -1.65185546875, -1.5164794921875, -1.381103515625, -1.2457275390625, -1.1103515625, -0.9749755859375, -0.839599609375, -0.7042236328125, -0.56884765625, -0.4334716796875, -0.298095703125, -0.1627197265625, -0.02734375, 0.1080322265625, 0.243408203125, 0.3787841796875, 0.51416015625, 0.6495361328125, 0.784912109375, 0.9202880859375, 1.0556640625, 1.1910400390625, 1.326416015625, 1.4617919921875, 1.59716796875, 1.7325439453125, 1.867919921875, 2.0032958984375, 2.138671875, 2.2740478515625, 2.409423828125, 2.5447998046875, 2.68017578125, 2.8155517578125, 2.950927734375, 3.0863037109375, 3.2216796875, 3.3570556640625, 3.492431640625, 3.6278076171875, 3.76318359375, 3.8985595703125, 4.033935546875, 4.1693115234375, 4.3046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 3.0, 9.0, 9.0, 6.0, 7.0, 11.0, 22.0, 30.0, 26.0, 18.0, 30.0, 20.0, 31.0, 28.0, 32.0, 34.0, 38.0, 52.0, 31.0, 34.0, 46.0, 47.0, 38.0, 40.0, 33.0, 49.0, 29.0, 29.0, 24.0, 30.0, 23.0, 28.0, 16.0, 14.0, 16.0, 12.0, 6.0, 6.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.94140625, -4.786865234375, -4.63232421875, -4.477783203125, -4.3232421875, -4.168701171875, -4.01416015625, -3.859619140625, -3.705078125, -3.550537109375, -3.39599609375, -3.241455078125, -3.0869140625, -2.932373046875, -2.77783203125, -2.623291015625, -2.46875, -2.314208984375, -2.15966796875, -2.005126953125, -1.8505859375, -1.696044921875, -1.54150390625, -1.386962890625, -1.232421875, -1.077880859375, -0.92333984375, -0.768798828125, -0.6142578125, -0.459716796875, -0.30517578125, -0.150634765625, 0.00390625, 0.158447265625, 0.31298828125, 0.467529296875, 0.6220703125, 0.776611328125, 0.93115234375, 1.085693359375, 1.240234375, 1.394775390625, 1.54931640625, 1.703857421875, 1.8583984375, 2.012939453125, 2.16748046875, 2.322021484375, 2.4765625, 2.631103515625, 2.78564453125, 2.940185546875, 3.0947265625, 3.249267578125, 3.40380859375, 3.558349609375, 3.712890625, 3.867431640625, 4.02197265625, 4.176513671875, 4.3310546875, 4.485595703125, 4.64013671875, 4.794677734375, 4.94921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 12.0, 25.0, 24.0, 38.0, 35.0, 93.0, 131.0, 212.0, 334.0, 522.0, 777.0, 1283.0, 2270.0, 3876.0, 7352.0, 15064.0, 34108.0, 93481.0, 342796.0, 374252.0, 101779.0, 36758.0, 15717.0, 7674.0, 4132.0, 2214.0, 1351.0, 816.0, 482.0, 304.0, 213.0, 153.0, 79.0, 62.0, 44.0, 22.0, 15.0, 11.0, 16.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.044677734375, -0.043238162994384766, -0.04179859161376953, -0.0403590202331543, -0.03891944885253906, -0.03747987747192383, -0.036040306091308594, -0.03460073471069336, -0.033161163330078125, -0.03172159194946289, -0.030282020568847656, -0.028842449188232422, -0.027402877807617188, -0.025963306427001953, -0.02452373504638672, -0.023084163665771484, -0.02164459228515625, -0.020205020904541016, -0.01876544952392578, -0.017325878143310547, -0.015886306762695312, -0.014446735382080078, -0.013007164001464844, -0.01156759262084961, -0.010128021240234375, -0.00868844985961914, -0.007248878479003906, -0.005809307098388672, -0.0043697357177734375, -0.002930164337158203, -0.0014905929565429688, -5.1021575927734375e-05, 0.0013885498046875, 0.0028281211853027344, 0.004267692565917969, 0.005707263946533203, 0.0071468353271484375, 0.008586406707763672, 0.010025978088378906, 0.01146554946899414, 0.012905120849609375, 0.01434469223022461, 0.015784263610839844, 0.017223834991455078, 0.018663406372070312, 0.020102977752685547, 0.02154254913330078, 0.022982120513916016, 0.02442169189453125, 0.025861263275146484, 0.02730083465576172, 0.028740406036376953, 0.030179977416992188, 0.03161954879760742, 0.033059120178222656, 0.03449869155883789, 0.035938262939453125, 0.03737783432006836, 0.038817405700683594, 0.04025697708129883, 0.04169654846191406, 0.0431361198425293, 0.04457569122314453, 0.046015262603759766, 0.047454833984375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 11.0, 7.0, 9.0, 16.0, 13.0, 25.0, 26.0, 35.0, 43.0, 51.0, 73.0, 74.0, 90.0, 80.0, 94.0, 60.0, 54.0, 51.0, 35.0, 31.0, 26.0, 15.0, 22.0, 10.0, 12.0, 2.0, 8.0, 3.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5914440155029297e-05, -1.5472061932086945e-05, -1.5029683709144592e-05, -1.458730548620224e-05, -1.4144927263259888e-05, -1.3702549040317535e-05, -1.3260170817375183e-05, -1.281779259443283e-05, -1.2375414371490479e-05, -1.1933036148548126e-05, -1.1490657925605774e-05, -1.1048279702663422e-05, -1.060590147972107e-05, -1.0163523256778717e-05, -9.721145033836365e-06, -9.278766810894012e-06, -8.83638858795166e-06, -8.394010365009308e-06, -7.951632142066956e-06, -7.509253919124603e-06, -7.066875696182251e-06, -6.624497473239899e-06, -6.182119250297546e-06, -5.739741027355194e-06, -5.297362804412842e-06, -4.8549845814704895e-06, -4.412606358528137e-06, -3.970228135585785e-06, -3.5278499126434326e-06, -3.0854716897010803e-06, -2.643093466758728e-06, -2.2007152438163757e-06, -1.7583370208740234e-06, -1.3159587979316711e-06, -8.735805749893188e-07, -4.3120235204696655e-07, 1.1175870895385742e-08, 4.5355409383773804e-07, 8.959323167800903e-07, 1.3383105397224426e-06, 1.780688762664795e-06, 2.2230669856071472e-06, 2.6654452085494995e-06, 3.107823431491852e-06, 3.550201654434204e-06, 3.992579877376556e-06, 4.434958100318909e-06, 4.877336323261261e-06, 5.319714546203613e-06, 5.7620927691459656e-06, 6.204470992088318e-06, 6.64684921503067e-06, 7.0892274379730225e-06, 7.531605660915375e-06, 7.973983883857727e-06, 8.41636210680008e-06, 8.858740329742432e-06, 9.301118552684784e-06, 9.743496775627136e-06, 1.0185874998569489e-05, 1.062825322151184e-05, 1.1070631444454193e-05, 1.1513009667396545e-05, 1.1955387890338898e-05, 1.239776611328125e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 10.0, 12.0, 13.0, 22.0, 42.0, 52.0, 82.0, 133.0, 170.0, 255.0, 421.0, 587.0, 771.0, 1178.0, 1834.0, 2624.0, 4092.0, 6542.0, 10669.0, 18496.0, 32830.0, 65515.0, 149276.0, 334063.0, 221683.0, 93029.0, 44205.0, 23386.0, 13705.0, 8132.0, 4948.0, 3250.0, 2094.0, 1397.0, 970.0, 667.0, 457.0, 272.0, 204.0, 142.0, 95.0, 81.0, 49.0, 23.0, 22.0, 23.0, 13.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.033233642578125, -0.032217979431152344, -0.031202316284179688, -0.03018665313720703, -0.029170989990234375, -0.02815532684326172, -0.027139663696289062, -0.026124000549316406, -0.02510833740234375, -0.024092674255371094, -0.023077011108398438, -0.02206134796142578, -0.021045684814453125, -0.02003002166748047, -0.019014358520507812, -0.017998695373535156, -0.0169830322265625, -0.015967369079589844, -0.014951705932617188, -0.013936042785644531, -0.012920379638671875, -0.011904716491699219, -0.010889053344726562, -0.009873390197753906, -0.00885772705078125, -0.007842063903808594, -0.0068264007568359375, -0.005810737609863281, -0.004795074462890625, -0.0037794113159179688, -0.0027637481689453125, -0.0017480850219726562, -0.000732421875, 0.00028324127197265625, 0.0012989044189453125, 0.0023145675659179688, 0.003330230712890625, 0.004345893859863281, 0.0053615570068359375, 0.006377220153808594, 0.00739288330078125, 0.008408546447753906, 0.009424209594726562, 0.010439872741699219, 0.011455535888671875, 0.012471199035644531, 0.013486862182617188, 0.014502525329589844, 0.0155181884765625, 0.016533851623535156, 0.017549514770507812, 0.01856517791748047, 0.019580841064453125, 0.02059650421142578, 0.021612167358398438, 0.022627830505371094, 0.02364349365234375, 0.024659156799316406, 0.025674819946289062, 0.02669048309326172, 0.027706146240234375, 0.02872180938720703, 0.029737472534179688, 0.030753135681152344, 0.031768798828125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 6.0, 4.0, 11.0, 14.0, 17.0, 11.0, 30.0, 22.0, 41.0, 35.0, 55.0, 126.0, 150.0, 130.0, 86.0, 54.0, 45.0, 34.0, 18.0, 25.0, 17.0, 15.0, 5.0, 5.0, 7.0, 5.0, 3.0, 9.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011505126953125, -0.01110374927520752, -0.010702371597290039, -0.010300993919372559, -0.009899616241455078, -0.009498238563537598, -0.009096860885620117, -0.008695483207702637, -0.008294105529785156, -0.007892727851867676, -0.007491350173950195, -0.007089972496032715, -0.006688594818115234, -0.006287217140197754, -0.0058858394622802734, -0.005484461784362793, -0.0050830841064453125, -0.004681706428527832, -0.0042803287506103516, -0.003878951072692871, -0.0034775733947753906, -0.00307619571685791, -0.0026748180389404297, -0.0022734403610229492, -0.0018720626831054688, -0.0014706850051879883, -0.0010693073272705078, -0.0006679296493530273, -0.0002665519714355469, 0.0001348257064819336, 0.0005362033843994141, 0.0009375810623168945, 0.001338958740234375, 0.0017403364181518555, 0.002141714096069336, 0.0025430917739868164, 0.002944469451904297, 0.0033458471298217773, 0.003747224807739258, 0.004148602485656738, 0.004549980163574219, 0.004951357841491699, 0.00535273551940918, 0.00575411319732666, 0.006155490875244141, 0.006556868553161621, 0.0069582462310791016, 0.007359623908996582, 0.0077610015869140625, 0.008162379264831543, 0.008563756942749023, 0.008965134620666504, 0.009366512298583984, 0.009767889976501465, 0.010169267654418945, 0.010570645332336426, 0.010972023010253906, 0.011373400688171387, 0.011774778366088867, 0.012176156044006348, 0.012577533721923828, 0.012978911399841309, 0.013380289077758789, 0.01378166675567627, 0.01418304443359375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 2.0, 13.0, 5.0, 8.0, 14.0, 17.0, 26.0, 22.0, 35.0, 38.0, 60.0, 83.0, 86.0, 97.0, 75.0, 88.0, 64.0, 48.0, 45.0, 40.0, 23.0, 25.0, 16.0, 15.0, 15.0, 5.0, 13.0, 1.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.343414306640625, -8.023571968078613, -7.70373010635376, -7.383888244628906, -7.0640459060668945, -6.744204044342041, -6.4243621826171875, -6.104519844055176, -5.784677982330322, -5.464836120605469, -5.144993782043457, -4.8251519203186035, -4.50531005859375, -4.185467720031738, -3.8656258583068848, -3.545783758163452, -3.2259416580200195, -2.906099557876587, -2.5862574577331543, -2.266415596008301, -1.9465734958648682, -1.6267313957214355, -1.3068894147872925, -0.9870474338531494, -0.6672053337097168, -0.34736329317092896, -0.027521252632141113, 0.29232078790664673, 0.6121628284454346, 0.9320049285888672, 1.2518469095230103, 1.5716888904571533, 1.8915300369262695, 2.211372137069702, 2.5312142372131348, 2.8510560989379883, 3.170898199081421, 3.4907402992248535, 3.810582160949707, 4.130424499511719, 4.450266361236572, 4.770108222961426, 5.0899505615234375, 5.409792423248291, 5.7296342849731445, 6.049476623535156, 6.36931848526001, 6.689160346984863, 7.009002685546875, 7.3288445472717285, 7.64868688583374, 7.968528747558594, 8.288371086120605, 8.608213424682617, 8.928054809570312, 9.247897148132324, 9.567739486694336, 9.887581825256348, 10.207423210144043, 10.527265548706055, 10.847107887268066, 11.166950225830078, 11.486791610717773, 11.806633949279785, 12.12647533416748]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 10.0, 4.0, 4.0, 9.0, 8.0, 15.0, 25.0, 21.0, 20.0, 19.0, 23.0, 25.0, 29.0, 30.0, 30.0, 34.0, 39.0, 37.0, 47.0, 51.0, 48.0, 41.0, 56.0, 44.0, 36.0, 47.0, 31.0, 36.0, 34.0, 23.0, 18.0, 11.0, 18.0, 17.0, 22.0, 9.0, 11.0, 8.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.367788314819336, -10.096941947937012, -9.826096534729004, -9.55525016784668, -9.284404754638672, -9.013558387756348, -8.74271297454834, -8.471866607666016, -8.201021194458008, -7.930175304412842, -7.659329414367676, -7.38848352432251, -7.117637634277344, -6.846791744232178, -6.575945854187012, -6.3050994873046875, -6.0342535972595215, -5.7634077072143555, -5.4925618171691895, -5.221715927124023, -4.950870037078857, -4.680024147033691, -4.409177780151367, -4.138332366943359, -3.8674862384796143, -3.5966403484344482, -3.3257944583892822, -3.054948329925537, -2.784102439880371, -2.513256549835205, -2.242410659790039, -1.971564769744873, -1.7007184028625488, -1.4298725128173828, -1.1590266227722168, -0.8881806135177612, -0.6173347234725952, -0.3464888334274292, -0.07564282417297363, 0.19520306587219238, 0.4660489559173584, 0.7368948459625244, 1.0077407360076904, 1.278586745262146, 1.549432635307312, 1.820278525352478, 2.0911245346069336, 2.3619704246520996, 2.6328163146972656, 2.9036622047424316, 3.1745080947875977, 3.4453539848327637, 3.7161998748779297, 3.9870457649230957, 4.257891654968262, 4.528738021850586, 4.799583435058594, 5.07042932510376, 5.341275215148926, 5.612121105194092, 5.882966995239258, 6.153812885284424, 6.42465877532959, 6.695505142211914, 6.96635103225708]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 19.0, 13.0, 27.0, 49.0, 71.0, 128.0, 233.0, 363.0, 509.0, 930.0, 1531.0, 2464.0, 4085.0, 6842.0, 11290.0, 18833.0, 31901.0, 56192.0, 98743.0, 162878.0, 210688.0, 176772.0, 111307.0, 63433.0, 36466.0, 20993.0, 12490.0, 7540.0, 4661.0, 2729.0, 1715.0, 1030.0, 615.0, 386.0, 240.0, 159.0, 78.0, 51.0, 30.0, 19.0, 19.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.609375, -10.22509765625, -9.8408203125, -9.45654296875, -9.072265625, -8.68798828125, -8.3037109375, -7.91943359375, -7.53515625, -7.15087890625, -6.7666015625, -6.38232421875, -5.998046875, -5.61376953125, -5.2294921875, -4.84521484375, -4.4609375, -4.07666015625, -3.6923828125, -3.30810546875, -2.923828125, -2.53955078125, -2.1552734375, -1.77099609375, -1.38671875, -1.00244140625, -0.6181640625, -0.23388671875, 0.150390625, 0.53466796875, 0.9189453125, 1.30322265625, 1.6875, 2.07177734375, 2.4560546875, 2.84033203125, 3.224609375, 3.60888671875, 3.9931640625, 4.37744140625, 4.76171875, 5.14599609375, 5.5302734375, 5.91455078125, 6.298828125, 6.68310546875, 7.0673828125, 7.45166015625, 7.8359375, 8.22021484375, 8.6044921875, 8.98876953125, 9.373046875, 9.75732421875, 10.1416015625, 10.52587890625, 10.91015625, 11.29443359375, 11.6787109375, 12.06298828125, 12.447265625, 12.83154296875, 13.2158203125, 13.60009765625, 13.984375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 4.0, 6.0, 6.0, 14.0, 10.0, 14.0, 19.0, 22.0, 24.0, 28.0, 31.0, 25.0, 30.0, 29.0, 37.0, 27.0, 45.0, 57.0, 50.0, 41.0, 45.0, 46.0, 56.0, 38.0, 45.0, 48.0, 34.0, 30.0, 19.0, 18.0, 17.0, 10.0, 11.0, 13.0, 15.0, 10.0, 13.0, 5.0, 3.0, 7.0, 4.0, 1.0, 1.0], "bins": [-10.4609375, -10.200927734375, -9.94091796875, -9.680908203125, -9.4208984375, -9.160888671875, -8.90087890625, -8.640869140625, -8.380859375, -8.120849609375, -7.86083984375, -7.600830078125, -7.3408203125, -7.080810546875, -6.82080078125, -6.560791015625, -6.30078125, -6.040771484375, -5.78076171875, -5.520751953125, -5.2607421875, -5.000732421875, -4.74072265625, -4.480712890625, -4.220703125, -3.960693359375, -3.70068359375, -3.440673828125, -3.1806640625, -2.920654296875, -2.66064453125, -2.400634765625, -2.140625, -1.880615234375, -1.62060546875, -1.360595703125, -1.1005859375, -0.840576171875, -0.58056640625, -0.320556640625, -0.060546875, 0.199462890625, 0.45947265625, 0.719482421875, 0.9794921875, 1.239501953125, 1.49951171875, 1.759521484375, 2.01953125, 2.279541015625, 2.53955078125, 2.799560546875, 3.0595703125, 3.319580078125, 3.57958984375, 3.839599609375, 4.099609375, 4.359619140625, 4.61962890625, 4.879638671875, 5.1396484375, 5.399658203125, 5.65966796875, 5.919677734375, 6.1796875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 8.0, 15.0, 18.0, 27.0, 29.0, 62.0, 78.0, 152.0, 202.0, 306.0, 401.0, 560.0, 916.0, 1295.0, 1987.0, 2797.0, 4190.0, 6395.0, 9302.0, 13900.0, 20975.0, 31371.0, 47465.0, 71703.0, 107193.0, 146266.0, 162519.0, 134736.0, 95122.0, 63132.0, 41797.0, 27546.0, 18476.0, 12332.0, 8232.0, 5484.0, 3696.0, 2515.0, 1779.0, 1204.0, 741.0, 525.0, 342.0, 251.0, 152.0, 119.0, 77.0, 53.0, 37.0, 24.0, 19.0, 12.0, 11.0, 8.0, 1.0, 2.0, 3.0, 2.0], "bins": [-9.5703125, -9.2744140625, -8.978515625, -8.6826171875, -8.38671875, -8.0908203125, -7.794921875, -7.4990234375, -7.203125, -6.9072265625, -6.611328125, -6.3154296875, -6.01953125, -5.7236328125, -5.427734375, -5.1318359375, -4.8359375, -4.5400390625, -4.244140625, -3.9482421875, -3.65234375, -3.3564453125, -3.060546875, -2.7646484375, -2.46875, -2.1728515625, -1.876953125, -1.5810546875, -1.28515625, -0.9892578125, -0.693359375, -0.3974609375, -0.1015625, 0.1943359375, 0.490234375, 0.7861328125, 1.08203125, 1.3779296875, 1.673828125, 1.9697265625, 2.265625, 2.5615234375, 2.857421875, 3.1533203125, 3.44921875, 3.7451171875, 4.041015625, 4.3369140625, 4.6328125, 4.9287109375, 5.224609375, 5.5205078125, 5.81640625, 6.1123046875, 6.408203125, 6.7041015625, 7.0, 7.2958984375, 7.591796875, 7.8876953125, 8.18359375, 8.4794921875, 8.775390625, 9.0712890625, 9.3671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 6.0, 5.0, 11.0, 8.0, 12.0, 9.0, 15.0, 18.0, 12.0, 25.0, 29.0, 25.0, 30.0, 20.0, 29.0, 31.0, 38.0, 40.0, 27.0, 40.0, 43.0, 37.0, 42.0, 37.0, 36.0, 33.0, 33.0, 33.0, 20.0, 31.0, 39.0, 30.0, 27.0, 19.0, 15.0, 18.0, 11.0, 12.0, 13.0, 10.0, 5.0, 3.0, 1.0, 5.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48828125, -4.345947265625, -4.20361328125, -4.061279296875, -3.9189453125, -3.776611328125, -3.63427734375, -3.491943359375, -3.349609375, -3.207275390625, -3.06494140625, -2.922607421875, -2.7802734375, -2.637939453125, -2.49560546875, -2.353271484375, -2.2109375, -2.068603515625, -1.92626953125, -1.783935546875, -1.6416015625, -1.499267578125, -1.35693359375, -1.214599609375, -1.072265625, -0.929931640625, -0.78759765625, -0.645263671875, -0.5029296875, -0.360595703125, -0.21826171875, -0.075927734375, 0.06640625, 0.208740234375, 0.35107421875, 0.493408203125, 0.6357421875, 0.778076171875, 0.92041015625, 1.062744140625, 1.205078125, 1.347412109375, 1.48974609375, 1.632080078125, 1.7744140625, 1.916748046875, 2.05908203125, 2.201416015625, 2.34375, 2.486083984375, 2.62841796875, 2.770751953125, 2.9130859375, 3.055419921875, 3.19775390625, 3.340087890625, 3.482421875, 3.624755859375, 3.76708984375, 3.909423828125, 4.0517578125, 4.194091796875, 4.33642578125, 4.478759765625, 4.62109375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 15.0, 15.0, 21.0, 23.0, 29.0, 45.0, 85.0, 146.0, 206.0, 318.0, 452.0, 748.0, 1055.0, 1724.0, 2572.0, 4163.0, 6599.0, 10944.0, 18841.0, 35145.0, 81238.0, 288443.0, 399616.0, 101092.0, 41343.0, 21321.0, 12200.0, 7420.0, 4463.0, 2912.0, 1867.0, 1212.0, 787.0, 503.0, 310.0, 222.0, 160.0, 105.0, 72.0, 37.0, 31.0, 16.0, 13.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.859375, -5.6580810546875, -5.456787109375, -5.2554931640625, -5.05419921875, -4.8529052734375, -4.651611328125, -4.4503173828125, -4.2490234375, -4.0477294921875, -3.846435546875, -3.6451416015625, -3.44384765625, -3.2425537109375, -3.041259765625, -2.8399658203125, -2.638671875, -2.4373779296875, -2.236083984375, -2.0347900390625, -1.83349609375, -1.6322021484375, -1.430908203125, -1.2296142578125, -1.0283203125, -0.8270263671875, -0.625732421875, -0.4244384765625, -0.22314453125, -0.0218505859375, 0.179443359375, 0.3807373046875, 0.58203125, 0.7833251953125, 0.984619140625, 1.1859130859375, 1.38720703125, 1.5885009765625, 1.789794921875, 1.9910888671875, 2.1923828125, 2.3936767578125, 2.594970703125, 2.7962646484375, 2.99755859375, 3.1988525390625, 3.400146484375, 3.6014404296875, 3.802734375, 4.0040283203125, 4.205322265625, 4.4066162109375, 4.60791015625, 4.8092041015625, 5.010498046875, 5.2117919921875, 5.4130859375, 5.6143798828125, 5.815673828125, 6.0169677734375, 6.21826171875, 6.4195556640625, 6.620849609375, 6.8221435546875, 7.0234375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 6.0, 6.0, 7.0, 10.0, 17.0, 12.0, 24.0, 13.0, 22.0, 31.0, 65.0, 65.0, 90.0, 93.0, 118.0, 91.0, 84.0, 52.0, 50.0, 27.0, 22.0, 19.0, 13.0, 10.0, 9.0, 6.0, 6.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002529621124267578, -0.00024423748254776, -0.0002355128526687622, -0.0002267882227897644, -0.0002180635929107666, -0.0002093389630317688, -0.000200614333152771, -0.0001918897032737732, -0.0001831650733947754, -0.0001744404435157776, -0.00016571581363677979, -0.00015699118375778198, -0.00014826655387878418, -0.00013954192399978638, -0.00013081729412078857, -0.00012209266424179077, -0.00011336803436279297, -0.00010464340448379517, -9.591877460479736e-05, -8.719414472579956e-05, -7.846951484680176e-05, -6.974488496780396e-05, -6.102025508880615e-05, -5.229562520980835e-05, -4.357099533081055e-05, -3.4846365451812744e-05, -2.612173557281494e-05, -1.739710569381714e-05, -8.672475814819336e-06, 5.21540641784668e-08, 8.77678394317627e-06, 1.7501413822174072e-05, 2.6226043701171875e-05, 3.495067358016968e-05, 4.367530345916748e-05, 5.239993333816528e-05, 6.112456321716309e-05, 6.984919309616089e-05, 7.857382297515869e-05, 8.72984528541565e-05, 9.60230827331543e-05, 0.0001047477126121521, 0.0001134723424911499, 0.0001221969723701477, 0.0001309216022491455, 0.0001396462321281433, 0.0001483708620071411, 0.00015709549188613892, 0.00016582012176513672, 0.00017454475164413452, 0.00018326938152313232, 0.00019199401140213013, 0.00020071864128112793, 0.00020944327116012573, 0.00021816790103912354, 0.00022689253091812134, 0.00023561716079711914, 0.00024434179067611694, 0.00025306642055511475, 0.00026179105043411255, 0.00027051568031311035, 0.00027924031019210815, 0.00028796494007110596, 0.00029668956995010376, 0.00030541419982910156]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 11.0, 15.0, 18.0, 26.0, 36.0, 41.0, 71.0, 89.0, 135.0, 196.0, 280.0, 411.0, 582.0, 862.0, 1210.0, 1905.0, 2646.0, 4143.0, 6815.0, 11062.0, 18948.0, 34893.0, 70774.0, 185979.0, 427604.0, 144863.0, 60157.0, 30517.0, 16763.0, 9791.0, 5988.0, 3757.0, 2612.0, 1652.0, 1189.0, 798.0, 522.0, 354.0, 251.0, 168.0, 127.0, 92.0, 68.0, 42.0, 28.0, 21.0, 14.0, 8.0, 10.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.9453125, -4.7825927734375, -4.619873046875, -4.4571533203125, -4.29443359375, -4.1317138671875, -3.968994140625, -3.8062744140625, -3.6435546875, -3.4808349609375, -3.318115234375, -3.1553955078125, -2.99267578125, -2.8299560546875, -2.667236328125, -2.5045166015625, -2.341796875, -2.1790771484375, -2.016357421875, -1.8536376953125, -1.69091796875, -1.5281982421875, -1.365478515625, -1.2027587890625, -1.0400390625, -0.8773193359375, -0.714599609375, -0.5518798828125, -0.38916015625, -0.2264404296875, -0.063720703125, 0.0989990234375, 0.26171875, 0.4244384765625, 0.587158203125, 0.7498779296875, 0.91259765625, 1.0753173828125, 1.238037109375, 1.4007568359375, 1.5634765625, 1.7261962890625, 1.888916015625, 2.0516357421875, 2.21435546875, 2.3770751953125, 2.539794921875, 2.7025146484375, 2.865234375, 3.0279541015625, 3.190673828125, 3.3533935546875, 3.51611328125, 3.6788330078125, 3.841552734375, 4.0042724609375, 4.1669921875, 4.3297119140625, 4.492431640625, 4.6551513671875, 4.81787109375, 4.9805908203125, 5.143310546875, 5.3060302734375, 5.46875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 6.0, 7.0, 9.0, 9.0, 11.0, 9.0, 11.0, 16.0, 19.0, 26.0, 37.0, 46.0, 49.0, 52.0, 47.0, 94.0, 85.0, 79.0, 69.0, 46.0, 44.0, 46.0, 30.0, 33.0, 20.0, 20.0, 18.0, 6.0, 10.0, 6.0, 9.0, 3.0, 5.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.552734375, -1.5006866455078125, -1.448638916015625, -1.3965911865234375, -1.34454345703125, -1.2924957275390625, -1.240447998046875, -1.1884002685546875, -1.1363525390625, -1.0843048095703125, -1.032257080078125, -0.9802093505859375, -0.92816162109375, -0.8761138916015625, -0.824066162109375, -0.7720184326171875, -0.719970703125, -0.6679229736328125, -0.615875244140625, -0.5638275146484375, -0.51177978515625, -0.4597320556640625, -0.407684326171875, -0.3556365966796875, -0.3035888671875, -0.2515411376953125, -0.199493408203125, -0.1474456787109375, -0.09539794921875, -0.0433502197265625, 0.008697509765625, 0.0607452392578125, 0.11279296875, 0.1648406982421875, 0.216888427734375, 0.2689361572265625, 0.32098388671875, 0.3730316162109375, 0.425079345703125, 0.4771270751953125, 0.5291748046875, 0.5812225341796875, 0.633270263671875, 0.6853179931640625, 0.73736572265625, 0.7894134521484375, 0.841461181640625, 0.8935089111328125, 0.945556640625, 0.9976043701171875, 1.049652099609375, 1.1016998291015625, 1.15374755859375, 1.2057952880859375, 1.257843017578125, 1.3098907470703125, 1.3619384765625, 1.4139862060546875, 1.466033935546875, 1.5180816650390625, 1.57012939453125, 1.6221771240234375, 1.674224853515625, 1.7262725830078125, 1.7783203125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 5.0, 7.0, 7.0, 7.0, 7.0, 21.0, 13.0, 28.0, 34.0, 35.0, 50.0, 80.0, 76.0, 85.0, 94.0, 63.0, 82.0, 50.0, 46.0, 33.0, 43.0, 31.0, 24.0, 13.0, 9.0, 14.0, 12.0, 5.0, 10.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.378427505493164, -10.06989574432373, -9.761363983154297, -9.452832221984863, -9.14430046081543, -8.835769653320312, -8.527236938476562, -8.218706130981445, -7.910174369812012, -7.601642608642578, -7.2931108474731445, -6.984579086303711, -6.6760478019714355, -6.367516040802002, -6.058984279632568, -5.750452995300293, -5.441920757293701, -5.133388996124268, -4.824857234954834, -4.516325950622559, -4.207794189453125, -3.8992624282836914, -3.590730667114258, -3.2821991443634033, -2.9736673831939697, -2.665135622024536, -2.3566040992736816, -2.048072338104248, -1.739540696144104, -1.43100905418396, -1.1224772930145264, -0.8139457702636719, -0.5054140090942383, -0.19688233733177185, 0.11164933443069458, 0.4201810359954834, 0.7287126779556274, 1.0372443199157715, 1.345776081085205, 1.6543076038360596, 1.9628393650054932, 2.2713711261749268, 2.5799026489257812, 2.888434410095215, 3.1969661712646484, 3.505497694015503, 3.8140294551849365, 4.122560977935791, 4.431092739105225, 4.739624500274658, 5.048156261444092, 5.356687545776367, 5.665219306945801, 5.973751068115234, 6.282282829284668, 6.590814590454102, 6.899346351623535, 7.207878112792969, 7.516409873962402, 7.824941635131836, 8.13347339630127, 8.442005157470703, 8.75053596496582, 9.059067726135254, 9.367599487304688]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 7.0, 8.0, 10.0, 13.0, 14.0, 14.0, 16.0, 17.0, 19.0, 25.0, 29.0, 23.0, 20.0, 23.0, 28.0, 34.0, 39.0, 36.0, 41.0, 48.0, 29.0, 29.0, 39.0, 45.0, 22.0, 27.0, 46.0, 30.0, 36.0, 31.0, 34.0, 22.0, 17.0, 22.0, 14.0, 13.0, 8.0, 12.0, 10.0, 8.0, 4.0, 7.0, 6.0, 3.0, 6.0, 7.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-7.546819686889648, -7.3178791999816895, -7.088938236236572, -6.859997749328613, -6.631056785583496, -6.402116298675537, -6.173175811767578, -5.944234848022461, -5.715293884277344, -5.486353397369385, -5.257412433624268, -5.028471946716309, -4.799530982971191, -4.570590496063232, -4.341650009155273, -4.112709045410156, -3.8837685585021973, -3.654827833175659, -3.425887107849121, -3.196946620941162, -2.968005657196045, -2.739065170288086, -2.510124444961548, -2.2811837196350098, -2.0522429943084717, -1.8233022689819336, -1.5943615436553955, -1.365420937538147, -1.1364802122116089, -0.9075394868850708, -0.6785988807678223, -0.4496581554412842, -0.2207179069519043, 0.008222788572311401, 0.2371634840965271, 0.4661041498184204, 0.6950448751449585, 0.9239856004714966, 1.1529262065887451, 1.3818669319152832, 1.6108076572418213, 1.8397483825683594, 2.0686891078948975, 2.2976298332214355, 2.5265703201293945, 2.7555112838745117, 2.9844517707824707, 3.213392496109009, 3.442333221435547, 3.671273946762085, 3.900214672088623, 4.129155158996582, 4.358096122741699, 4.587036609649658, 4.815977096557617, 5.044918060302734, 5.273859024047852, 5.5027995109558105, 5.731740474700928, 5.960680961608887, 6.189621925354004, 6.418562412261963, 6.647502899169922, 6.876443862915039, 7.105384349822998]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 14.0, 23.0, 21.0, 31.0, 43.0, 76.0, 116.0, 160.0, 243.0, 333.0, 546.0, 876.0, 1333.0, 2106.0, 3183.0, 4983.0, 7888.0, 12466.0, 20078.0, 32073.0, 53869.0, 94197.0, 181271.0, 411947.0, 985530.0, 1214528.0, 613738.0, 248829.0, 124270.0, 70321.0, 41256.0, 24892.0, 15614.0, 9645.0, 6192.0, 4135.0, 2559.0, 1657.0, 1069.0, 737.0, 479.0, 348.0, 217.0, 131.0, 91.0, 59.0, 40.0, 26.0, 16.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0], "bins": [-9.90625, -9.6080322265625, -9.309814453125, -9.0115966796875, -8.71337890625, -8.4151611328125, -8.116943359375, -7.8187255859375, -7.5205078125, -7.2222900390625, -6.924072265625, -6.6258544921875, -6.32763671875, -6.0294189453125, -5.731201171875, -5.4329833984375, -5.134765625, -4.8365478515625, -4.538330078125, -4.2401123046875, -3.94189453125, -3.6436767578125, -3.345458984375, -3.0472412109375, -2.7490234375, -2.4508056640625, -2.152587890625, -1.8543701171875, -1.55615234375, -1.2579345703125, -0.959716796875, -0.6614990234375, -0.36328125, -0.0650634765625, 0.233154296875, 0.5313720703125, 0.82958984375, 1.1278076171875, 1.426025390625, 1.7242431640625, 2.0224609375, 2.3206787109375, 2.618896484375, 2.9171142578125, 3.21533203125, 3.5135498046875, 3.811767578125, 4.1099853515625, 4.408203125, 4.7064208984375, 5.004638671875, 5.3028564453125, 5.60107421875, 5.8992919921875, 6.197509765625, 6.4957275390625, 6.7939453125, 7.0921630859375, 7.390380859375, 7.6885986328125, 7.98681640625, 8.2850341796875, 8.583251953125, 8.8814697265625, 9.1796875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 7.0, 11.0, 17.0, 17.0, 16.0, 17.0, 17.0, 25.0, 23.0, 31.0, 23.0, 35.0, 31.0, 31.0, 41.0, 52.0, 45.0, 35.0, 42.0, 36.0, 39.0, 33.0, 38.0, 37.0, 46.0, 29.0, 28.0, 20.0, 30.0, 19.0, 21.0, 15.0, 12.0, 11.0, 9.0, 7.0, 6.0, 9.0, 6.0, 5.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-7.1484375, -6.9451904296875, -6.741943359375, -6.5386962890625, -6.33544921875, -6.1322021484375, -5.928955078125, -5.7257080078125, -5.5224609375, -5.3192138671875, -5.115966796875, -4.9127197265625, -4.70947265625, -4.5062255859375, -4.302978515625, -4.0997314453125, -3.896484375, -3.6932373046875, -3.489990234375, -3.2867431640625, -3.08349609375, -2.8802490234375, -2.677001953125, -2.4737548828125, -2.2705078125, -2.0672607421875, -1.864013671875, -1.6607666015625, -1.45751953125, -1.2542724609375, -1.051025390625, -0.8477783203125, -0.64453125, -0.4412841796875, -0.238037109375, -0.0347900390625, 0.16845703125, 0.3717041015625, 0.574951171875, 0.7781982421875, 0.9814453125, 1.1846923828125, 1.387939453125, 1.5911865234375, 1.79443359375, 1.9976806640625, 2.200927734375, 2.4041748046875, 2.607421875, 2.8106689453125, 3.013916015625, 3.2171630859375, 3.42041015625, 3.6236572265625, 3.826904296875, 4.0301513671875, 4.2333984375, 4.4366455078125, 4.639892578125, 4.8431396484375, 5.04638671875, 5.2496337890625, 5.452880859375, 5.6561279296875, 5.859375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 10.0, 10.0, 16.0, 23.0, 48.0, 59.0, 99.0, 109.0, 211.0, 289.0, 486.0, 727.0, 1060.0, 1596.0, 2414.0, 3882.0, 5946.0, 9529.0, 15461.0, 25425.0, 42343.0, 74074.0, 130770.0, 240165.0, 456724.0, 866671.0, 1027700.0, 590356.0, 307458.0, 165520.0, 91583.0, 52577.0, 30932.0, 18442.0, 11426.0, 7164.0, 4479.0, 2906.0, 1881.0, 1205.0, 844.0, 567.0, 353.0, 261.0, 155.0, 120.0, 69.0, 51.0, 34.0, 14.0, 17.0, 13.0, 10.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.5750732421875, -7.306396484375, -7.0377197265625, -6.76904296875, -6.5003662109375, -6.231689453125, -5.9630126953125, -5.6943359375, -5.4256591796875, -5.156982421875, -4.8883056640625, -4.61962890625, -4.3509521484375, -4.082275390625, -3.8135986328125, -3.544921875, -3.2762451171875, -3.007568359375, -2.7388916015625, -2.47021484375, -2.2015380859375, -1.932861328125, -1.6641845703125, -1.3955078125, -1.1268310546875, -0.858154296875, -0.5894775390625, -0.32080078125, -0.0521240234375, 0.216552734375, 0.4852294921875, 0.75390625, 1.0225830078125, 1.291259765625, 1.5599365234375, 1.82861328125, 2.0972900390625, 2.365966796875, 2.6346435546875, 2.9033203125, 3.1719970703125, 3.440673828125, 3.7093505859375, 3.97802734375, 4.2467041015625, 4.515380859375, 4.7840576171875, 5.052734375, 5.3214111328125, 5.590087890625, 5.8587646484375, 6.12744140625, 6.3961181640625, 6.664794921875, 6.9334716796875, 7.2021484375, 7.4708251953125, 7.739501953125, 8.0081787109375, 8.27685546875, 8.5455322265625, 8.814208984375, 9.0828857421875, 9.3515625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 10.0, 8.0, 10.0, 16.0, 13.0, 25.0, 40.0, 41.0, 52.0, 42.0, 83.0, 78.0, 102.0, 134.0, 156.0, 162.0, 177.0, 183.0, 232.0, 273.0, 279.0, 264.0, 236.0, 211.0, 183.0, 171.0, 151.0, 123.0, 107.0, 88.0, 78.0, 49.0, 55.0, 44.0, 42.0, 38.0, 18.0, 12.0, 18.0, 6.0, 16.0, 9.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.041015625, -2.94140625, -2.841796875, -2.7421875, -2.642578125, -2.54296875, -2.443359375, -2.34375, -2.244140625, -2.14453125, -2.044921875, -1.9453125, -1.845703125, -1.74609375, -1.646484375, -1.546875, -1.447265625, -1.34765625, -1.248046875, -1.1484375, -1.048828125, -0.94921875, -0.849609375, -0.75, -0.650390625, -0.55078125, -0.451171875, -0.3515625, -0.251953125, -0.15234375, -0.052734375, 0.046875, 0.146484375, 0.24609375, 0.345703125, 0.4453125, 0.544921875, 0.64453125, 0.744140625, 0.84375, 0.943359375, 1.04296875, 1.142578125, 1.2421875, 1.341796875, 1.44140625, 1.541015625, 1.640625, 1.740234375, 1.83984375, 1.939453125, 2.0390625, 2.138671875, 2.23828125, 2.337890625, 2.4375, 2.537109375, 2.63671875, 2.736328125, 2.8359375, 2.935546875, 3.03515625, 3.134765625, 3.234375, 3.333984375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 7.0, 7.0, 10.0, 19.0, 15.0, 18.0, 23.0, 32.0, 34.0, 46.0, 50.0, 57.0, 79.0, 71.0, 76.0, 62.0, 61.0, 48.0, 46.0, 33.0, 36.0, 28.0, 31.0, 25.0, 9.0, 9.0, 5.0, 9.0, 5.0, 6.0, 12.0, 6.0, 2.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6175537109375, -8.372597694396973, -8.127640724182129, -7.882684707641602, -7.637728214263916, -7.3927717208862305, -7.147815704345703, -6.902859210968018, -6.657902717590332, -6.4129462242126465, -6.167989730834961, -5.923033714294434, -5.678077220916748, -5.4331207275390625, -5.188164710998535, -4.94320821762085, -4.698251724243164, -4.4532952308654785, -4.208338737487793, -3.9633827209472656, -3.71842622756958, -3.4734697341918945, -3.228513479232788, -2.9835572242736816, -2.738600730895996, -2.4936442375183105, -2.248687982559204, -2.0037317276000977, -1.758775234222412, -1.5138188600540161, -1.2688624858856201, -1.0239061117172241, -0.7789492607116699, -0.5339928865432739, -0.28903651237487793, -0.044080138206481934, 0.20087623596191406, 0.44583261013031006, 0.690788984298706, 0.935745358467102, 1.180701732635498, 1.425658106803894, 1.67061448097229, 1.915570855140686, 2.160527229309082, 2.4054837226867676, 2.650439977645874, 2.8953962326049805, 3.140352725982666, 3.3853092193603516, 3.630265474319458, 3.8752217292785645, 4.12017822265625, 4.3651347160339355, 4.610091209411621, 4.855047225952148, 5.100003719329834, 5.3449602127075195, 5.589916229248047, 5.834872722625732, 6.079829216003418, 6.3247857093811035, 6.569742202758789, 6.814698219299316, 7.059654712677002]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 11.0, 14.0, 12.0, 14.0, 14.0, 19.0, 13.0, 26.0, 30.0, 29.0, 29.0, 40.0, 29.0, 40.0, 37.0, 49.0, 44.0, 38.0, 44.0, 39.0, 36.0, 46.0, 32.0, 47.0, 33.0, 37.0, 26.0, 13.0, 23.0, 23.0, 17.0, 13.0, 17.0, 12.0, 8.0, 9.0, 14.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.602009296417236, -7.371581554412842, -7.1411542892456055, -6.910726547241211, -6.680299282073975, -6.44987154006958, -6.219444274902344, -5.989016532897949, -5.758588790893555, -5.52816104888916, -5.297733783721924, -5.067306041717529, -4.836878776550293, -4.606451034545898, -4.376023292541504, -4.145596027374268, -3.9151687622070312, -3.684741258621216, -3.4543137550354004, -3.223886013031006, -2.9934587478637695, -2.763031005859375, -2.5326035022735596, -2.302175998687744, -2.0717484951019287, -1.8413209915161133, -1.6108934879302979, -1.3804658651351929, -1.1500383615493774, -0.919610857963562, -0.689183235168457, -0.4587557315826416, -0.22832870483398438, 0.0020988285541534424, 0.23252636194229126, 0.46295392513275146, 0.6933814287185669, 0.9238089323043823, 1.1542365550994873, 1.3846640586853027, 1.6150915622711182, 1.8455190658569336, 2.075946569442749, 2.3063740730285645, 2.536801815032959, 2.7672290802001953, 2.99765682220459, 3.2280843257904053, 3.4585118293762207, 3.688939332962036, 3.9193668365478516, 4.149794578552246, 4.380221843719482, 4.610649585723877, 4.841076850891113, 5.071504592895508, 5.301932334899902, 5.532360076904297, 5.762787342071533, 5.993215084075928, 6.223642349243164, 6.454070091247559, 6.684497833251953, 6.9149250984191895, 7.145352363586426]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 7.0, 9.0, 23.0, 19.0, 31.0, 51.0, 68.0, 108.0, 150.0, 240.0, 365.0, 633.0, 921.0, 1450.0, 2260.0, 3634.0, 5545.0, 8729.0, 14036.0, 22411.0, 36016.0, 58036.0, 93828.0, 149282.0, 220972.0, 162064.0, 100674.0, 62899.0, 38800.0, 24274.0, 15078.0, 9308.0, 5996.0, 3869.0, 2410.0, 1497.0, 1004.0, 642.0, 444.0, 251.0, 192.0, 96.0, 85.0, 41.0, 40.0, 32.0, 18.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.009765625, -2.914459228515625, -2.81915283203125, -2.723846435546875, -2.6285400390625, -2.533233642578125, -2.43792724609375, -2.342620849609375, -2.247314453125, -2.152008056640625, -2.05670166015625, -1.961395263671875, -1.8660888671875, -1.770782470703125, -1.67547607421875, -1.580169677734375, -1.48486328125, -1.389556884765625, -1.29425048828125, -1.198944091796875, -1.1036376953125, -1.008331298828125, -0.91302490234375, -0.817718505859375, -0.722412109375, -0.627105712890625, -0.53179931640625, -0.436492919921875, -0.3411865234375, -0.245880126953125, -0.15057373046875, -0.055267333984375, 0.0400390625, 0.135345458984375, 0.23065185546875, 0.325958251953125, 0.4212646484375, 0.516571044921875, 0.61187744140625, 0.707183837890625, 0.802490234375, 0.897796630859375, 0.99310302734375, 1.088409423828125, 1.1837158203125, 1.279022216796875, 1.37432861328125, 1.469635009765625, 1.56494140625, 1.660247802734375, 1.75555419921875, 1.850860595703125, 1.9461669921875, 2.041473388671875, 2.13677978515625, 2.232086181640625, 2.327392578125, 2.422698974609375, 2.51800537109375, 2.613311767578125, 2.7086181640625, 2.803924560546875, 2.89923095703125, 2.994537353515625, 3.08984375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 13.0, 5.0, 13.0, 15.0, 16.0, 16.0, 22.0, 15.0, 29.0, 29.0, 37.0, 28.0, 44.0, 34.0, 34.0, 42.0, 48.0, 38.0, 40.0, 50.0, 52.0, 42.0, 26.0, 37.0, 37.0, 26.0, 28.0, 17.0, 27.0, 17.0, 19.0, 15.0, 12.0, 12.0, 8.0, 11.0, 8.0, 8.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.2890625, -7.0560302734375, -6.822998046875, -6.5899658203125, -6.35693359375, -6.1239013671875, -5.890869140625, -5.6578369140625, -5.4248046875, -5.1917724609375, -4.958740234375, -4.7257080078125, -4.49267578125, -4.2596435546875, -4.026611328125, -3.7935791015625, -3.560546875, -3.3275146484375, -3.094482421875, -2.8614501953125, -2.62841796875, -2.3953857421875, -2.162353515625, -1.9293212890625, -1.6962890625, -1.4632568359375, -1.230224609375, -0.9971923828125, -0.76416015625, -0.5311279296875, -0.298095703125, -0.0650634765625, 0.16796875, 0.4010009765625, 0.634033203125, 0.8670654296875, 1.10009765625, 1.3331298828125, 1.566162109375, 1.7991943359375, 2.0322265625, 2.2652587890625, 2.498291015625, 2.7313232421875, 2.96435546875, 3.1973876953125, 3.430419921875, 3.6634521484375, 3.896484375, 4.1295166015625, 4.362548828125, 4.5955810546875, 4.82861328125, 5.0616455078125, 5.294677734375, 5.5277099609375, 5.7607421875, 5.9937744140625, 6.226806640625, 6.4598388671875, 6.69287109375, 6.9259033203125, 7.158935546875, 7.3919677734375, 7.625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 10.0, 23.0, 28.0, 46.0, 64.0, 110.0, 175.0, 238.0, 408.0, 627.0, 982.0, 1567.0, 2743.0, 4575.0, 7829.0, 14223.0, 26071.0, 49469.0, 96608.0, 201804.0, 319020.0, 156102.0, 77114.0, 39636.0, 21051.0, 11585.0, 6634.0, 3782.0, 2285.0, 1348.0, 871.0, 543.0, 326.0, 223.0, 139.0, 91.0, 64.0, 47.0, 30.0, 14.0, 14.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.44140625, -4.315704345703125, -4.19000244140625, -4.064300537109375, -3.9385986328125, -3.812896728515625, -3.68719482421875, -3.561492919921875, -3.435791015625, -3.310089111328125, -3.18438720703125, -3.058685302734375, -2.9329833984375, -2.807281494140625, -2.68157958984375, -2.555877685546875, -2.43017578125, -2.304473876953125, -2.17877197265625, -2.053070068359375, -1.9273681640625, -1.801666259765625, -1.67596435546875, -1.550262451171875, -1.424560546875, -1.298858642578125, -1.17315673828125, -1.047454833984375, -0.9217529296875, -0.796051025390625, -0.67034912109375, -0.544647216796875, -0.4189453125, -0.293243408203125, -0.16754150390625, -0.041839599609375, 0.0838623046875, 0.209564208984375, 0.33526611328125, 0.460968017578125, 0.586669921875, 0.712371826171875, 0.83807373046875, 0.963775634765625, 1.0894775390625, 1.215179443359375, 1.34088134765625, 1.466583251953125, 1.59228515625, 1.717987060546875, 1.84368896484375, 1.969390869140625, 2.0950927734375, 2.220794677734375, 2.34649658203125, 2.472198486328125, 2.597900390625, 2.723602294921875, 2.84930419921875, 2.975006103515625, 3.1007080078125, 3.226409912109375, 3.35211181640625, 3.477813720703125, 3.603515625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 11.0, 5.0, 6.0, 19.0, 16.0, 17.0, 22.0, 22.0, 25.0, 27.0, 35.0, 47.0, 30.0, 38.0, 48.0, 34.0, 40.0, 32.0, 38.0, 38.0, 41.0, 39.0, 27.0, 42.0, 37.0, 31.0, 31.0, 31.0, 28.0, 16.0, 15.0, 16.0, 23.0, 7.0, 9.0, 11.0, 6.0, 2.0, 4.0, 4.0, 3.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.68359375, -4.53973388671875, -4.3958740234375, -4.25201416015625, -4.108154296875, -3.96429443359375, -3.8204345703125, -3.67657470703125, -3.53271484375, -3.38885498046875, -3.2449951171875, -3.10113525390625, -2.957275390625, -2.81341552734375, -2.6695556640625, -2.52569580078125, -2.3818359375, -2.23797607421875, -2.0941162109375, -1.95025634765625, -1.806396484375, -1.66253662109375, -1.5186767578125, -1.37481689453125, -1.23095703125, -1.08709716796875, -0.9432373046875, -0.79937744140625, -0.655517578125, -0.51165771484375, -0.3677978515625, -0.22393798828125, -0.080078125, 0.06378173828125, 0.2076416015625, 0.35150146484375, 0.495361328125, 0.63922119140625, 0.7830810546875, 0.92694091796875, 1.07080078125, 1.21466064453125, 1.3585205078125, 1.50238037109375, 1.646240234375, 1.79010009765625, 1.9339599609375, 2.07781982421875, 2.2216796875, 2.36553955078125, 2.5093994140625, 2.65325927734375, 2.797119140625, 2.94097900390625, 3.0848388671875, 3.22869873046875, 3.37255859375, 3.51641845703125, 3.6602783203125, 3.80413818359375, 3.947998046875, 4.09185791015625, 4.2357177734375, 4.37957763671875, 4.5234375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 10.0, 20.0, 25.0, 35.0, 41.0, 79.0, 116.0, 153.0, 267.0, 400.0, 727.0, 1208.0, 2449.0, 5237.0, 12393.0, 35397.0, 131979.0, 593054.0, 190937.0, 45814.0, 15488.0, 6332.0, 2897.0, 1433.0, 788.0, 469.0, 259.0, 183.0, 115.0, 79.0, 53.0, 37.0, 24.0, 18.0, 9.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.06353759765625, -0.06158924102783203, -0.05964088439941406, -0.057692527770996094, -0.055744171142578125, -0.053795814514160156, -0.05184745788574219, -0.04989910125732422, -0.04795074462890625, -0.04600238800048828, -0.04405403137207031, -0.042105674743652344, -0.040157318115234375, -0.038208961486816406, -0.03626060485839844, -0.03431224822998047, -0.0323638916015625, -0.03041553497314453, -0.028467178344726562, -0.026518821716308594, -0.024570465087890625, -0.022622108459472656, -0.020673751831054688, -0.01872539520263672, -0.01677703857421875, -0.014828681945800781, -0.012880325317382812, -0.010931968688964844, -0.008983612060546875, -0.007035255432128906, -0.0050868988037109375, -0.0031385421752929688, -0.001190185546875, 0.0007581710815429688, 0.0027065277099609375, 0.004654884338378906, 0.006603240966796875, 0.008551597595214844, 0.010499954223632812, 0.012448310852050781, 0.01439666748046875, 0.01634502410888672, 0.018293380737304688, 0.020241737365722656, 0.022190093994140625, 0.024138450622558594, 0.026086807250976562, 0.02803516387939453, 0.0299835205078125, 0.03193187713623047, 0.03388023376464844, 0.035828590393066406, 0.037776947021484375, 0.039725303649902344, 0.04167366027832031, 0.04362201690673828, 0.04557037353515625, 0.04751873016357422, 0.04946708679199219, 0.051415443420410156, 0.053363800048828125, 0.055312156677246094, 0.05726051330566406, 0.05920886993408203, 0.0611572265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 5.0, 13.0, 20.0, 31.0, 26.0, 45.0, 55.0, 90.0, 121.0, 130.0, 116.0, 98.0, 78.0, 47.0, 41.0, 22.0, 8.0, 10.0, 5.0, 9.0, 9.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.5987625122070312e-05, -2.531241625547409e-05, -2.463720738887787e-05, -2.3961998522281647e-05, -2.3286789655685425e-05, -2.2611580789089203e-05, -2.193637192249298e-05, -2.126116305589676e-05, -2.0585954189300537e-05, -1.9910745322704315e-05, -1.9235536456108093e-05, -1.856032758951187e-05, -1.788511872291565e-05, -1.7209909856319427e-05, -1.6534700989723206e-05, -1.5859492123126984e-05, -1.5184283256530762e-05, -1.450907438993454e-05, -1.3833865523338318e-05, -1.3158656656742096e-05, -1.2483447790145874e-05, -1.1808238923549652e-05, -1.113303005695343e-05, -1.0457821190357208e-05, -9.782612323760986e-06, -9.107403457164764e-06, -8.432194590568542e-06, -7.75698572397232e-06, -7.081776857376099e-06, -6.406567990779877e-06, -5.731359124183655e-06, -5.056150257587433e-06, -4.380941390991211e-06, -3.705732524394989e-06, -3.030523657798767e-06, -2.355314791202545e-06, -1.6801059246063232e-06, -1.0048970580101013e-06, -3.296881914138794e-07, 3.4552067518234253e-07, 1.0207295417785645e-06, 1.6959384083747864e-06, 2.3711472749710083e-06, 3.0463561415672302e-06, 3.721565008163452e-06, 4.396773874759674e-06, 5.071982741355896e-06, 5.747191607952118e-06, 6.42240047454834e-06, 7.097609341144562e-06, 7.772818207740784e-06, 8.448027074337006e-06, 9.123235940933228e-06, 9.79844480752945e-06, 1.0473653674125671e-05, 1.1148862540721893e-05, 1.1824071407318115e-05, 1.2499280273914337e-05, 1.3174489140510559e-05, 1.3849698007106781e-05, 1.4524906873703003e-05, 1.5200115740299225e-05, 1.5875324606895447e-05, 1.655053347349167e-05, 1.722574234008789e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 7.0, 10.0, 14.0, 17.0, 8.0, 21.0, 46.0, 54.0, 77.0, 101.0, 166.0, 236.0, 347.0, 444.0, 722.0, 1057.0, 1551.0, 2359.0, 3717.0, 6104.0, 10202.0, 18978.0, 37333.0, 81991.0, 203802.0, 364824.0, 169781.0, 70434.0, 32438.0, 16646.0, 9329.0, 5503.0, 3459.0, 2290.0, 1414.0, 990.0, 670.0, 413.0, 307.0, 219.0, 128.0, 95.0, 82.0, 54.0, 33.0, 23.0, 23.0, 11.0, 12.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0322265625, -0.031200408935546875, -0.03017425537109375, -0.029148101806640625, -0.0281219482421875, -0.027095794677734375, -0.02606964111328125, -0.025043487548828125, -0.024017333984375, -0.022991180419921875, -0.02196502685546875, -0.020938873291015625, -0.0199127197265625, -0.018886566162109375, -0.01786041259765625, -0.016834259033203125, -0.01580810546875, -0.014781951904296875, -0.01375579833984375, -0.012729644775390625, -0.0117034912109375, -0.010677337646484375, -0.00965118408203125, -0.008625030517578125, -0.007598876953125, -0.006572723388671875, -0.00554656982421875, -0.004520416259765625, -0.0034942626953125, -0.002468109130859375, -0.00144195556640625, -0.000415802001953125, 0.0006103515625, 0.001636505126953125, 0.00266265869140625, 0.003688812255859375, 0.0047149658203125, 0.005741119384765625, 0.00676727294921875, 0.007793426513671875, 0.008819580078125, 0.009845733642578125, 0.01087188720703125, 0.011898040771484375, 0.0129241943359375, 0.013950347900390625, 0.01497650146484375, 0.016002655029296875, 0.01702880859375, 0.018054962158203125, 0.01908111572265625, 0.020107269287109375, 0.0211334228515625, 0.022159576416015625, 0.02318572998046875, 0.024211883544921875, 0.025238037109375, 0.026264190673828125, 0.02729034423828125, 0.028316497802734375, 0.0293426513671875, 0.030368804931640625, 0.03139495849609375, 0.032421112060546875, 0.033447265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 6.0, 8.0, 10.0, 12.0, 12.0, 9.0, 20.0, 21.0, 31.0, 43.0, 40.0, 65.0, 62.0, 67.0, 84.0, 83.0, 79.0, 52.0, 55.0, 42.0, 44.0, 34.0, 28.0, 19.0, 13.0, 11.0, 17.0, 7.0, 6.0, 4.0, 2.0, 3.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0101318359375, -0.009756922721862793, -0.009382009506225586, -0.009007096290588379, -0.008632183074951172, -0.008257269859313965, -0.007882356643676758, -0.007507443428039551, -0.007132530212402344, -0.006757616996765137, -0.00638270378112793, -0.006007790565490723, -0.005632877349853516, -0.005257964134216309, -0.0048830509185791016, -0.0045081377029418945, -0.0041332244873046875, -0.0037583112716674805, -0.0033833980560302734, -0.0030084848403930664, -0.0026335716247558594, -0.0022586584091186523, -0.0018837451934814453, -0.0015088319778442383, -0.0011339187622070312, -0.0007590055465698242, -0.0003840923309326172, -9.179115295410156e-06, 0.0003657341003417969, 0.0007406473159790039, 0.001115560531616211, 0.001490473747253418, 0.001865386962890625, 0.002240300178527832, 0.002615213394165039, 0.002990126609802246, 0.003365039825439453, 0.00373995304107666, 0.004114866256713867, 0.004489779472351074, 0.004864692687988281, 0.005239605903625488, 0.005614519119262695, 0.005989432334899902, 0.006364345550537109, 0.006739258766174316, 0.0071141719818115234, 0.0074890851974487305, 0.007863998413085938, 0.008238911628723145, 0.008613824844360352, 0.008988738059997559, 0.009363651275634766, 0.009738564491271973, 0.01011347770690918, 0.010488390922546387, 0.010863304138183594, 0.0112382173538208, 0.011613130569458008, 0.011988043785095215, 0.012362957000732422, 0.012737870216369629, 0.013112783432006836, 0.013487696647644043, 0.01386260986328125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 5.0, 7.0, 10.0, 14.0, 14.0, 13.0, 16.0, 24.0, 28.0, 34.0, 51.0, 49.0, 64.0, 73.0, 71.0, 68.0, 63.0, 59.0, 55.0, 34.0, 45.0, 35.0, 34.0, 24.0, 24.0, 10.0, 6.0, 8.0, 9.0, 10.0, 6.0, 9.0, 6.0, 0.0, 3.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.43670654296875, -8.19694995880127, -7.957193851470947, -7.717437267303467, -7.477680683135986, -7.237924575805664, -6.998167991638184, -6.758411407470703, -6.518654823303223, -6.278898239135742, -6.03914213180542, -5.7993855476379395, -5.559628963470459, -5.319872856140137, -5.080116271972656, -4.840359687805176, -4.600603103637695, -4.360846519470215, -4.121090412139893, -3.881333827972412, -3.6415772438049316, -3.4018208980560303, -3.162064552307129, -2.9223079681396484, -2.682551860809326, -2.442795515060425, -2.2030389308929443, -1.963282585144043, -1.7235260009765625, -1.4837696552276611, -1.2440131902694702, -1.0042567253112793, -0.7645001411437988, -0.5247436761856079, -0.2849872410297394, -0.04523080587387085, 0.19452565908432007, 0.4342820644378662, 0.6740385293960571, 0.913794994354248, 1.153551459312439, 1.3933079242706299, 1.6330643892288208, 1.8728208541870117, 2.112577199935913, 2.3523335456848145, 2.592090129852295, 2.8318467140197754, 3.0716030597686768, 3.311359405517578, 3.5511159896850586, 3.79087233543396, 4.030628681182861, 4.270385265350342, 4.510141849517822, 4.7498979568481445, 4.989654541015625, 5.2294111251831055, 5.469167232513428, 5.708923816680908, 5.948680400848389, 6.188436508178711, 6.428193092346191, 6.667949676513672, 6.907706260681152]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 12.0, 14.0, 11.0, 14.0, 13.0, 21.0, 11.0, 27.0, 31.0, 26.0, 31.0, 41.0, 27.0, 41.0, 36.0, 50.0, 42.0, 36.0, 50.0, 37.0, 35.0, 46.0, 32.0, 48.0, 34.0, 35.0, 28.0, 11.0, 23.0, 25.0, 15.0, 15.0, 16.0, 12.0, 9.0, 9.0, 12.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.576226711273193, -7.347590446472168, -7.118953704833984, -6.890317440032959, -6.661681175231934, -6.43304443359375, -6.204408168792725, -5.975771903991699, -5.747135639190674, -5.518499374389648, -5.289862632751465, -5.0612263679504395, -4.832590103149414, -4.6039533615112305, -4.375317096710205, -4.14668083190918, -3.918044328689575, -3.6894078254699707, -3.4607715606689453, -3.232135057449341, -3.0034987926483154, -2.774862289428711, -2.5462260246276855, -2.317589521408081, -2.0889530181884766, -1.8603166341781616, -1.6316802501678467, -1.4030437469482422, -1.1744074821472168, -0.9457709789276123, -0.7171345949172974, -0.4884982109069824, -0.25986194610595703, -0.031225547194480896, 0.19741085171699524, 0.42604726552963257, 0.6546836495399475, 0.8833200931549072, 1.1119564771652222, 1.340592861175537, 1.569229245185852, 1.797865629196167, 2.0265021324157715, 2.255138397216797, 2.4837749004364014, 2.712411403656006, 2.9410476684570312, 3.1696839332580566, 3.398320436477661, 3.6269569396972656, 3.855593204498291, 4.084229469299316, 4.3128662109375, 4.541502475738525, 4.770138740539551, 4.998775482177734, 5.22741174697876, 5.456048011779785, 5.684684753417969, 5.913321018218994, 6.1419572830200195, 6.370594024658203, 6.5992302894592285, 6.827866554260254, 7.056502819061279]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 1.0, 7.0, 3.0, 12.0, 19.0, 23.0, 34.0, 57.0, 91.0, 124.0, 173.0, 251.0, 365.0, 549.0, 839.0, 1179.0, 1801.0, 2572.0, 3921.0, 5794.0, 8939.0, 13366.0, 20458.0, 32266.0, 50892.0, 80379.0, 123946.0, 171535.0, 172928.0, 126748.0, 81962.0, 52172.0, 32945.0, 21259.0, 13544.0, 9178.0, 5961.0, 4011.0, 2705.0, 1786.0, 1258.0, 792.0, 550.0, 374.0, 261.0, 178.0, 105.0, 81.0, 63.0, 38.0, 21.0, 19.0, 8.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-9.625, -9.324462890625, -9.02392578125, -8.723388671875, -8.4228515625, -8.122314453125, -7.82177734375, -7.521240234375, -7.220703125, -6.920166015625, -6.61962890625, -6.319091796875, -6.0185546875, -5.718017578125, -5.41748046875, -5.116943359375, -4.81640625, -4.515869140625, -4.21533203125, -3.914794921875, -3.6142578125, -3.313720703125, -3.01318359375, -2.712646484375, -2.412109375, -2.111572265625, -1.81103515625, -1.510498046875, -1.2099609375, -0.909423828125, -0.60888671875, -0.308349609375, -0.0078125, 0.292724609375, 0.59326171875, 0.893798828125, 1.1943359375, 1.494873046875, 1.79541015625, 2.095947265625, 2.396484375, 2.697021484375, 2.99755859375, 3.298095703125, 3.5986328125, 3.899169921875, 4.19970703125, 4.500244140625, 4.80078125, 5.101318359375, 5.40185546875, 5.702392578125, 6.0029296875, 6.303466796875, 6.60400390625, 6.904541015625, 7.205078125, 7.505615234375, 7.80615234375, 8.106689453125, 8.4072265625, 8.707763671875, 9.00830078125, 9.308837890625, 9.609375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 8.0, 9.0, 9.0, 14.0, 14.0, 19.0, 11.0, 18.0, 13.0, 27.0, 35.0, 25.0, 35.0, 42.0, 32.0, 43.0, 35.0, 42.0, 45.0, 49.0, 52.0, 38.0, 46.0, 28.0, 42.0, 41.0, 26.0, 28.0, 29.0, 19.0, 17.0, 18.0, 19.0, 12.0, 15.0, 14.0, 6.0, 3.0, 4.0, 8.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.99609375, -6.77294921875, -6.5498046875, -6.32666015625, -6.103515625, -5.88037109375, -5.6572265625, -5.43408203125, -5.2109375, -4.98779296875, -4.7646484375, -4.54150390625, -4.318359375, -4.09521484375, -3.8720703125, -3.64892578125, -3.42578125, -3.20263671875, -2.9794921875, -2.75634765625, -2.533203125, -2.31005859375, -2.0869140625, -1.86376953125, -1.640625, -1.41748046875, -1.1943359375, -0.97119140625, -0.748046875, -0.52490234375, -0.3017578125, -0.07861328125, 0.14453125, 0.36767578125, 0.5908203125, 0.81396484375, 1.037109375, 1.26025390625, 1.4833984375, 1.70654296875, 1.9296875, 2.15283203125, 2.3759765625, 2.59912109375, 2.822265625, 3.04541015625, 3.2685546875, 3.49169921875, 3.71484375, 3.93798828125, 4.1611328125, 4.38427734375, 4.607421875, 4.83056640625, 5.0537109375, 5.27685546875, 5.5, 5.72314453125, 5.9462890625, 6.16943359375, 6.392578125, 6.61572265625, 6.8388671875, 7.06201171875, 7.28515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 6.0, 17.0, 13.0, 34.0, 40.0, 78.0, 84.0, 133.0, 179.0, 241.0, 382.0, 551.0, 807.0, 1188.0, 1742.0, 2545.0, 3754.0, 5517.0, 8236.0, 11962.0, 18021.0, 27120.0, 41373.0, 62797.0, 93470.0, 131095.0, 157561.0, 145863.0, 110041.0, 75413.0, 49898.0, 32448.0, 21347.0, 14390.0, 9854.0, 6358.0, 4472.0, 3005.0, 2119.0, 1344.0, 946.0, 635.0, 514.0, 310.0, 215.0, 140.0, 98.0, 52.0, 40.0, 31.0, 21.0, 15.0, 12.0, 19.0, 6.0, 3.0, 0.0, 3.0], "bins": [-8.890625, -8.618896484375, -8.34716796875, -8.075439453125, -7.8037109375, -7.531982421875, -7.26025390625, -6.988525390625, -6.716796875, -6.445068359375, -6.17333984375, -5.901611328125, -5.6298828125, -5.358154296875, -5.08642578125, -4.814697265625, -4.54296875, -4.271240234375, -3.99951171875, -3.727783203125, -3.4560546875, -3.184326171875, -2.91259765625, -2.640869140625, -2.369140625, -2.097412109375, -1.82568359375, -1.553955078125, -1.2822265625, -1.010498046875, -0.73876953125, -0.467041015625, -0.1953125, 0.076416015625, 0.34814453125, 0.619873046875, 0.8916015625, 1.163330078125, 1.43505859375, 1.706787109375, 1.978515625, 2.250244140625, 2.52197265625, 2.793701171875, 3.0654296875, 3.337158203125, 3.60888671875, 3.880615234375, 4.15234375, 4.424072265625, 4.69580078125, 4.967529296875, 5.2392578125, 5.510986328125, 5.78271484375, 6.054443359375, 6.326171875, 6.597900390625, 6.86962890625, 7.141357421875, 7.4130859375, 7.684814453125, 7.95654296875, 8.228271484375, 8.5]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 7.0, 1.0, 6.0, 8.0, 10.0, 11.0, 17.0, 13.0, 18.0, 20.0, 20.0, 22.0, 15.0, 27.0, 36.0, 31.0, 39.0, 41.0, 29.0, 33.0, 47.0, 46.0, 42.0, 28.0, 29.0, 36.0, 39.0, 36.0, 34.0, 34.0, 28.0, 28.0, 31.0, 27.0, 19.0, 12.0, 18.0, 13.0, 9.0, 5.0, 7.0, 10.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.3671875, -4.2325439453125, -4.097900390625, -3.9632568359375, -3.82861328125, -3.6939697265625, -3.559326171875, -3.4246826171875, -3.2900390625, -3.1553955078125, -3.020751953125, -2.8861083984375, -2.75146484375, -2.6168212890625, -2.482177734375, -2.3475341796875, -2.212890625, -2.0782470703125, -1.943603515625, -1.8089599609375, -1.67431640625, -1.5396728515625, -1.405029296875, -1.2703857421875, -1.1357421875, -1.0010986328125, -0.866455078125, -0.7318115234375, -0.59716796875, -0.4625244140625, -0.327880859375, -0.1932373046875, -0.05859375, 0.0760498046875, 0.210693359375, 0.3453369140625, 0.47998046875, 0.6146240234375, 0.749267578125, 0.8839111328125, 1.0185546875, 1.1531982421875, 1.287841796875, 1.4224853515625, 1.55712890625, 1.6917724609375, 1.826416015625, 1.9610595703125, 2.095703125, 2.2303466796875, 2.364990234375, 2.4996337890625, 2.63427734375, 2.7689208984375, 2.903564453125, 3.0382080078125, 3.1728515625, 3.3074951171875, 3.442138671875, 3.5767822265625, 3.71142578125, 3.8460693359375, 3.980712890625, 4.1153564453125, 4.25]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 10.0, 13.0, 20.0, 28.0, 14.0, 32.0, 39.0, 96.0, 122.0, 174.0, 184.0, 329.0, 471.0, 684.0, 1001.0, 1629.0, 2470.0, 4355.0, 7355.0, 13903.0, 27896.0, 66958.0, 228748.0, 487291.0, 117004.0, 43095.0, 19548.0, 10084.0, 5693.0, 3287.0, 2032.0, 1276.0, 862.0, 611.0, 377.0, 253.0, 165.0, 147.0, 85.0, 66.0, 37.0, 26.0, 20.0, 21.0, 13.0, 10.0, 5.0, 6.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-6.34375, -6.14080810546875, -5.9378662109375, -5.73492431640625, -5.531982421875, -5.32904052734375, -5.1260986328125, -4.92315673828125, -4.72021484375, -4.51727294921875, -4.3143310546875, -4.11138916015625, -3.908447265625, -3.70550537109375, -3.5025634765625, -3.29962158203125, -3.0966796875, -2.89373779296875, -2.6907958984375, -2.48785400390625, -2.284912109375, -2.08197021484375, -1.8790283203125, -1.67608642578125, -1.47314453125, -1.27020263671875, -1.0672607421875, -0.86431884765625, -0.661376953125, -0.45843505859375, -0.2554931640625, -0.05255126953125, 0.150390625, 0.35333251953125, 0.5562744140625, 0.75921630859375, 0.962158203125, 1.16510009765625, 1.3680419921875, 1.57098388671875, 1.77392578125, 1.97686767578125, 2.1798095703125, 2.38275146484375, 2.585693359375, 2.78863525390625, 2.9915771484375, 3.19451904296875, 3.3974609375, 3.60040283203125, 3.8033447265625, 4.00628662109375, 4.209228515625, 4.41217041015625, 4.6151123046875, 4.81805419921875, 5.02099609375, 5.22393798828125, 5.4268798828125, 5.62982177734375, 5.832763671875, 6.03570556640625, 6.2386474609375, 6.44158935546875, 6.64453125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 11.0, 19.0, 32.0, 34.0, 54.0, 102.0, 139.0, 165.0, 151.0, 107.0, 66.0, 40.0, 26.0, 17.0, 10.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003509521484375, -0.00033770501613616943, -0.00032445788383483887, -0.0003112107515335083, -0.00029796361923217773, -0.00028471648693084717, -0.0002714693546295166, -0.00025822222232818604, -0.00024497509002685547, -0.0002317279577255249, -0.00021848082542419434, -0.00020523369312286377, -0.0001919865608215332, -0.00017873942852020264, -0.00016549229621887207, -0.0001522451639175415, -0.00013899803161621094, -0.00012575089931488037, -0.0001125037670135498, -9.925663471221924e-05, -8.600950241088867e-05, -7.27623701095581e-05, -5.951523780822754e-05, -4.626810550689697e-05, -3.3020973205566406e-05, -1.977384090423584e-05, -6.5267086029052734e-06, 6.720423698425293e-06, 1.996755599975586e-05, 3.3214688301086426e-05, 4.646182060241699e-05, 5.970895290374756e-05, 7.295608520507812e-05, 8.620321750640869e-05, 9.945034980773926e-05, 0.00011269748210906982, 0.0001259446144104004, 0.00013919174671173096, 0.00015243887901306152, 0.0001656860113143921, 0.00017893314361572266, 0.00019218027591705322, 0.0002054274082183838, 0.00021867454051971436, 0.00023192167282104492, 0.0002451688051223755, 0.00025841593742370605, 0.0002716630697250366, 0.0002849102020263672, 0.00029815733432769775, 0.0003114044666290283, 0.0003246515989303589, 0.00033789873123168945, 0.00035114586353302, 0.0003643929958343506, 0.00037764012813568115, 0.0003908872604370117, 0.0004041343927383423, 0.00041738152503967285, 0.0004306286573410034, 0.000443875789642334, 0.00045712292194366455, 0.0004703700542449951, 0.0004836171865463257, 0.0004968643188476562]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 12.0, 13.0, 19.0, 38.0, 51.0, 58.0, 91.0, 119.0, 171.0, 274.0, 411.0, 586.0, 859.0, 1280.0, 1899.0, 2992.0, 4520.0, 7494.0, 12582.0, 22914.0, 45897.0, 107634.0, 413016.0, 261002.0, 80270.0, 36622.0, 18819.0, 10739.0, 6365.0, 4052.0, 2564.0, 1708.0, 1079.0, 770.0, 523.0, 293.0, 233.0, 153.0, 136.0, 82.0, 59.0, 53.0, 27.0, 22.0, 11.0, 13.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.83984375, -5.66204833984375, -5.4842529296875, -5.30645751953125, -5.128662109375, -4.95086669921875, -4.7730712890625, -4.59527587890625, -4.41748046875, -4.23968505859375, -4.0618896484375, -3.88409423828125, -3.706298828125, -3.52850341796875, -3.3507080078125, -3.17291259765625, -2.9951171875, -2.81732177734375, -2.6395263671875, -2.46173095703125, -2.283935546875, -2.10614013671875, -1.9283447265625, -1.75054931640625, -1.57275390625, -1.39495849609375, -1.2171630859375, -1.03936767578125, -0.861572265625, -0.68377685546875, -0.5059814453125, -0.32818603515625, -0.150390625, 0.02740478515625, 0.2052001953125, 0.38299560546875, 0.560791015625, 0.73858642578125, 0.9163818359375, 1.09417724609375, 1.27197265625, 1.44976806640625, 1.6275634765625, 1.80535888671875, 1.983154296875, 2.16094970703125, 2.3387451171875, 2.51654052734375, 2.6943359375, 2.87213134765625, 3.0499267578125, 3.22772216796875, 3.405517578125, 3.58331298828125, 3.7611083984375, 3.93890380859375, 4.11669921875, 4.29449462890625, 4.4722900390625, 4.65008544921875, 4.827880859375, 5.00567626953125, 5.1834716796875, 5.36126708984375, 5.5390625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 0.0, 5.0, 6.0, 7.0, 5.0, 6.0, 13.0, 14.0, 19.0, 21.0, 22.0, 26.0, 37.0, 45.0, 45.0, 65.0, 79.0, 114.0, 100.0, 62.0, 59.0, 53.0, 41.0, 28.0, 18.0, 15.0, 13.0, 11.0, 18.0, 10.0, 4.0, 5.0, 7.0, 7.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8701171875, -1.812957763671875, -1.75579833984375, -1.698638916015625, -1.6414794921875, -1.584320068359375, -1.52716064453125, -1.470001220703125, -1.412841796875, -1.355682373046875, -1.29852294921875, -1.241363525390625, -1.1842041015625, -1.127044677734375, -1.06988525390625, -1.012725830078125, -0.95556640625, -0.898406982421875, -0.84124755859375, -0.784088134765625, -0.7269287109375, -0.669769287109375, -0.61260986328125, -0.555450439453125, -0.498291015625, -0.441131591796875, -0.38397216796875, -0.326812744140625, -0.2696533203125, -0.212493896484375, -0.15533447265625, -0.098175048828125, -0.041015625, 0.016143798828125, 0.07330322265625, 0.130462646484375, 0.1876220703125, 0.244781494140625, 0.30194091796875, 0.359100341796875, 0.416259765625, 0.473419189453125, 0.53057861328125, 0.587738037109375, 0.6448974609375, 0.702056884765625, 0.75921630859375, 0.816375732421875, 0.87353515625, 0.930694580078125, 0.98785400390625, 1.045013427734375, 1.1021728515625, 1.159332275390625, 1.21649169921875, 1.273651123046875, 1.330810546875, 1.387969970703125, 1.44512939453125, 1.502288818359375, 1.5594482421875, 1.616607666015625, 1.67376708984375, 1.730926513671875, 1.7880859375]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 6.0, 4.0, 6.0, 12.0, 12.0, 19.0, 19.0, 22.0, 30.0, 36.0, 67.0, 67.0, 88.0, 86.0, 80.0, 58.0, 65.0, 57.0, 53.0, 37.0, 25.0, 29.0, 16.0, 16.0, 10.0, 8.0, 10.0, 5.0, 6.0, 10.0, 9.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.304664611816406, -8.03990650177002, -7.775148868560791, -7.510390758514404, -7.245632648468018, -6.980875015258789, -6.716116905212402, -6.451358795166016, -6.186600685119629, -5.921842575073242, -5.657084941864014, -5.392326831817627, -5.12756872177124, -4.862811088562012, -4.598052978515625, -4.333294868469238, -4.06853723526001, -3.803779363632202, -3.5390212535858154, -3.274263381958008, -3.009505271911621, -2.7447474002838135, -2.479989528656006, -2.215231418609619, -1.9504735469818115, -1.6857155561447144, -1.4209575653076172, -1.1561996936798096, -0.8914417028427124, -0.6266837120056152, -0.3619258403778076, -0.09716784954071045, 0.16759014129638672, 0.4323481023311615, 0.6971060633659363, 0.9618639945983887, 1.2266219854354858, 1.491379976272583, 1.7561378479003906, 2.0208959579467773, 2.285653829574585, 2.5504117012023926, 2.8151698112487793, 3.079927682876587, 3.3446855545043945, 3.6094436645507812, 3.874201536178589, 4.1389594078063965, 4.403717517852783, 4.66847562789917, 4.933233261108398, 5.197991371154785, 5.462749481201172, 5.727507591247559, 5.992265224456787, 6.257023334503174, 6.521780967712402, 6.786539077758789, 7.051296710968018, 7.316054821014404, 7.580812931060791, 7.8455705642700195, 8.110328674316406, 8.375086784362793, 8.63984489440918]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 7.0, 5.0, 7.0, 6.0, 7.0, 11.0, 11.0, 13.0, 12.0, 8.0, 20.0, 19.0, 27.0, 29.0, 32.0, 39.0, 35.0, 37.0, 32.0, 45.0, 36.0, 44.0, 29.0, 32.0, 46.0, 37.0, 41.0, 33.0, 32.0, 33.0, 29.0, 23.0, 35.0, 25.0, 20.0, 15.0, 19.0, 14.0, 7.0, 9.0, 12.0, 6.0, 8.0, 5.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.904817581176758, -7.682013034820557, -7.459208011627197, -7.236403465270996, -7.013598442077637, -6.7907938957214355, -6.567989349365234, -6.345184326171875, -6.122379779815674, -5.899575233459473, -5.676770210266113, -5.453965663909912, -5.231160640716553, -5.008356094360352, -4.785551071166992, -4.562746524810791, -4.33994197845459, -4.117137432098389, -3.8943324089050293, -3.671527862548828, -3.448723077774048, -3.2259182929992676, -3.0031135082244873, -2.780308723449707, -2.5575037002563477, -2.3346989154815674, -2.111894130706787, -1.8890894651412964, -1.6662847995758057, -1.4434800148010254, -1.2206752300262451, -0.9978705644607544, -0.7750658988952637, -0.5522611737251282, -0.3294564187526703, -0.1066516637802124, 0.1161530613899231, 0.3389577865600586, 0.5617625713348389, 0.7845672369003296, 1.0073720216751099, 1.2301768064498901, 1.4529814720153809, 1.6757862567901611, 1.8985910415649414, 2.1213955879211426, 2.344200611114502, 2.567005157470703, 2.7898099422454834, 3.0126147270202637, 3.235419511795044, 3.458224296569824, 3.6810288429260254, 3.9038336277008057, 4.126638412475586, 4.349442958831787, 4.5722479820251465, 4.795052528381348, 5.017857551574707, 5.240662097930908, 5.463467121124268, 5.686271667480469, 5.909076690673828, 6.131881237030029, 6.3546857833862305]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 7.0, 7.0, 9.0, 21.0, 25.0, 35.0, 53.0, 75.0, 103.0, 176.0, 231.0, 375.0, 617.0, 924.0, 1398.0, 2192.0, 3175.0, 5083.0, 8240.0, 13082.0, 20829.0, 34185.0, 58229.0, 104382.0, 213108.0, 534419.0, 1209827.0, 1112045.0, 452141.0, 186429.0, 95186.0, 53409.0, 31753.0, 19389.0, 12319.0, 7589.0, 4814.0, 3065.0, 1946.0, 1267.0, 841.0, 460.0, 307.0, 192.0, 134.0, 80.0, 40.0, 30.0, 20.0, 11.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.7578125, -9.46142578125, -9.1650390625, -8.86865234375, -8.572265625, -8.27587890625, -7.9794921875, -7.68310546875, -7.38671875, -7.09033203125, -6.7939453125, -6.49755859375, -6.201171875, -5.90478515625, -5.6083984375, -5.31201171875, -5.015625, -4.71923828125, -4.4228515625, -4.12646484375, -3.830078125, -3.53369140625, -3.2373046875, -2.94091796875, -2.64453125, -2.34814453125, -2.0517578125, -1.75537109375, -1.458984375, -1.16259765625, -0.8662109375, -0.56982421875, -0.2734375, 0.02294921875, 0.3193359375, 0.61572265625, 0.912109375, 1.20849609375, 1.5048828125, 1.80126953125, 2.09765625, 2.39404296875, 2.6904296875, 2.98681640625, 3.283203125, 3.57958984375, 3.8759765625, 4.17236328125, 4.46875, 4.76513671875, 5.0615234375, 5.35791015625, 5.654296875, 5.95068359375, 6.2470703125, 6.54345703125, 6.83984375, 7.13623046875, 7.4326171875, 7.72900390625, 8.025390625, 8.32177734375, 8.6181640625, 8.91455078125, 9.2109375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 6.0, 6.0, 8.0, 8.0, 9.0, 13.0, 14.0, 10.0, 13.0, 18.0, 26.0, 34.0, 37.0, 39.0, 37.0, 42.0, 36.0, 43.0, 48.0, 40.0, 38.0, 47.0, 33.0, 34.0, 44.0, 38.0, 32.0, 32.0, 30.0, 28.0, 30.0, 20.0, 24.0, 16.0, 15.0, 12.0, 6.0, 12.0, 4.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.12890625, -6.9329833984375, -6.737060546875, -6.5411376953125, -6.34521484375, -6.1492919921875, -5.953369140625, -5.7574462890625, -5.5615234375, -5.3656005859375, -5.169677734375, -4.9737548828125, -4.77783203125, -4.5819091796875, -4.385986328125, -4.1900634765625, -3.994140625, -3.7982177734375, -3.602294921875, -3.4063720703125, -3.21044921875, -3.0145263671875, -2.818603515625, -2.6226806640625, -2.4267578125, -2.2308349609375, -2.034912109375, -1.8389892578125, -1.64306640625, -1.4471435546875, -1.251220703125, -1.0552978515625, -0.859375, -0.6634521484375, -0.467529296875, -0.2716064453125, -0.07568359375, 0.1202392578125, 0.316162109375, 0.5120849609375, 0.7080078125, 0.9039306640625, 1.099853515625, 1.2957763671875, 1.49169921875, 1.6876220703125, 1.883544921875, 2.0794677734375, 2.275390625, 2.4713134765625, 2.667236328125, 2.8631591796875, 3.05908203125, 3.2550048828125, 3.450927734375, 3.6468505859375, 3.8427734375, 4.0386962890625, 4.234619140625, 4.4305419921875, 4.62646484375, 4.8223876953125, 5.018310546875, 5.2142333984375, 5.41015625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 12.0, 13.0, 22.0, 28.0, 48.0, 66.0, 101.0, 161.0, 227.0, 407.0, 604.0, 958.0, 1611.0, 2573.0, 4244.0, 7205.0, 12564.0, 21883.0, 40109.0, 76141.0, 149721.0, 311114.0, 671267.0, 1213193.0, 870925.0, 406001.0, 192597.0, 95930.0, 49948.0, 27200.0, 15297.0, 8841.0, 5121.0, 3115.0, 1860.0, 1200.0, 702.0, 458.0, 287.0, 166.0, 122.0, 89.0, 52.0, 34.0, 21.0, 18.0, 9.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.6688232421875, -8.376708984375, -8.0845947265625, -7.79248046875, -7.5003662109375, -7.208251953125, -6.9161376953125, -6.6240234375, -6.3319091796875, -6.039794921875, -5.7476806640625, -5.45556640625, -5.1634521484375, -4.871337890625, -4.5792236328125, -4.287109375, -3.9949951171875, -3.702880859375, -3.4107666015625, -3.11865234375, -2.8265380859375, -2.534423828125, -2.2423095703125, -1.9501953125, -1.6580810546875, -1.365966796875, -1.0738525390625, -0.78173828125, -0.4896240234375, -0.197509765625, 0.0946044921875, 0.38671875, 0.6788330078125, 0.970947265625, 1.2630615234375, 1.55517578125, 1.8472900390625, 2.139404296875, 2.4315185546875, 2.7236328125, 3.0157470703125, 3.307861328125, 3.5999755859375, 3.89208984375, 4.1842041015625, 4.476318359375, 4.7684326171875, 5.060546875, 5.3526611328125, 5.644775390625, 5.9368896484375, 6.22900390625, 6.5211181640625, 6.813232421875, 7.1053466796875, 7.3974609375, 7.6895751953125, 7.981689453125, 8.2738037109375, 8.56591796875, 8.8580322265625, 9.150146484375, 9.4422607421875, 9.734375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 11.0, 22.0, 23.0, 17.0, 38.0, 25.0, 39.0, 71.0, 66.0, 98.0, 120.0, 135.0, 183.0, 208.0, 246.0, 283.0, 310.0, 303.0, 297.0, 230.0, 235.0, 184.0, 182.0, 143.0, 107.0, 95.0, 79.0, 74.0, 53.0, 46.0, 37.0, 23.0, 16.0, 16.0, 5.0, 10.0, 7.0, 9.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.056640625, -2.95233154296875, -2.8480224609375, -2.74371337890625, -2.639404296875, -2.53509521484375, -2.4307861328125, -2.32647705078125, -2.22216796875, -2.11785888671875, -2.0135498046875, -1.90924072265625, -1.804931640625, -1.70062255859375, -1.5963134765625, -1.49200439453125, -1.3876953125, -1.28338623046875, -1.1790771484375, -1.07476806640625, -0.970458984375, -0.86614990234375, -0.7618408203125, -0.65753173828125, -0.55322265625, -0.44891357421875, -0.3446044921875, -0.24029541015625, -0.135986328125, -0.03167724609375, 0.0726318359375, 0.17694091796875, 0.28125, 0.38555908203125, 0.4898681640625, 0.59417724609375, 0.698486328125, 0.80279541015625, 0.9071044921875, 1.01141357421875, 1.11572265625, 1.22003173828125, 1.3243408203125, 1.42864990234375, 1.532958984375, 1.63726806640625, 1.7415771484375, 1.84588623046875, 1.9501953125, 2.05450439453125, 2.1588134765625, 2.26312255859375, 2.367431640625, 2.47174072265625, 2.5760498046875, 2.68035888671875, 2.78466796875, 2.88897705078125, 2.9932861328125, 3.09759521484375, 3.201904296875, 3.30621337890625, 3.4105224609375, 3.51483154296875, 3.619140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 10.0, 13.0, 9.0, 21.0, 21.0, 15.0, 37.0, 33.0, 47.0, 51.0, 56.0, 65.0, 75.0, 75.0, 73.0, 61.0, 61.0, 42.0, 32.0, 26.0, 36.0, 20.0, 15.0, 14.0, 9.0, 9.0, 7.0, 10.0, 9.0, 7.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.4575724601745605, -7.22041654586792, -6.983260631561279, -6.746105194091797, -6.508949279785156, -6.271793365478516, -6.034637451171875, -5.797481536865234, -5.560325622558594, -5.323169708251953, -5.0860137939453125, -4.848857879638672, -4.6117024421691895, -4.374546527862549, -4.137390613555908, -3.9002346992492676, -3.663079023361206, -3.4259231090545654, -3.188767433166504, -2.9516115188598633, -2.7144556045532227, -2.477299690246582, -2.2401440143585205, -2.00298810005188, -1.7658323049545288, -1.5286765098571777, -1.291520595550537, -1.054364800453186, -0.8172089457511902, -0.5800530910491943, -0.34289729595184326, -0.10574138164520264, 0.13141441345214844, 0.3685702681541443, 0.6057261228561401, 0.8428819179534912, 1.0800378322601318, 1.317193627357483, 1.554349422454834, 1.7915053367614746, 2.0286612510681152, 2.265817165374756, 2.5029728412628174, 2.740128755569458, 2.9772846698760986, 3.21444034576416, 3.451596260070801, 3.6887521743774414, 3.925907850265503, 4.1630635261535645, 4.400219440460205, 4.637375354766846, 4.874531269073486, 5.111687183380127, 5.348842620849609, 5.58599853515625, 5.823154449462891, 6.060310363769531, 6.297466278076172, 6.5346221923828125, 6.771777629852295, 7.0089335441589355, 7.246089458465576, 7.483245372772217, 7.720401287078857]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 5.0, 6.0, 4.0, 8.0, 6.0, 12.0, 15.0, 8.0, 18.0, 25.0, 20.0, 19.0, 24.0, 37.0, 32.0, 31.0, 18.0, 34.0, 36.0, 35.0, 38.0, 40.0, 34.0, 22.0, 43.0, 41.0, 39.0, 32.0, 32.0, 27.0, 35.0, 30.0, 25.0, 19.0, 29.0, 11.0, 20.0, 13.0, 6.0, 11.0, 17.0, 5.0, 8.0, 7.0, 3.0, 2.0, 6.0, 4.0, 3.0, 2.0, 5.0], "bins": [-6.9016265869140625, -6.708951950073242, -6.51627779006958, -6.32360315322876, -6.1309285163879395, -5.938254356384277, -5.745579719543457, -5.552905082702637, -5.360230922698975, -5.167556285858154, -4.974882125854492, -4.782207489013672, -4.589532852172852, -4.3968586921691895, -4.204184055328369, -4.011509895324707, -3.8188350200653076, -3.6261606216430664, -3.433485984802246, -3.240811586380005, -3.0481371879577637, -2.8554625511169434, -2.662788152694702, -2.470113754272461, -2.2774391174316406, -2.0847647190093994, -1.8920902013778687, -1.699415683746338, -1.5067412853240967, -1.314066767692566, -1.1213922500610352, -0.928717851638794, -0.7360434532165527, -0.5433689951896667, -0.3506945073604584, -0.15802001953125, 0.034654438495635986, 0.22732889652252197, 0.42000341415405273, 0.612677812576294, 0.8053523302078247, 0.9980267882347107, 1.1907012462615967, 1.3833757638931274, 1.5760502815246582, 1.7687246799468994, 1.9613991975784302, 2.154073715209961, 2.346748113632202, 2.5394225120544434, 2.7320971488952637, 2.924771547317505, 3.117445945739746, 3.3101205825805664, 3.5027949810028076, 3.695469379425049, 3.888144016265869, 4.0808186531066895, 4.273492813110352, 4.466167449951172, 4.658842086791992, 4.851516246795654, 5.044190883636475, 5.236865043640137, 5.429539680480957]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 11.0, 9.0, 10.0, 17.0, 29.0, 46.0, 87.0, 103.0, 166.0, 229.0, 382.0, 585.0, 847.0, 1204.0, 1929.0, 2996.0, 4482.0, 7069.0, 10896.0, 17517.0, 27440.0, 44724.0, 72702.0, 118249.0, 188814.0, 204534.0, 130474.0, 80401.0, 48834.0, 30443.0, 18993.0, 12227.0, 7762.0, 5004.0, 3083.0, 2178.0, 1375.0, 910.0, 599.0, 411.0, 269.0, 188.0, 106.0, 74.0, 45.0, 38.0, 21.0, 20.0, 8.0, 3.0, 6.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-2.74609375, -2.660552978515625, -2.57501220703125, -2.489471435546875, -2.4039306640625, -2.318389892578125, -2.23284912109375, -2.147308349609375, -2.061767578125, -1.976226806640625, -1.89068603515625, -1.805145263671875, -1.7196044921875, -1.634063720703125, -1.54852294921875, -1.462982177734375, -1.37744140625, -1.291900634765625, -1.20635986328125, -1.120819091796875, -1.0352783203125, -0.949737548828125, -0.86419677734375, -0.778656005859375, -0.693115234375, -0.607574462890625, -0.52203369140625, -0.436492919921875, -0.3509521484375, -0.265411376953125, -0.17987060546875, -0.094329833984375, -0.0087890625, 0.076751708984375, 0.16229248046875, 0.247833251953125, 0.3333740234375, 0.418914794921875, 0.50445556640625, 0.589996337890625, 0.675537109375, 0.761077880859375, 0.84661865234375, 0.932159423828125, 1.0177001953125, 1.103240966796875, 1.18878173828125, 1.274322509765625, 1.35986328125, 1.445404052734375, 1.53094482421875, 1.616485595703125, 1.7020263671875, 1.787567138671875, 1.87310791015625, 1.958648681640625, 2.044189453125, 2.129730224609375, 2.21527099609375, 2.300811767578125, 2.3863525390625, 2.471893310546875, 2.55743408203125, 2.642974853515625, 2.728515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 2.0, 7.0, 5.0, 8.0, 12.0, 12.0, 14.0, 16.0, 18.0, 20.0, 18.0, 30.0, 29.0, 32.0, 27.0, 31.0, 29.0, 24.0, 36.0, 47.0, 33.0, 47.0, 30.0, 38.0, 34.0, 36.0, 31.0, 42.0, 32.0, 25.0, 24.0, 39.0, 18.0, 22.0, 17.0, 13.0, 17.0, 10.0, 6.0, 10.0, 11.0, 7.0, 9.0, 5.0, 11.0, 3.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.052978515625, -5.85205078125, -5.651123046875, -5.4501953125, -5.249267578125, -5.04833984375, -4.847412109375, -4.646484375, -4.445556640625, -4.24462890625, -4.043701171875, -3.8427734375, -3.641845703125, -3.44091796875, -3.239990234375, -3.0390625, -2.838134765625, -2.63720703125, -2.436279296875, -2.2353515625, -2.034423828125, -1.83349609375, -1.632568359375, -1.431640625, -1.230712890625, -1.02978515625, -0.828857421875, -0.6279296875, -0.427001953125, -0.22607421875, -0.025146484375, 0.17578125, 0.376708984375, 0.57763671875, 0.778564453125, 0.9794921875, 1.180419921875, 1.38134765625, 1.582275390625, 1.783203125, 1.984130859375, 2.18505859375, 2.385986328125, 2.5869140625, 2.787841796875, 2.98876953125, 3.189697265625, 3.390625, 3.591552734375, 3.79248046875, 3.993408203125, 4.1943359375, 4.395263671875, 4.59619140625, 4.797119140625, 4.998046875, 5.198974609375, 5.39990234375, 5.600830078125, 5.8017578125, 6.002685546875, 6.20361328125, 6.404541015625, 6.60546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 11.0, 16.0, 19.0, 34.0, 35.0, 65.0, 100.0, 140.0, 200.0, 343.0, 499.0, 821.0, 1275.0, 1885.0, 2905.0, 4586.0, 7387.0, 12344.0, 20622.0, 34937.0, 60931.0, 109412.0, 209330.0, 263866.0, 135851.0, 75283.0, 42408.0, 24613.0, 14718.0, 8816.0, 5468.0, 3339.0, 2175.0, 1425.0, 936.0, 613.0, 369.0, 269.0, 167.0, 106.0, 81.0, 50.0, 25.0, 21.0, 22.0, 7.0, 4.0, 7.0, 3.0, 8.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.255859375, -3.15142822265625, -3.0469970703125, -2.94256591796875, -2.838134765625, -2.73370361328125, -2.6292724609375, -2.52484130859375, -2.42041015625, -2.31597900390625, -2.2115478515625, -2.10711669921875, -2.002685546875, -1.89825439453125, -1.7938232421875, -1.68939208984375, -1.5849609375, -1.48052978515625, -1.3760986328125, -1.27166748046875, -1.167236328125, -1.06280517578125, -0.9583740234375, -0.85394287109375, -0.74951171875, -0.64508056640625, -0.5406494140625, -0.43621826171875, -0.331787109375, -0.22735595703125, -0.1229248046875, -0.01849365234375, 0.0859375, 0.19036865234375, 0.2947998046875, 0.39923095703125, 0.503662109375, 0.60809326171875, 0.7125244140625, 0.81695556640625, 0.92138671875, 1.02581787109375, 1.1302490234375, 1.23468017578125, 1.339111328125, 1.44354248046875, 1.5479736328125, 1.65240478515625, 1.7568359375, 1.86126708984375, 1.9656982421875, 2.07012939453125, 2.174560546875, 2.27899169921875, 2.3834228515625, 2.48785400390625, 2.59228515625, 2.69671630859375, 2.8011474609375, 2.90557861328125, 3.010009765625, 3.11444091796875, 3.2188720703125, 3.32330322265625, 3.427734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 6.0, 5.0, 4.0, 7.0, 16.0, 11.0, 17.0, 19.0, 20.0, 21.0, 30.0, 32.0, 27.0, 30.0, 31.0, 38.0, 38.0, 39.0, 31.0, 47.0, 37.0, 38.0, 36.0, 41.0, 36.0, 40.0, 31.0, 31.0, 34.0, 35.0, 35.0, 30.0, 18.0, 16.0, 10.0, 12.0, 8.0, 17.0, 16.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3515625, -4.2054443359375, -4.059326171875, -3.9132080078125, -3.76708984375, -3.6209716796875, -3.474853515625, -3.3287353515625, -3.1826171875, -3.0364990234375, -2.890380859375, -2.7442626953125, -2.59814453125, -2.4520263671875, -2.305908203125, -2.1597900390625, -2.013671875, -1.8675537109375, -1.721435546875, -1.5753173828125, -1.42919921875, -1.2830810546875, -1.136962890625, -0.9908447265625, -0.8447265625, -0.6986083984375, -0.552490234375, -0.4063720703125, -0.26025390625, -0.1141357421875, 0.031982421875, 0.1781005859375, 0.32421875, 0.4703369140625, 0.616455078125, 0.7625732421875, 0.90869140625, 1.0548095703125, 1.200927734375, 1.3470458984375, 1.4931640625, 1.6392822265625, 1.785400390625, 1.9315185546875, 2.07763671875, 2.2237548828125, 2.369873046875, 2.5159912109375, 2.662109375, 2.8082275390625, 2.954345703125, 3.1004638671875, 3.24658203125, 3.3927001953125, 3.538818359375, 3.6849365234375, 3.8310546875, 3.9771728515625, 4.123291015625, 4.2694091796875, 4.41552734375, 4.5616455078125, 4.707763671875, 4.8538818359375, 5.0]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 2.0, 8.0, 7.0, 8.0, 18.0, 26.0, 42.0, 43.0, 78.0, 117.0, 183.0, 286.0, 424.0, 698.0, 1182.0, 2078.0, 3621.0, 6915.0, 14165.0, 32502.0, 91013.0, 346010.0, 382631.0, 99397.0, 35166.0, 15273.0, 7375.0, 3875.0, 2168.0, 1248.0, 733.0, 433.0, 288.0, 174.0, 117.0, 72.0, 58.0, 38.0, 19.0, 20.0, 14.0, 8.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0360107421875, -0.034811973571777344, -0.03361320495605469, -0.03241443634033203, -0.031215667724609375, -0.03001689910888672, -0.028818130493164062, -0.027619361877441406, -0.02642059326171875, -0.025221824645996094, -0.024023056030273438, -0.02282428741455078, -0.021625518798828125, -0.02042675018310547, -0.019227981567382812, -0.018029212951660156, -0.0168304443359375, -0.015631675720214844, -0.014432907104492188, -0.013234138488769531, -0.012035369873046875, -0.010836601257324219, -0.009637832641601562, -0.008439064025878906, -0.00724029541015625, -0.006041526794433594, -0.0048427581787109375, -0.0036439895629882812, -0.002445220947265625, -0.0012464523315429688, -4.76837158203125e-05, 0.0011510848999023438, 0.002349853515625, 0.0035486221313476562, 0.0047473907470703125, 0.005946159362792969, 0.007144927978515625, 0.008343696594238281, 0.009542465209960938, 0.010741233825683594, 0.01194000244140625, 0.013138771057128906, 0.014337539672851562, 0.015536308288574219, 0.016735076904296875, 0.01793384552001953, 0.019132614135742188, 0.020331382751464844, 0.0215301513671875, 0.022728919982910156, 0.023927688598632812, 0.02512645721435547, 0.026325225830078125, 0.02752399444580078, 0.028722763061523438, 0.029921531677246094, 0.03112030029296875, 0.032319068908691406, 0.03351783752441406, 0.03471660614013672, 0.035915374755859375, 0.03711414337158203, 0.03831291198730469, 0.039511680603027344, 0.04071044921875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 6.0, 10.0, 9.0, 6.0, 7.0, 17.0, 22.0, 15.0, 23.0, 24.0, 35.0, 59.0, 59.0, 76.0, 75.0, 60.0, 80.0, 75.0, 55.0, 48.0, 54.0, 25.0, 29.0, 24.0, 22.0, 9.0, 15.0, 8.0, 11.0, 11.0, 12.0, 7.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.430511474609375e-05, -1.3937242329120636e-05, -1.3569369912147522e-05, -1.3201497495174408e-05, -1.2833625078201294e-05, -1.246575266122818e-05, -1.2097880244255066e-05, -1.1730007827281952e-05, -1.1362135410308838e-05, -1.0994262993335724e-05, -1.062639057636261e-05, -1.0258518159389496e-05, -9.890645742416382e-06, -9.522773325443268e-06, -9.154900908470154e-06, -8.78702849149704e-06, -8.419156074523926e-06, -8.051283657550812e-06, -7.683411240577698e-06, -7.315538823604584e-06, -6.94766640663147e-06, -6.579793989658356e-06, -6.211921572685242e-06, -5.844049155712128e-06, -5.476176738739014e-06, -5.1083043217659e-06, -4.740431904792786e-06, -4.372559487819672e-06, -4.004687070846558e-06, -3.6368146538734436e-06, -3.2689422369003296e-06, -2.9010698199272156e-06, -2.5331974029541016e-06, -2.1653249859809875e-06, -1.7974525690078735e-06, -1.4295801520347595e-06, -1.0617077350616455e-06, -6.938353180885315e-07, -3.259629011154175e-07, 4.190951585769653e-08, 4.0978193283081055e-07, 7.776543498039246e-07, 1.1455267667770386e-06, 1.5133991837501526e-06, 1.8812716007232666e-06, 2.2491440176963806e-06, 2.6170164346694946e-06, 2.9848888516426086e-06, 3.3527612686157227e-06, 3.7206336855888367e-06, 4.088506102561951e-06, 4.456378519535065e-06, 4.824250936508179e-06, 5.192123353481293e-06, 5.559995770454407e-06, 5.927868187427521e-06, 6.295740604400635e-06, 6.663613021373749e-06, 7.031485438346863e-06, 7.399357855319977e-06, 7.76723027229309e-06, 8.135102689266205e-06, 8.502975106239319e-06, 8.870847523212433e-06, 9.238719940185547e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 9.0, 10.0, 17.0, 23.0, 39.0, 54.0, 74.0, 101.0, 136.0, 181.0, 267.0, 348.0, 496.0, 678.0, 1019.0, 1459.0, 2115.0, 3271.0, 4953.0, 7956.0, 12693.0, 22242.0, 40124.0, 76249.0, 159564.0, 297599.0, 203672.0, 95933.0, 48802.0, 26563.0, 15322.0, 9102.0, 5807.0, 3623.0, 2419.0, 1699.0, 1168.0, 737.0, 534.0, 416.0, 316.0, 211.0, 152.0, 108.0, 86.0, 54.0, 37.0, 27.0, 24.0, 18.0, 13.0, 9.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0], "bins": [-0.023468017578125, -0.022726774215698242, -0.021985530853271484, -0.021244287490844727, -0.02050304412841797, -0.01976180076599121, -0.019020557403564453, -0.018279314041137695, -0.017538070678710938, -0.01679682731628418, -0.016055583953857422, -0.015314340591430664, -0.014573097229003906, -0.013831853866577148, -0.01309061050415039, -0.012349367141723633, -0.011608123779296875, -0.010866880416870117, -0.01012563705444336, -0.009384393692016602, -0.008643150329589844, -0.007901906967163086, -0.007160663604736328, -0.00641942024230957, -0.0056781768798828125, -0.004936933517456055, -0.004195690155029297, -0.003454446792602539, -0.0027132034301757812, -0.0019719600677490234, -0.0012307167053222656, -0.0004894733428955078, 0.00025177001953125, 0.0009930133819580078, 0.0017342567443847656, 0.0024755001068115234, 0.0032167434692382812, 0.003957986831665039, 0.004699230194091797, 0.005440473556518555, 0.0061817169189453125, 0.00692296028137207, 0.007664203643798828, 0.008405447006225586, 0.009146690368652344, 0.009887933731079102, 0.01062917709350586, 0.011370420455932617, 0.012111663818359375, 0.012852907180786133, 0.01359415054321289, 0.014335393905639648, 0.015076637268066406, 0.015817880630493164, 0.016559123992919922, 0.01730036735534668, 0.018041610717773438, 0.018782854080200195, 0.019524097442626953, 0.02026534080505371, 0.02100658416748047, 0.021747827529907227, 0.022489070892333984, 0.023230314254760742, 0.0239715576171875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 0.0, 9.0, 3.0, 5.0, 9.0, 11.0, 15.0, 18.0, 19.0, 29.0, 36.0, 36.0, 53.0, 85.0, 86.0, 89.0, 93.0, 90.0, 61.0, 54.0, 34.0, 33.0, 25.0, 15.0, 31.0, 15.0, 7.0, 6.0, 4.0, 7.0, 8.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0115203857421875, -0.01119089126586914, -0.010861396789550781, -0.010531902313232422, -0.010202407836914062, -0.009872913360595703, -0.009543418884277344, -0.009213924407958984, -0.008884429931640625, -0.008554935455322266, -0.008225440979003906, -0.007895946502685547, -0.0075664520263671875, -0.007236957550048828, -0.006907463073730469, -0.006577968597412109, -0.00624847412109375, -0.005918979644775391, -0.005589485168457031, -0.005259990692138672, -0.0049304962158203125, -0.004601001739501953, -0.004271507263183594, -0.003942012786865234, -0.003612518310546875, -0.0032830238342285156, -0.0029535293579101562, -0.002624034881591797, -0.0022945404052734375, -0.001965045928955078, -0.0016355514526367188, -0.0013060569763183594, -0.0009765625, -0.0006470680236816406, -0.00031757354736328125, 1.1920928955078125e-05, 0.0003414154052734375, 0.0006709098815917969, 0.0010004043579101562, 0.0013298988342285156, 0.001659393310546875, 0.0019888877868652344, 0.0023183822631835938, 0.002647876739501953, 0.0029773712158203125, 0.003306865692138672, 0.0036363601684570312, 0.003965854644775391, 0.00429534912109375, 0.004624843597412109, 0.004954338073730469, 0.005283832550048828, 0.0056133270263671875, 0.005942821502685547, 0.006272315979003906, 0.006601810455322266, 0.006931304931640625, 0.007260799407958984, 0.007590293884277344, 0.007919788360595703, 0.008249282836914062, 0.008578777313232422, 0.008908271789550781, 0.00923776626586914, 0.0095672607421875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 16.0, 13.0, 11.0, 19.0, 22.0, 29.0, 34.0, 44.0, 50.0, 57.0, 66.0, 73.0, 74.0, 74.0, 67.0, 59.0, 42.0, 35.0, 30.0, 29.0, 23.0, 13.0, 17.0, 10.0, 9.0, 10.0, 8.0, 9.0, 7.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.458872318267822, -7.222723007202148, -6.986573219299316, -6.750423908233643, -6.514274597167969, -6.278124809265137, -6.041975498199463, -5.805826187133789, -5.569676399230957, -5.333527088165283, -5.097377300262451, -4.861227989196777, -4.6250786781311035, -4.3889288902282715, -4.152779579162598, -3.9166300296783447, -3.680480718612671, -3.444331169128418, -3.208181858062744, -2.972032308578491, -2.7358827590942383, -2.4997334480285645, -2.2635838985443115, -2.0274343490600586, -1.7912849187850952, -1.5551354885101318, -1.318985939025879, -1.0828365087509155, -0.8466870188713074, -0.6105375289916992, -0.37438809871673584, -0.1382385492324829, 0.09791088104248047, 0.3340603709220886, 0.5702098608016968, 0.8063592910766602, 1.042508840560913, 1.2786582708358765, 1.5148077011108398, 1.7509572505950928, 1.9871066808700562, 2.2232561111450195, 2.4594056606292725, 2.6955552101135254, 2.931704521179199, 3.167854070663452, 3.404003620147705, 3.640152931213379, 3.876302480697632, 4.112452030181885, 4.348601341247559, 4.584751129150391, 4.8209004402160645, 5.057049751281738, 5.29319953918457, 5.529348850250244, 5.765498161315918, 6.001647472381592, 6.237797260284424, 6.473946571350098, 6.7100958824157715, 6.9462456703186035, 7.182394981384277, 7.418544769287109, 7.654694080352783]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 5.0, 4.0, 9.0, 6.0, 11.0, 15.0, 10.0, 17.0, 25.0, 19.0, 19.0, 25.0, 39.0, 32.0, 28.0, 21.0, 32.0, 37.0, 36.0, 38.0, 38.0, 33.0, 23.0, 41.0, 43.0, 43.0, 28.0, 31.0, 29.0, 35.0, 32.0, 22.0, 19.0, 28.0, 12.0, 19.0, 13.0, 7.0, 10.0, 17.0, 5.0, 8.0, 7.0, 3.0, 2.0, 7.0, 2.0, 4.0, 2.0, 5.0], "bins": [-6.817597389221191, -6.625896453857422, -6.434195518493652, -6.242495059967041, -6.0507941246032715, -5.859093189239502, -5.667392253875732, -5.475691795349121, -5.283990859985352, -5.092289924621582, -4.9005889892578125, -4.708888530731201, -4.517187595367432, -4.325486660003662, -4.133785724639893, -3.942085027694702, -3.7503840923309326, -3.558683156967163, -3.3669824600219727, -3.175281524658203, -2.9835808277130127, -2.791879892349243, -2.6001791954040527, -2.408478260040283, -2.2167773246765137, -2.025076389312744, -1.8333756923675537, -1.6416747570037842, -1.4499740600585938, -1.2582731246948242, -1.0665723085403442, -0.8748714923858643, -0.6831707954406738, -0.49146997928619385, -0.2997691333293915, -0.10806828737258911, 0.08363252878189087, 0.27533334493637085, 0.4670342206954956, 0.6587350368499756, 0.8504358530044556, 1.0421366691589355, 1.2338374853134155, 1.4255383014678955, 1.617239236831665, 1.8089399337768555, 2.000640869140625, 2.1923418045043945, 2.384042501449585, 2.5757434368133545, 2.767444133758545, 2.9591450691223145, 3.150845766067505, 3.3425467014312744, 3.534247398376465, 3.7259483337402344, 3.917649269104004, 4.109350204467773, 4.301051139831543, 4.492751598358154, 4.684452533721924, 4.876153469085693, 5.067854404449463, 5.259554862976074, 5.451255798339844]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 4.0, 8.0, 7.0, 10.0, 25.0, 34.0, 52.0, 70.0, 117.0, 147.0, 229.0, 334.0, 456.0, 699.0, 1013.0, 1450.0, 2178.0, 3360.0, 5044.0, 7687.0, 11629.0, 18099.0, 27439.0, 43338.0, 68412.0, 106054.0, 151541.0, 175939.0, 145356.0, 99520.0, 63314.0, 40133.0, 25880.0, 16443.0, 10882.0, 7192.0, 4771.0, 3112.0, 2091.0, 1443.0, 965.0, 636.0, 403.0, 338.0, 245.0, 173.0, 94.0, 66.0, 46.0, 27.0, 23.0, 15.0, 7.0, 12.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.4921875, -8.221923828125, -7.95166015625, -7.681396484375, -7.4111328125, -7.140869140625, -6.87060546875, -6.600341796875, -6.330078125, -6.059814453125, -5.78955078125, -5.519287109375, -5.2490234375, -4.978759765625, -4.70849609375, -4.438232421875, -4.16796875, -3.897705078125, -3.62744140625, -3.357177734375, -3.0869140625, -2.816650390625, -2.54638671875, -2.276123046875, -2.005859375, -1.735595703125, -1.46533203125, -1.195068359375, -0.9248046875, -0.654541015625, -0.38427734375, -0.114013671875, 0.15625, 0.426513671875, 0.69677734375, 0.967041015625, 1.2373046875, 1.507568359375, 1.77783203125, 2.048095703125, 2.318359375, 2.588623046875, 2.85888671875, 3.129150390625, 3.3994140625, 3.669677734375, 3.93994140625, 4.210205078125, 4.48046875, 4.750732421875, 5.02099609375, 5.291259765625, 5.5615234375, 5.831787109375, 6.10205078125, 6.372314453125, 6.642578125, 6.912841796875, 7.18310546875, 7.453369140625, 7.7236328125, 7.993896484375, 8.26416015625, 8.534423828125, 8.8046875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 8.0, 8.0, 8.0, 11.0, 11.0, 10.0, 18.0, 20.0, 12.0, 22.0, 19.0, 32.0, 29.0, 39.0, 22.0, 31.0, 31.0, 37.0, 29.0, 42.0, 39.0, 32.0, 28.0, 30.0, 42.0, 33.0, 35.0, 35.0, 26.0, 38.0, 28.0, 32.0, 19.0, 16.0, 18.0, 17.0, 14.0, 10.0, 14.0, 4.0, 7.0, 8.0, 10.0, 4.0, 3.0, 6.0, 2.0, 4.0, 2.0, 4.0, 4.0], "bins": [-6.05859375, -5.8831787109375, -5.707763671875, -5.5323486328125, -5.35693359375, -5.1815185546875, -5.006103515625, -4.8306884765625, -4.6552734375, -4.4798583984375, -4.304443359375, -4.1290283203125, -3.95361328125, -3.7781982421875, -3.602783203125, -3.4273681640625, -3.251953125, -3.0765380859375, -2.901123046875, -2.7257080078125, -2.55029296875, -2.3748779296875, -2.199462890625, -2.0240478515625, -1.8486328125, -1.6732177734375, -1.497802734375, -1.3223876953125, -1.14697265625, -0.9715576171875, -0.796142578125, -0.6207275390625, -0.4453125, -0.2698974609375, -0.094482421875, 0.0809326171875, 0.25634765625, 0.4317626953125, 0.607177734375, 0.7825927734375, 0.9580078125, 1.1334228515625, 1.308837890625, 1.4842529296875, 1.65966796875, 1.8350830078125, 2.010498046875, 2.1859130859375, 2.361328125, 2.5367431640625, 2.712158203125, 2.8875732421875, 3.06298828125, 3.2384033203125, 3.413818359375, 3.5892333984375, 3.7646484375, 3.9400634765625, 4.115478515625, 4.2908935546875, 4.46630859375, 4.6417236328125, 4.817138671875, 4.9925537109375, 5.16796875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 8.0, 18.0, 30.0, 34.0, 44.0, 71.0, 97.0, 190.0, 200.0, 327.0, 520.0, 717.0, 1048.0, 1493.0, 2294.0, 3340.0, 4976.0, 7338.0, 11132.0, 16798.0, 25407.0, 38954.0, 59700.0, 90005.0, 128514.0, 158131.0, 151056.0, 115454.0, 78734.0, 51777.0, 34110.0, 22125.0, 14523.0, 9727.0, 6331.0, 4296.0, 2776.0, 1873.0, 1312.0, 938.0, 643.0, 459.0, 336.0, 205.0, 163.0, 97.0, 65.0, 63.0, 40.0, 16.0, 15.0, 15.0, 5.0, 8.0, 3.0, 1.0, 1.0], "bins": [-8.4765625, -8.2183837890625, -7.960205078125, -7.7020263671875, -7.44384765625, -7.1856689453125, -6.927490234375, -6.6693115234375, -6.4111328125, -6.1529541015625, -5.894775390625, -5.6365966796875, -5.37841796875, -5.1202392578125, -4.862060546875, -4.6038818359375, -4.345703125, -4.0875244140625, -3.829345703125, -3.5711669921875, -3.31298828125, -3.0548095703125, -2.796630859375, -2.5384521484375, -2.2802734375, -2.0220947265625, -1.763916015625, -1.5057373046875, -1.24755859375, -0.9893798828125, -0.731201171875, -0.4730224609375, -0.21484375, 0.0433349609375, 0.301513671875, 0.5596923828125, 0.81787109375, 1.0760498046875, 1.334228515625, 1.5924072265625, 1.8505859375, 2.1087646484375, 2.366943359375, 2.6251220703125, 2.88330078125, 3.1414794921875, 3.399658203125, 3.6578369140625, 3.916015625, 4.1741943359375, 4.432373046875, 4.6905517578125, 4.94873046875, 5.2069091796875, 5.465087890625, 5.7232666015625, 5.9814453125, 6.2396240234375, 6.497802734375, 6.7559814453125, 7.01416015625, 7.2723388671875, 7.530517578125, 7.7886962890625, 8.046875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 5.0, 11.0, 11.0, 8.0, 16.0, 7.0, 17.0, 22.0, 28.0, 21.0, 19.0, 35.0, 29.0, 39.0, 40.0, 39.0, 49.0, 37.0, 45.0, 36.0, 37.0, 33.0, 38.0, 40.0, 37.0, 43.0, 32.0, 35.0, 35.0, 23.0, 23.0, 17.0, 18.0, 19.0, 10.0, 14.0, 5.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.99188232421875, -3.8548583984375, -3.71783447265625, -3.580810546875, -3.44378662109375, -3.3067626953125, -3.16973876953125, -3.03271484375, -2.89569091796875, -2.7586669921875, -2.62164306640625, -2.484619140625, -2.34759521484375, -2.2105712890625, -2.07354736328125, -1.9365234375, -1.79949951171875, -1.6624755859375, -1.52545166015625, -1.388427734375, -1.25140380859375, -1.1143798828125, -0.97735595703125, -0.84033203125, -0.70330810546875, -0.5662841796875, -0.42926025390625, -0.292236328125, -0.15521240234375, -0.0181884765625, 0.11883544921875, 0.255859375, 0.39288330078125, 0.5299072265625, 0.66693115234375, 0.803955078125, 0.94097900390625, 1.0780029296875, 1.21502685546875, 1.35205078125, 1.48907470703125, 1.6260986328125, 1.76312255859375, 1.900146484375, 2.03717041015625, 2.1741943359375, 2.31121826171875, 2.4482421875, 2.58526611328125, 2.7222900390625, 2.85931396484375, 2.996337890625, 3.13336181640625, 3.2703857421875, 3.40740966796875, 3.54443359375, 3.68145751953125, 3.8184814453125, 3.95550537109375, 4.092529296875, 4.22955322265625, 4.3665771484375, 4.50360107421875, 4.640625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 8.0, 11.0, 16.0, 20.0, 14.0, 30.0, 24.0, 49.0, 60.0, 78.0, 115.0, 169.0, 205.0, 314.0, 422.0, 632.0, 893.0, 1201.0, 1769.0, 2603.0, 3995.0, 6054.0, 9466.0, 15427.0, 26699.0, 51408.0, 122351.0, 428644.0, 214193.0, 72995.0, 35207.0, 19492.0, 11692.0, 7360.0, 4790.0, 3077.0, 2110.0, 1477.0, 983.0, 725.0, 470.0, 341.0, 293.0, 182.0, 133.0, 99.0, 69.0, 54.0, 35.0, 24.0, 26.0, 22.0, 9.0, 12.0, 4.0, 5.0, 5.0, 4.0, 1.0, 1.0], "bins": [-5.5859375, -5.40985107421875, -5.2337646484375, -5.05767822265625, -4.881591796875, -4.70550537109375, -4.5294189453125, -4.35333251953125, -4.17724609375, -4.00115966796875, -3.8250732421875, -3.64898681640625, -3.472900390625, -3.29681396484375, -3.1207275390625, -2.94464111328125, -2.7685546875, -2.59246826171875, -2.4163818359375, -2.24029541015625, -2.064208984375, -1.88812255859375, -1.7120361328125, -1.53594970703125, -1.35986328125, -1.18377685546875, -1.0076904296875, -0.83160400390625, -0.655517578125, -0.47943115234375, -0.3033447265625, -0.12725830078125, 0.048828125, 0.22491455078125, 0.4010009765625, 0.57708740234375, 0.753173828125, 0.92926025390625, 1.1053466796875, 1.28143310546875, 1.45751953125, 1.63360595703125, 1.8096923828125, 1.98577880859375, 2.161865234375, 2.33795166015625, 2.5140380859375, 2.69012451171875, 2.8662109375, 3.04229736328125, 3.2183837890625, 3.39447021484375, 3.570556640625, 3.74664306640625, 3.9227294921875, 4.09881591796875, 4.27490234375, 4.45098876953125, 4.6270751953125, 4.80316162109375, 4.979248046875, 5.15533447265625, 5.3314208984375, 5.50750732421875, 5.68359375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 4.0, 8.0, 7.0, 10.0, 23.0, 20.0, 34.0, 55.0, 51.0, 66.0, 94.0, 108.0, 114.0, 90.0, 82.0, 49.0, 50.0, 28.0, 23.0, 11.0, 14.0, 9.0, 7.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002486705780029297, -0.00023969635367393494, -0.00023072212934494019, -0.00022174790501594543, -0.00021277368068695068, -0.00020379945635795593, -0.00019482523202896118, -0.00018585100769996643, -0.00017687678337097168, -0.00016790255904197693, -0.00015892833471298218, -0.00014995411038398743, -0.00014097988605499268, -0.00013200566172599792, -0.00012303143739700317, -0.00011405721306800842, -0.00010508298873901367, -9.610876441001892e-05, -8.713454008102417e-05, -7.816031575202942e-05, -6.918609142303467e-05, -6.021186709403992e-05, -5.1237642765045166e-05, -4.2263418436050415e-05, -3.3289194107055664e-05, -2.4314969778060913e-05, -1.5340745449066162e-05, -6.366521120071411e-06, 2.60770320892334e-06, 1.158192753791809e-05, 2.0556151866912842e-05, 2.9530376195907593e-05, 3.8504600524902344e-05, 4.7478824853897095e-05, 5.6453049182891846e-05, 6.54272735118866e-05, 7.440149784088135e-05, 8.33757221698761e-05, 9.234994649887085e-05, 0.0001013241708278656, 0.00011029839515686035, 0.0001192726194858551, 0.00012824684381484985, 0.0001372210681438446, 0.00014619529247283936, 0.0001551695168018341, 0.00016414374113082886, 0.0001731179654598236, 0.00018209218978881836, 0.0001910664141178131, 0.00020004063844680786, 0.0002090148627758026, 0.00021798908710479736, 0.00022696331143379211, 0.00023593753576278687, 0.0002449117600917816, 0.00025388598442077637, 0.0002628602087497711, 0.00027183443307876587, 0.0002808086574077606, 0.00028978288173675537, 0.0002987571060657501, 0.0003077313303947449, 0.0003167055547237396, 0.0003256797790527344]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 7.0, 15.0, 19.0, 31.0, 43.0, 65.0, 77.0, 122.0, 182.0, 273.0, 375.0, 564.0, 770.0, 1178.0, 1774.0, 2709.0, 4115.0, 6433.0, 10258.0, 16906.0, 29788.0, 57421.0, 140741.0, 448808.0, 176709.0, 65614.0, 33198.0, 18866.0, 11283.0, 7019.0, 4331.0, 2936.0, 1909.0, 1307.0, 822.0, 592.0, 390.0, 288.0, 187.0, 140.0, 82.0, 65.0, 36.0, 25.0, 28.0, 20.0, 15.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.4375, -5.265380859375, -5.09326171875, -4.921142578125, -4.7490234375, -4.576904296875, -4.40478515625, -4.232666015625, -4.060546875, -3.888427734375, -3.71630859375, -3.544189453125, -3.3720703125, -3.199951171875, -3.02783203125, -2.855712890625, -2.68359375, -2.511474609375, -2.33935546875, -2.167236328125, -1.9951171875, -1.822998046875, -1.65087890625, -1.478759765625, -1.306640625, -1.134521484375, -0.96240234375, -0.790283203125, -0.6181640625, -0.446044921875, -0.27392578125, -0.101806640625, 0.0703125, 0.242431640625, 0.41455078125, 0.586669921875, 0.7587890625, 0.930908203125, 1.10302734375, 1.275146484375, 1.447265625, 1.619384765625, 1.79150390625, 1.963623046875, 2.1357421875, 2.307861328125, 2.47998046875, 2.652099609375, 2.82421875, 2.996337890625, 3.16845703125, 3.340576171875, 3.5126953125, 3.684814453125, 3.85693359375, 4.029052734375, 4.201171875, 4.373291015625, 4.54541015625, 4.717529296875, 4.8896484375, 5.061767578125, 5.23388671875, 5.406005859375, 5.578125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 6.0, 2.0, 2.0, 7.0, 4.0, 8.0, 5.0, 3.0, 13.0, 14.0, 12.0, 18.0, 15.0, 26.0, 24.0, 34.0, 27.0, 34.0, 51.0, 66.0, 76.0, 100.0, 82.0, 65.0, 45.0, 41.0, 40.0, 27.0, 15.0, 22.0, 22.0, 8.0, 17.0, 11.0, 10.0, 13.0, 9.0, 8.0, 5.0, 4.0, 2.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6767578125, -1.62371826171875, -1.5706787109375, -1.51763916015625, -1.464599609375, -1.41156005859375, -1.3585205078125, -1.30548095703125, -1.25244140625, -1.19940185546875, -1.1463623046875, -1.09332275390625, -1.040283203125, -0.98724365234375, -0.9342041015625, -0.88116455078125, -0.828125, -0.77508544921875, -0.7220458984375, -0.66900634765625, -0.615966796875, -0.56292724609375, -0.5098876953125, -0.45684814453125, -0.40380859375, -0.35076904296875, -0.2977294921875, -0.24468994140625, -0.191650390625, -0.13861083984375, -0.0855712890625, -0.03253173828125, 0.0205078125, 0.07354736328125, 0.1265869140625, 0.17962646484375, 0.232666015625, 0.28570556640625, 0.3387451171875, 0.39178466796875, 0.44482421875, 0.49786376953125, 0.5509033203125, 0.60394287109375, 0.656982421875, 0.71002197265625, 0.7630615234375, 0.81610107421875, 0.869140625, 0.92218017578125, 0.9752197265625, 1.02825927734375, 1.081298828125, 1.13433837890625, 1.1873779296875, 1.24041748046875, 1.29345703125, 1.34649658203125, 1.3995361328125, 1.45257568359375, 1.505615234375, 1.55865478515625, 1.6116943359375, 1.66473388671875, 1.7177734375]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 5.0, 16.0, 10.0, 14.0, 21.0, 27.0, 37.0, 43.0, 52.0, 73.0, 74.0, 96.0, 84.0, 87.0, 70.0, 53.0, 49.0, 35.0, 26.0, 20.0, 22.0, 16.0, 10.0, 15.0, 4.0, 6.0, 2.0, 13.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.280603408813477, -7.9999542236328125, -7.719305038452148, -7.438656330108643, -7.1580071449279785, -6.8773579597473145, -6.596709251403809, -6.3160600662231445, -6.0354108810424805, -5.754761695861816, -5.474112510681152, -5.1934638023376465, -4.912814617156982, -4.632165431976318, -4.3515167236328125, -4.070867538452148, -3.7902183532714844, -3.5095691680908203, -3.2289202213287354, -2.9482712745666504, -2.6676220893859863, -2.3869729042053223, -2.1063239574432373, -1.8256748914718628, -1.5450258255004883, -1.2643767595291138, -0.9837276935577393, -0.7030786275863647, -0.42242956161499023, -0.14178049564361572, 0.1388685703277588, 0.4195176362991333, 0.7001676559448242, 0.9808167219161987, 1.2614657878875732, 1.5421148538589478, 1.8227639198303223, 2.1034131050109863, 2.3840620517730713, 2.6647109985351562, 2.9453601837158203, 3.2260093688964844, 3.5066583156585693, 3.7873072624206543, 4.067956447601318, 4.348605632781982, 4.629254341125488, 4.909903526306152, 5.190552711486816, 5.4712018966674805, 5.7518510818481445, 6.03249979019165, 6.3131489753723145, 6.5937981605529785, 6.874446868896484, 7.155096054077148, 7.4357452392578125, 7.716394424438477, 7.997043609619141, 8.277692794799805, 8.558341979980469, 8.838990211486816, 9.11963939666748, 9.400288581848145, 9.680937767028809]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 3.0, 8.0, 6.0, 13.0, 8.0, 9.0, 16.0, 16.0, 27.0, 22.0, 32.0, 33.0, 30.0, 36.0, 37.0, 41.0, 39.0, 46.0, 33.0, 43.0, 53.0, 31.0, 41.0, 40.0, 46.0, 27.0, 30.0, 29.0, 29.0, 24.0, 32.0, 16.0, 15.0, 17.0, 14.0, 17.0, 7.0, 5.0, 5.0, 2.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.139776706695557, -6.9159722328186035, -6.692167282104492, -6.468362808227539, -6.244558334350586, -6.020753860473633, -5.79694938659668, -5.573144435882568, -5.349339962005615, -5.125535488128662, -4.901730537414551, -4.677926063537598, -4.4541215896606445, -4.230317115783691, -4.006512641906738, -3.782707691192627, -3.558903217315674, -3.3350987434387207, -3.1112940311431885, -2.8874893188476562, -2.663684844970703, -2.43988037109375, -2.2160756587982178, -1.992271065711975, -1.7684664726257324, -1.5446618795394897, -1.320857286453247, -1.0970526933670044, -0.8732481002807617, -0.649443507194519, -0.42563891410827637, -0.2018343210220337, 0.02196979522705078, 0.24577438831329346, 0.46957898139953613, 0.6933835744857788, 0.9171881675720215, 1.1409927606582642, 1.3647973537445068, 1.5886019468307495, 1.8124065399169922, 2.0362110137939453, 2.2600157260894775, 2.4838204383850098, 2.707624912261963, 2.931429386138916, 3.1552340984344482, 3.3790388107299805, 3.6028432846069336, 3.8266477584838867, 4.05045223236084, 4.274257183074951, 4.498061656951904, 4.721866130828857, 4.945671081542969, 5.169475555419922, 5.393280029296875, 5.617084503173828, 5.840888977050781, 6.064693927764893, 6.288498401641846, 6.512302875518799, 6.73610782623291, 6.959912300109863, 7.183716773986816]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 17.0, 11.0, 21.0, 41.0, 58.0, 89.0, 126.0, 209.0, 333.0, 485.0, 830.0, 1263.0, 2051.0, 3280.0, 5501.0, 9257.0, 15620.0, 27738.0, 49975.0, 93423.0, 195277.0, 487384.0, 1235618.0, 1206322.0, 462902.0, 186066.0, 91803.0, 49558.0, 28033.0, 15912.0, 9774.0, 5769.0, 3533.0, 2163.0, 1412.0, 839.0, 543.0, 340.0, 216.0, 157.0, 104.0, 77.0, 54.0, 40.0, 24.0, 8.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.765625, -8.463134765625, -8.16064453125, -7.858154296875, -7.5556640625, -7.253173828125, -6.95068359375, -6.648193359375, -6.345703125, -6.043212890625, -5.74072265625, -5.438232421875, -5.1357421875, -4.833251953125, -4.53076171875, -4.228271484375, -3.92578125, -3.623291015625, -3.32080078125, -3.018310546875, -2.7158203125, -2.413330078125, -2.11083984375, -1.808349609375, -1.505859375, -1.203369140625, -0.90087890625, -0.598388671875, -0.2958984375, 0.006591796875, 0.30908203125, 0.611572265625, 0.9140625, 1.216552734375, 1.51904296875, 1.821533203125, 2.1240234375, 2.426513671875, 2.72900390625, 3.031494140625, 3.333984375, 3.636474609375, 3.93896484375, 4.241455078125, 4.5439453125, 4.846435546875, 5.14892578125, 5.451416015625, 5.75390625, 6.056396484375, 6.35888671875, 6.661376953125, 6.9638671875, 7.266357421875, 7.56884765625, 7.871337890625, 8.173828125, 8.476318359375, 8.77880859375, 9.081298828125, 9.3837890625, 9.686279296875, 9.98876953125, 10.291259765625, 10.59375]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 4.0, 14.0, 13.0, 10.0, 12.0, 24.0, 27.0, 30.0, 32.0, 23.0, 35.0, 35.0, 35.0, 33.0, 43.0, 39.0, 38.0, 34.0, 36.0, 46.0, 29.0, 37.0, 41.0, 36.0, 31.0, 24.0, 26.0, 24.0, 22.0, 22.0, 19.0, 16.0, 12.0, 20.0, 10.0, 7.0, 7.0, 3.0, 4.0, 6.0, 0.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.7822265625, -4.615234375, -4.4482421875, -4.28125, -4.1142578125, -3.947265625, -3.7802734375, -3.61328125, -3.4462890625, -3.279296875, -3.1123046875, -2.9453125, -2.7783203125, -2.611328125, -2.4443359375, -2.27734375, -2.1103515625, -1.943359375, -1.7763671875, -1.609375, -1.4423828125, -1.275390625, -1.1083984375, -0.94140625, -0.7744140625, -0.607421875, -0.4404296875, -0.2734375, -0.1064453125, 0.060546875, 0.2275390625, 0.39453125, 0.5615234375, 0.728515625, 0.8955078125, 1.0625, 1.2294921875, 1.396484375, 1.5634765625, 1.73046875, 1.8974609375, 2.064453125, 2.2314453125, 2.3984375, 2.5654296875, 2.732421875, 2.8994140625, 3.06640625, 3.2333984375, 3.400390625, 3.5673828125, 3.734375, 3.9013671875, 4.068359375, 4.2353515625, 4.40234375, 4.5693359375, 4.736328125, 4.9033203125, 5.0703125, 5.2373046875, 5.404296875, 5.5712890625, 5.73828125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 5.0, 9.0, 14.0, 21.0, 29.0, 43.0, 71.0, 94.0, 156.0, 194.0, 348.0, 456.0, 736.0, 1086.0, 1547.0, 2420.0, 3713.0, 5627.0, 8781.0, 13838.0, 22245.0, 36705.0, 61396.0, 107906.0, 195400.0, 368292.0, 694511.0, 1057030.0, 733489.0, 389637.0, 207056.0, 114090.0, 64994.0, 38281.0, 23197.0, 14495.0, 9179.0, 5890.0, 3841.0, 2513.0, 1647.0, 1097.0, 749.0, 449.0, 318.0, 236.0, 146.0, 97.0, 82.0, 43.0, 33.0, 23.0, 14.0, 7.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.97265625, -6.744384765625, -6.51611328125, -6.287841796875, -6.0595703125, -5.831298828125, -5.60302734375, -5.374755859375, -5.146484375, -4.918212890625, -4.68994140625, -4.461669921875, -4.2333984375, -4.005126953125, -3.77685546875, -3.548583984375, -3.3203125, -3.092041015625, -2.86376953125, -2.635498046875, -2.4072265625, -2.178955078125, -1.95068359375, -1.722412109375, -1.494140625, -1.265869140625, -1.03759765625, -0.809326171875, -0.5810546875, -0.352783203125, -0.12451171875, 0.103759765625, 0.33203125, 0.560302734375, 0.78857421875, 1.016845703125, 1.2451171875, 1.473388671875, 1.70166015625, 1.929931640625, 2.158203125, 2.386474609375, 2.61474609375, 2.843017578125, 3.0712890625, 3.299560546875, 3.52783203125, 3.756103515625, 3.984375, 4.212646484375, 4.44091796875, 4.669189453125, 4.8974609375, 5.125732421875, 5.35400390625, 5.582275390625, 5.810546875, 6.038818359375, 6.26708984375, 6.495361328125, 6.7236328125, 6.951904296875, 7.18017578125, 7.408447265625, 7.63671875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 5.0, 5.0, 19.0, 10.0, 15.0, 18.0, 28.0, 29.0, 44.0, 42.0, 56.0, 64.0, 95.0, 86.0, 104.0, 126.0, 158.0, 202.0, 211.0, 248.0, 280.0, 285.0, 239.0, 246.0, 226.0, 213.0, 176.0, 150.0, 123.0, 82.0, 86.0, 75.0, 60.0, 58.0, 35.0, 36.0, 19.0, 24.0, 23.0, 15.0, 14.0, 8.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-2.796875, -2.7086181640625, -2.620361328125, -2.5321044921875, -2.44384765625, -2.3555908203125, -2.267333984375, -2.1790771484375, -2.0908203125, -2.0025634765625, -1.914306640625, -1.8260498046875, -1.73779296875, -1.6495361328125, -1.561279296875, -1.4730224609375, -1.384765625, -1.2965087890625, -1.208251953125, -1.1199951171875, -1.03173828125, -0.9434814453125, -0.855224609375, -0.7669677734375, -0.6787109375, -0.5904541015625, -0.502197265625, -0.4139404296875, -0.32568359375, -0.2374267578125, -0.149169921875, -0.0609130859375, 0.02734375, 0.1156005859375, 0.203857421875, 0.2921142578125, 0.38037109375, 0.4686279296875, 0.556884765625, 0.6451416015625, 0.7333984375, 0.8216552734375, 0.909912109375, 0.9981689453125, 1.08642578125, 1.1746826171875, 1.262939453125, 1.3511962890625, 1.439453125, 1.5277099609375, 1.615966796875, 1.7042236328125, 1.79248046875, 1.8807373046875, 1.968994140625, 2.0572509765625, 2.1455078125, 2.2337646484375, 2.322021484375, 2.4102783203125, 2.49853515625, 2.5867919921875, 2.675048828125, 2.7633056640625, 2.8515625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 7.0, 9.0, 11.0, 10.0, 16.0, 20.0, 20.0, 36.0, 44.0, 48.0, 44.0, 59.0, 71.0, 85.0, 69.0, 67.0, 64.0, 47.0, 49.0, 40.0, 31.0, 21.0, 19.0, 23.0, 20.0, 14.0, 5.0, 10.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.863490104675293, -5.64119815826416, -5.418906211853027, -5.1966142654418945, -4.974322319030762, -4.752030372619629, -4.529737949371338, -4.307446002960205, -4.085154056549072, -3.8628621101379395, -3.6405701637268066, -3.4182779788970947, -3.195986032485962, -2.973694086074829, -2.751401901245117, -2.5291099548339844, -2.3068180084228516, -2.0845260620117188, -1.8622339963912964, -1.639941930770874, -1.4176499843597412, -1.1953580379486084, -0.973065972328186, -0.7507739067077637, -0.5284819602966309, -0.30618995428085327, -0.08389794826507568, 0.1383940577507019, 0.3606860637664795, 0.5829780101776123, 0.8052700757980347, 1.027562141418457, 1.2498540878295898, 1.4721460342407227, 1.694438099861145, 1.9167301654815674, 2.1390221118927, 2.361314058303833, 2.583606243133545, 2.8058981895446777, 3.0281901359558105, 3.2504820823669434, 3.472774028778076, 3.695066213607788, 3.917358160018921, 4.139650344848633, 4.361942291259766, 4.584234237670898, 4.806526184082031, 5.028818130493164, 5.251110076904297, 5.47340202331543, 5.6956939697265625, 5.917985916137695, 6.140278339385986, 6.362570285797119, 6.584862232208252, 6.807154178619385, 7.029446125030518, 7.25173807144165, 7.474030494689941, 7.696322441101074, 7.918614387512207, 8.14090633392334, 8.363198280334473]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 7.0, 13.0, 6.0, 20.0, 19.0, 17.0, 20.0, 14.0, 15.0, 36.0, 25.0, 39.0, 28.0, 36.0, 29.0, 35.0, 60.0, 45.0, 54.0, 29.0, 38.0, 43.0, 39.0, 33.0, 41.0, 26.0, 41.0, 21.0, 25.0, 25.0, 12.0, 15.0, 17.0, 14.0, 12.0, 9.0, 6.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.5958380699157715, -6.392699241638184, -6.1895599365234375, -5.98642110824585, -5.783282279968262, -5.580142974853516, -5.377004146575928, -5.17386531829834, -4.970726013183594, -4.767587184906006, -4.56444787979126, -4.361309051513672, -4.158170223236084, -3.955031156539917, -3.75189208984375, -3.548753261566162, -3.345614433288574, -3.1424753665924072, -2.9393365383148193, -2.7361974716186523, -2.5330586433410645, -2.3299195766448975, -2.1267805099487305, -1.923641562461853, -1.7205026149749756, -1.5173636674880981, -1.3142247200012207, -1.1110856533050537, -0.9079467058181763, -0.7048077583312988, -0.5016686916351318, -0.2985297441482544, -0.09539079666137695, 0.10774818062782288, 0.3108871579170227, 0.5140261650085449, 0.7171651124954224, 0.9203040599822998, 1.1234431266784668, 1.3265820741653442, 1.5297210216522217, 1.7328599691390991, 1.9359989166259766, 2.1391379833221436, 2.3422770500183105, 2.5454158782958984, 2.7485549449920654, 2.9516940116882324, 3.1548328399658203, 3.3579719066619873, 3.561110734939575, 3.764249801635742, 3.96738862991333, 4.170527458190918, 4.373666763305664, 4.576805591583252, 4.77994441986084, 4.983083248138428, 5.186222553253174, 5.389361381530762, 5.59250020980835, 5.7956390380859375, 5.998778343200684, 6.2019171714782715, 6.405056476593018]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 7.0, 12.0, 17.0, 16.0, 22.0, 37.0, 53.0, 67.0, 97.0, 176.0, 229.0, 327.0, 469.0, 633.0, 897.0, 1444.0, 2168.0, 2972.0, 4438.0, 6509.0, 9639.0, 14224.0, 21363.0, 32618.0, 49659.0, 78221.0, 121981.0, 187078.0, 180182.0, 116744.0, 74035.0, 48168.0, 31005.0, 20458.0, 13573.0, 9153.0, 6326.0, 4243.0, 2927.0, 2057.0, 1314.0, 930.0, 683.0, 455.0, 287.0, 204.0, 146.0, 99.0, 63.0, 44.0, 43.0, 16.0, 12.0, 10.0, 8.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.181640625, -2.11114501953125, -2.0406494140625, -1.97015380859375, -1.899658203125, -1.82916259765625, -1.7586669921875, -1.68817138671875, -1.61767578125, -1.54718017578125, -1.4766845703125, -1.40618896484375, -1.335693359375, -1.26519775390625, -1.1947021484375, -1.12420654296875, -1.0537109375, -0.98321533203125, -0.9127197265625, -0.84222412109375, -0.771728515625, -0.70123291015625, -0.6307373046875, -0.56024169921875, -0.48974609375, -0.41925048828125, -0.3487548828125, -0.27825927734375, -0.207763671875, -0.13726806640625, -0.0667724609375, 0.00372314453125, 0.07421875, 0.14471435546875, 0.2152099609375, 0.28570556640625, 0.356201171875, 0.42669677734375, 0.4971923828125, 0.56768798828125, 0.63818359375, 0.70867919921875, 0.7791748046875, 0.84967041015625, 0.920166015625, 0.99066162109375, 1.0611572265625, 1.13165283203125, 1.2021484375, 1.27264404296875, 1.3431396484375, 1.41363525390625, 1.484130859375, 1.55462646484375, 1.6251220703125, 1.69561767578125, 1.76611328125, 1.83660888671875, 1.9071044921875, 1.97760009765625, 2.048095703125, 2.11859130859375, 2.1890869140625, 2.25958251953125, 2.330078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 5.0, 9.0, 7.0, 12.0, 18.0, 9.0, 20.0, 23.0, 17.0, 21.0, 28.0, 41.0, 46.0, 32.0, 36.0, 53.0, 45.0, 53.0, 58.0, 46.0, 31.0, 48.0, 38.0, 37.0, 39.0, 34.0, 30.0, 29.0, 22.0, 27.0, 13.0, 12.0, 10.0, 8.0, 13.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.02734375, -6.8021240234375, -6.576904296875, -6.3516845703125, -6.12646484375, -5.9012451171875, -5.676025390625, -5.4508056640625, -5.2255859375, -5.0003662109375, -4.775146484375, -4.5499267578125, -4.32470703125, -4.0994873046875, -3.874267578125, -3.6490478515625, -3.423828125, -3.1986083984375, -2.973388671875, -2.7481689453125, -2.52294921875, -2.2977294921875, -2.072509765625, -1.8472900390625, -1.6220703125, -1.3968505859375, -1.171630859375, -0.9464111328125, -0.72119140625, -0.4959716796875, -0.270751953125, -0.0455322265625, 0.1796875, 0.4049072265625, 0.630126953125, 0.8553466796875, 1.08056640625, 1.3057861328125, 1.531005859375, 1.7562255859375, 1.9814453125, 2.2066650390625, 2.431884765625, 2.6571044921875, 2.88232421875, 3.1075439453125, 3.332763671875, 3.5579833984375, 3.783203125, 4.0084228515625, 4.233642578125, 4.4588623046875, 4.68408203125, 4.9093017578125, 5.134521484375, 5.3597412109375, 5.5849609375, 5.8101806640625, 6.035400390625, 6.2606201171875, 6.48583984375, 6.7110595703125, 6.936279296875, 7.1614990234375, 7.38671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 2.0, 5.0, 5.0, 6.0, 14.0, 18.0, 25.0, 21.0, 40.0, 78.0, 114.0, 201.0, 287.0, 495.0, 756.0, 1171.0, 1933.0, 3181.0, 5327.0, 8943.0, 15881.0, 27977.0, 51942.0, 99109.0, 207152.0, 307127.0, 149719.0, 74306.0, 40123.0, 21896.0, 12420.0, 7188.0, 4263.0, 2603.0, 1561.0, 974.0, 602.0, 401.0, 255.0, 166.0, 91.0, 56.0, 40.0, 35.0, 12.0, 18.0, 12.0, 3.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.903228759765625, -2.80059814453125, -2.697967529296875, -2.5953369140625, -2.492706298828125, -2.39007568359375, -2.287445068359375, -2.184814453125, -2.082183837890625, -1.97955322265625, -1.876922607421875, -1.7742919921875, -1.671661376953125, -1.56903076171875, -1.466400146484375, -1.36376953125, -1.261138916015625, -1.15850830078125, -1.055877685546875, -0.9532470703125, -0.850616455078125, -0.74798583984375, -0.645355224609375, -0.542724609375, -0.440093994140625, -0.33746337890625, -0.234832763671875, -0.1322021484375, -0.029571533203125, 0.07305908203125, 0.175689697265625, 0.2783203125, 0.380950927734375, 0.48358154296875, 0.586212158203125, 0.6888427734375, 0.791473388671875, 0.89410400390625, 0.996734619140625, 1.099365234375, 1.201995849609375, 1.30462646484375, 1.407257080078125, 1.5098876953125, 1.612518310546875, 1.71514892578125, 1.817779541015625, 1.92041015625, 2.023040771484375, 2.12567138671875, 2.228302001953125, 2.3309326171875, 2.433563232421875, 2.53619384765625, 2.638824462890625, 2.741455078125, 2.844085693359375, 2.94671630859375, 3.049346923828125, 3.1519775390625, 3.254608154296875, 3.35723876953125, 3.459869384765625, 3.5625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 6.0, 11.0, 7.0, 16.0, 14.0, 17.0, 19.0, 20.0, 25.0, 35.0, 30.0, 38.0, 35.0, 49.0, 52.0, 42.0, 38.0, 37.0, 51.0, 48.0, 42.0, 50.0, 39.0, 37.0, 33.0, 31.0, 28.0, 17.0, 25.0, 23.0, 12.0, 9.0, 11.0, 8.0, 11.0, 10.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.64373779296875, -4.5023193359375, -4.36090087890625, -4.219482421875, -4.07806396484375, -3.9366455078125, -3.79522705078125, -3.65380859375, -3.51239013671875, -3.3709716796875, -3.22955322265625, -3.088134765625, -2.94671630859375, -2.8052978515625, -2.66387939453125, -2.5224609375, -2.38104248046875, -2.2396240234375, -2.09820556640625, -1.956787109375, -1.81536865234375, -1.6739501953125, -1.53253173828125, -1.39111328125, -1.24969482421875, -1.1082763671875, -0.96685791015625, -0.825439453125, -0.68402099609375, -0.5426025390625, -0.40118408203125, -0.259765625, -0.11834716796875, 0.0230712890625, 0.16448974609375, 0.305908203125, 0.44732666015625, 0.5887451171875, 0.73016357421875, 0.87158203125, 1.01300048828125, 1.1544189453125, 1.29583740234375, 1.437255859375, 1.57867431640625, 1.7200927734375, 1.86151123046875, 2.0029296875, 2.14434814453125, 2.2857666015625, 2.42718505859375, 2.568603515625, 2.71002197265625, 2.8514404296875, 2.99285888671875, 3.13427734375, 3.27569580078125, 3.4171142578125, 3.55853271484375, 3.699951171875, 3.84136962890625, 3.9827880859375, 4.12420654296875, 4.265625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 7.0, 9.0, 16.0, 29.0, 49.0, 49.0, 92.0, 180.0, 286.0, 492.0, 880.0, 1549.0, 3008.0, 5654.0, 11348.0, 24260.0, 58464.0, 169261.0, 441717.0, 207615.0, 69030.0, 28050.0, 12779.0, 6369.0, 3204.0, 1779.0, 1027.0, 540.0, 302.0, 179.0, 123.0, 72.0, 51.0, 33.0, 14.0, 11.0, 7.0, 7.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028472900390625, -0.027599096298217773, -0.026725292205810547, -0.02585148811340332, -0.024977684020996094, -0.024103879928588867, -0.02323007583618164, -0.022356271743774414, -0.021482467651367188, -0.02060866355895996, -0.019734859466552734, -0.018861055374145508, -0.01798725128173828, -0.017113447189331055, -0.016239643096923828, -0.015365839004516602, -0.014492034912109375, -0.013618230819702148, -0.012744426727294922, -0.011870622634887695, -0.010996818542480469, -0.010123014450073242, -0.009249210357666016, -0.008375406265258789, -0.0075016021728515625, -0.006627798080444336, -0.005753993988037109, -0.004880189895629883, -0.004006385803222656, -0.0031325817108154297, -0.002258777618408203, -0.0013849735260009766, -0.00051116943359375, 0.00036263465881347656, 0.0012364387512207031, 0.0021102428436279297, 0.0029840469360351562, 0.003857851028442383, 0.004731655120849609, 0.005605459213256836, 0.0064792633056640625, 0.007353067398071289, 0.008226871490478516, 0.009100675582885742, 0.009974479675292969, 0.010848283767700195, 0.011722087860107422, 0.012595891952514648, 0.013469696044921875, 0.014343500137329102, 0.015217304229736328, 0.016091108322143555, 0.01696491241455078, 0.017838716506958008, 0.018712520599365234, 0.01958632469177246, 0.020460128784179688, 0.021333932876586914, 0.02220773696899414, 0.023081541061401367, 0.023955345153808594, 0.02482914924621582, 0.025702953338623047, 0.026576757431030273, 0.0274505615234375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 2.0, 8.0, 2.0, 10.0, 12.0, 25.0, 21.0, 32.0, 19.0, 45.0, 49.0, 83.0, 81.0, 58.0, 95.0, 67.0, 63.0, 56.0, 56.0, 53.0, 26.0, 34.0, 14.0, 24.0, 18.0, 8.0, 10.0, 9.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.1265277862548828e-05, -1.0992400348186493e-05, -1.0719522833824158e-05, -1.0446645319461823e-05, -1.0173767805099487e-05, -9.900890290737152e-06, -9.628012776374817e-06, -9.355135262012482e-06, -9.082257747650146e-06, -8.809380233287811e-06, -8.536502718925476e-06, -8.263625204563141e-06, -7.990747690200806e-06, -7.71787017583847e-06, -7.444992661476135e-06, -7.1721151471138e-06, -6.899237632751465e-06, -6.62636011838913e-06, -6.3534826040267944e-06, -6.080605089664459e-06, -5.807727575302124e-06, -5.534850060939789e-06, -5.261972546577454e-06, -4.989095032215118e-06, -4.716217517852783e-06, -4.443340003490448e-06, -4.170462489128113e-06, -3.897584974765778e-06, -3.6247074604034424e-06, -3.351829946041107e-06, -3.078952431678772e-06, -2.8060749173164368e-06, -2.5331974029541016e-06, -2.2603198885917664e-06, -1.987442374229431e-06, -1.714564859867096e-06, -1.4416873455047607e-06, -1.1688098311424255e-06, -8.959323167800903e-07, -6.230548024177551e-07, -3.501772880554199e-07, -7.729977369308472e-08, 1.955777406692505e-07, 4.684552550315857e-07, 7.413327693939209e-07, 1.014210283756256e-06, 1.2870877981185913e-06, 1.5599653124809265e-06, 1.8328428268432617e-06, 2.105720341205597e-06, 2.378597855567932e-06, 2.6514753699302673e-06, 2.9243528842926025e-06, 3.1972303986549377e-06, 3.470107913017273e-06, 3.742985427379608e-06, 4.015862941741943e-06, 4.2887404561042786e-06, 4.561617970466614e-06, 4.834495484828949e-06, 5.107372999191284e-06, 5.380250513553619e-06, 5.653128027915955e-06, 5.92600554227829e-06, 6.198883056640625e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 10.0, 14.0, 21.0, 36.0, 66.0, 105.0, 118.0, 195.0, 266.0, 390.0, 580.0, 829.0, 1204.0, 1809.0, 2691.0, 4017.0, 6111.0, 9617.0, 14975.0, 23844.0, 38874.0, 65996.0, 116450.0, 207448.0, 229392.0, 131735.0, 74586.0, 43518.0, 26647.0, 16365.0, 10357.0, 6797.0, 4371.0, 2952.0, 1989.0, 1297.0, 905.0, 649.0, 414.0, 308.0, 178.0, 128.0, 91.0, 69.0, 44.0, 38.0, 16.0, 18.0, 8.0, 10.0, 2.0, 3.0, 1.0], "bins": [-0.016937255859375, -0.01645481586456299, -0.015972375869750977, -0.015489935874938965, -0.015007495880126953, -0.014525055885314941, -0.01404261589050293, -0.013560175895690918, -0.013077735900878906, -0.012595295906066895, -0.012112855911254883, -0.011630415916442871, -0.01114797592163086, -0.010665535926818848, -0.010183095932006836, -0.009700655937194824, -0.009218215942382812, -0.0087357759475708, -0.008253335952758789, -0.007770895957946777, -0.007288455963134766, -0.006806015968322754, -0.006323575973510742, -0.0058411359786987305, -0.005358695983886719, -0.004876255989074707, -0.004393815994262695, -0.003911375999450684, -0.003428936004638672, -0.00294649600982666, -0.0024640560150146484, -0.0019816160202026367, -0.001499176025390625, -0.0010167360305786133, -0.0005342960357666016, -5.1856040954589844e-05, 0.0004305839538574219, 0.0009130239486694336, 0.0013954639434814453, 0.001877903938293457, 0.0023603439331054688, 0.0028427839279174805, 0.003325223922729492, 0.003807663917541504, 0.004290103912353516, 0.004772543907165527, 0.005254983901977539, 0.005737423896789551, 0.0062198638916015625, 0.006702303886413574, 0.007184743881225586, 0.007667183876037598, 0.00814962387084961, 0.008632063865661621, 0.009114503860473633, 0.009596943855285645, 0.010079383850097656, 0.010561823844909668, 0.01104426383972168, 0.011526703834533691, 0.012009143829345703, 0.012491583824157715, 0.012974023818969727, 0.013456463813781738, 0.01393890380859375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 8.0, 5.0, 9.0, 13.0, 22.0, 22.0, 24.0, 32.0, 49.0, 61.0, 66.0, 77.0, 79.0, 75.0, 89.0, 74.0, 51.0, 50.0, 30.0, 31.0, 26.0, 23.0, 7.0, 11.0, 6.0, 9.0, 4.0, 7.0, 7.0, 2.0, 5.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00689697265625, -0.006705522537231445, -0.006514072418212891, -0.006322622299194336, -0.006131172180175781, -0.0059397220611572266, -0.005748271942138672, -0.005556821823120117, -0.0053653717041015625, -0.005173921585083008, -0.004982471466064453, -0.0047910213470458984, -0.004599571228027344, -0.004408121109008789, -0.004216670989990234, -0.00402522087097168, -0.003833770751953125, -0.0036423206329345703, -0.0034508705139160156, -0.003259420394897461, -0.0030679702758789062, -0.0028765201568603516, -0.002685070037841797, -0.002493619918823242, -0.0023021697998046875, -0.002110719680786133, -0.0019192695617675781, -0.0017278194427490234, -0.0015363693237304688, -0.001344919204711914, -0.0011534690856933594, -0.0009620189666748047, -0.00077056884765625, -0.0005791187286376953, -0.0003876686096191406, -0.00019621849060058594, -4.76837158203125e-06, 0.00018668174743652344, 0.0003781318664550781, 0.0005695819854736328, 0.0007610321044921875, 0.0009524822235107422, 0.0011439323425292969, 0.0013353824615478516, 0.0015268325805664062, 0.001718282699584961, 0.0019097328186035156, 0.0021011829376220703, 0.002292633056640625, 0.0024840831756591797, 0.0026755332946777344, 0.002866983413696289, 0.0030584335327148438, 0.0032498836517333984, 0.003441333770751953, 0.003632783889770508, 0.0038242340087890625, 0.004015684127807617, 0.004207134246826172, 0.0043985843658447266, 0.004590034484863281, 0.004781484603881836, 0.004972934722900391, 0.005164384841918945, 0.0053558349609375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 5.0, 15.0, 12.0, 18.0, 16.0, 27.0, 47.0, 41.0, 45.0, 55.0, 61.0, 81.0, 87.0, 74.0, 71.0, 61.0, 46.0, 36.0, 38.0, 24.0, 24.0, 20.0, 19.0, 14.0, 8.0, 7.0, 8.0, 5.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98034143447876, -5.7486138343811035, -5.516885757446289, -5.285158157348633, -5.053430557250977, -4.82170295715332, -4.589975357055664, -4.35824728012085, -4.126519680023193, -3.894792079925537, -3.6630642414093018, -3.4313364028930664, -3.19960880279541, -2.967881202697754, -2.7361533641815186, -2.504425525665283, -2.272697925567627, -2.0409703254699707, -1.8092424869537354, -1.5775147676467896, -1.3457870483398438, -1.114059329032898, -0.8823316097259521, -0.6506038904190063, -0.41887617111206055, -0.18714845180511475, 0.044579267501831055, 0.27630698680877686, 0.5080347061157227, 0.7397624254226685, 0.9714901447296143, 1.20321786403656, 1.434946060180664, 1.6666737794876099, 1.8984014987945557, 2.130129337310791, 2.3618569374084473, 2.5935845375061035, 2.825312376022339, 3.057040214538574, 3.2887678146362305, 3.5204954147338867, 3.752223253250122, 3.9839510917663574, 4.215678691864014, 4.44740629196167, 4.679134368896484, 4.910861968994141, 5.142589569091797, 5.374317169189453, 5.606044769287109, 5.837772846221924, 6.06950044631958, 6.301228046417236, 6.532956123352051, 6.764683723449707, 6.996411323547363, 7.2281389236450195, 7.459866523742676, 7.69159460067749, 7.9233222007751465, 8.155050277709961, 8.386777877807617, 8.618505477905273, 8.85023307800293]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 7.0, 13.0, 6.0, 20.0, 19.0, 17.0, 20.0, 14.0, 15.0, 37.0, 24.0, 39.0, 28.0, 35.0, 30.0, 35.0, 60.0, 45.0, 53.0, 30.0, 39.0, 42.0, 41.0, 32.0, 40.0, 27.0, 40.0, 22.0, 24.0, 23.0, 14.0, 15.0, 17.0, 14.0, 12.0, 9.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.529907703399658, -6.327966213226318, -6.1260247230529785, -5.924083232879639, -5.722141742706299, -5.520200252532959, -5.318258762359619, -5.116317272186279, -4.9143757820129395, -4.7124342918396, -4.51049280166626, -4.30855131149292, -4.10660982131958, -3.9046683311462402, -3.7027268409729004, -3.5007853507995605, -3.2988440990448, -3.09690260887146, -2.89496111869812, -2.6930196285247803, -2.4910781383514404, -2.2891368865966797, -2.08719539642334, -1.8852537870407104, -1.6833122968673706, -1.4813708066940308, -1.279429316520691, -1.0774879455566406, -0.875546395778656, -0.6736049652099609, -0.4716634750366211, -0.26972198486328125, -0.0677804946899414, 0.13416098058223724, 0.3361024558544159, 0.5380439162254333, 0.7399854063987732, 0.9419268369674683, 1.143868327140808, 1.345809817314148, 1.5477513074874878, 1.7496927976608276, 1.9516342878341675, 2.1535756587982178, 2.3555171489715576, 2.5574586391448975, 2.7594001293182373, 2.961341619491577, 3.163283109664917, 3.365224599838257, 3.5671660900115967, 3.7691075801849365, 3.9710490703582764, 4.172990322113037, 4.374931812286377, 4.576873302459717, 4.778814792633057, 4.9807562828063965, 5.182697772979736, 5.384639263153076, 5.586580753326416, 5.788522243499756, 5.990463733673096, 6.1924052238464355, 6.394346714019775]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 7.0, 7.0, 10.0, 15.0, 29.0, 39.0, 43.0, 82.0, 105.0, 173.0, 251.0, 370.0, 568.0, 880.0, 1353.0, 2032.0, 3212.0, 4813.0, 7645.0, 11923.0, 18948.0, 29840.0, 47838.0, 76916.0, 120870.0, 171042.0, 180682.0, 134397.0, 87342.0, 54487.0, 33739.0, 21187.0, 13488.0, 8414.0, 5476.0, 3585.0, 2256.0, 1623.0, 1007.0, 621.0, 407.0, 259.0, 183.0, 134.0, 86.0, 64.0, 43.0, 23.0, 26.0, 9.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.5625, -8.2960205078125, -8.029541015625, -7.7630615234375, -7.49658203125, -7.2301025390625, -6.963623046875, -6.6971435546875, -6.4306640625, -6.1641845703125, -5.897705078125, -5.6312255859375, -5.36474609375, -5.0982666015625, -4.831787109375, -4.5653076171875, -4.298828125, -4.0323486328125, -3.765869140625, -3.4993896484375, -3.23291015625, -2.9664306640625, -2.699951171875, -2.4334716796875, -2.1669921875, -1.9005126953125, -1.634033203125, -1.3675537109375, -1.10107421875, -0.8345947265625, -0.568115234375, -0.3016357421875, -0.03515625, 0.2313232421875, 0.497802734375, 0.7642822265625, 1.03076171875, 1.2972412109375, 1.563720703125, 1.8302001953125, 2.0966796875, 2.3631591796875, 2.629638671875, 2.8961181640625, 3.16259765625, 3.4290771484375, 3.695556640625, 3.9620361328125, 4.228515625, 4.4949951171875, 4.761474609375, 5.0279541015625, 5.29443359375, 5.5609130859375, 5.827392578125, 6.0938720703125, 6.3603515625, 6.6268310546875, 6.893310546875, 7.1597900390625, 7.42626953125, 7.6927490234375, 7.959228515625, 8.2257080078125, 8.4921875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 18.0, 10.0, 12.0, 18.0, 17.0, 14.0, 17.0, 28.0, 22.0, 24.0, 27.0, 37.0, 33.0, 38.0, 49.0, 44.0, 54.0, 56.0, 54.0, 35.0, 42.0, 28.0, 45.0, 34.0, 31.0, 31.0, 32.0, 25.0, 15.0, 23.0, 10.0, 16.0, 11.0, 9.0, 8.0, 6.0, 8.0, 11.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.0390625, -5.84173583984375, -5.6444091796875, -5.44708251953125, -5.249755859375, -5.05242919921875, -4.8551025390625, -4.65777587890625, -4.46044921875, -4.26312255859375, -4.0657958984375, -3.86846923828125, -3.671142578125, -3.47381591796875, -3.2764892578125, -3.07916259765625, -2.8818359375, -2.68450927734375, -2.4871826171875, -2.28985595703125, -2.092529296875, -1.89520263671875, -1.6978759765625, -1.50054931640625, -1.30322265625, -1.10589599609375, -0.9085693359375, -0.71124267578125, -0.513916015625, -0.31658935546875, -0.1192626953125, 0.07806396484375, 0.275390625, 0.47271728515625, 0.6700439453125, 0.86737060546875, 1.064697265625, 1.26202392578125, 1.4593505859375, 1.65667724609375, 1.85400390625, 2.05133056640625, 2.2486572265625, 2.44598388671875, 2.643310546875, 2.84063720703125, 3.0379638671875, 3.23529052734375, 3.4326171875, 3.62994384765625, 3.8272705078125, 4.02459716796875, 4.221923828125, 4.41925048828125, 4.6165771484375, 4.81390380859375, 5.01123046875, 5.20855712890625, 5.4058837890625, 5.60321044921875, 5.800537109375, 5.99786376953125, 6.1951904296875, 6.39251708984375, 6.58984375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 7.0, 10.0, 13.0, 20.0, 33.0, 56.0, 70.0, 104.0, 152.0, 246.0, 365.0, 495.0, 774.0, 1011.0, 1680.0, 2554.0, 3526.0, 5308.0, 8152.0, 12626.0, 19025.0, 30626.0, 48479.0, 76134.0, 115407.0, 157467.0, 167696.0, 136393.0, 93535.0, 59953.0, 38026.0, 23628.0, 15258.0, 9795.0, 6403.0, 4344.0, 2896.0, 2098.0, 1354.0, 848.0, 646.0, 456.0, 303.0, 187.0, 137.0, 93.0, 54.0, 40.0, 29.0, 18.0, 11.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.7578125, -7.501220703125, -7.24462890625, -6.988037109375, -6.7314453125, -6.474853515625, -6.21826171875, -5.961669921875, -5.705078125, -5.448486328125, -5.19189453125, -4.935302734375, -4.6787109375, -4.422119140625, -4.16552734375, -3.908935546875, -3.65234375, -3.395751953125, -3.13916015625, -2.882568359375, -2.6259765625, -2.369384765625, -2.11279296875, -1.856201171875, -1.599609375, -1.343017578125, -1.08642578125, -0.829833984375, -0.5732421875, -0.316650390625, -0.06005859375, 0.196533203125, 0.453125, 0.709716796875, 0.96630859375, 1.222900390625, 1.4794921875, 1.736083984375, 1.99267578125, 2.249267578125, 2.505859375, 2.762451171875, 3.01904296875, 3.275634765625, 3.5322265625, 3.788818359375, 4.04541015625, 4.302001953125, 4.55859375, 4.815185546875, 5.07177734375, 5.328369140625, 5.5849609375, 5.841552734375, 6.09814453125, 6.354736328125, 6.611328125, 6.867919921875, 7.12451171875, 7.381103515625, 7.6376953125, 7.894287109375, 8.15087890625, 8.407470703125, 8.6640625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 6.0, 4.0, 6.0, 5.0, 9.0, 13.0, 10.0, 17.0, 15.0, 11.0, 16.0, 18.0, 28.0, 24.0, 29.0, 34.0, 42.0, 28.0, 46.0, 41.0, 41.0, 48.0, 44.0, 44.0, 41.0, 48.0, 46.0, 35.0, 44.0, 43.0, 32.0, 19.0, 18.0, 17.0, 13.0, 18.0, 14.0, 10.0, 15.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.07513427734375, -3.9432373046875, -3.81134033203125, -3.679443359375, -3.54754638671875, -3.4156494140625, -3.28375244140625, -3.15185546875, -3.01995849609375, -2.8880615234375, -2.75616455078125, -2.624267578125, -2.49237060546875, -2.3604736328125, -2.22857666015625, -2.0966796875, -1.96478271484375, -1.8328857421875, -1.70098876953125, -1.569091796875, -1.43719482421875, -1.3052978515625, -1.17340087890625, -1.04150390625, -0.90960693359375, -0.7777099609375, -0.64581298828125, -0.513916015625, -0.38201904296875, -0.2501220703125, -0.11822509765625, 0.013671875, 0.14556884765625, 0.2774658203125, 0.40936279296875, 0.541259765625, 0.67315673828125, 0.8050537109375, 0.93695068359375, 1.06884765625, 1.20074462890625, 1.3326416015625, 1.46453857421875, 1.596435546875, 1.72833251953125, 1.8602294921875, 1.99212646484375, 2.1240234375, 2.25592041015625, 2.3878173828125, 2.51971435546875, 2.651611328125, 2.78350830078125, 2.9154052734375, 3.04730224609375, 3.17919921875, 3.31109619140625, 3.4429931640625, 3.57489013671875, 3.706787109375, 3.83868408203125, 3.9705810546875, 4.10247802734375, 4.234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 11.0, 23.0, 33.0, 36.0, 74.0, 78.0, 129.0, 183.0, 266.0, 399.0, 582.0, 871.0, 1311.0, 1916.0, 3003.0, 4714.0, 7437.0, 12902.0, 22874.0, 46122.0, 113104.0, 401011.0, 266951.0, 80957.0, 36048.0, 18694.0, 10499.0, 6455.0, 4088.0, 2587.0, 1659.0, 1110.0, 774.0, 516.0, 345.0, 247.0, 169.0, 106.0, 79.0, 62.0, 38.0, 27.0, 20.0, 11.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.9296875, -3.806243896484375, -3.68280029296875, -3.559356689453125, -3.4359130859375, -3.312469482421875, -3.18902587890625, -3.065582275390625, -2.942138671875, -2.818695068359375, -2.69525146484375, -2.571807861328125, -2.4483642578125, -2.324920654296875, -2.20147705078125, -2.078033447265625, -1.95458984375, -1.831146240234375, -1.70770263671875, -1.584259033203125, -1.4608154296875, -1.337371826171875, -1.21392822265625, -1.090484619140625, -0.967041015625, -0.843597412109375, -0.72015380859375, -0.596710205078125, -0.4732666015625, -0.349822998046875, -0.22637939453125, -0.102935791015625, 0.0205078125, 0.143951416015625, 0.26739501953125, 0.390838623046875, 0.5142822265625, 0.637725830078125, 0.76116943359375, 0.884613037109375, 1.008056640625, 1.131500244140625, 1.25494384765625, 1.378387451171875, 1.5018310546875, 1.625274658203125, 1.74871826171875, 1.872161865234375, 1.99560546875, 2.119049072265625, 2.24249267578125, 2.365936279296875, 2.4893798828125, 2.612823486328125, 2.73626708984375, 2.859710693359375, 2.983154296875, 3.106597900390625, 3.23004150390625, 3.353485107421875, 3.4769287109375, 3.600372314453125, 3.72381591796875, 3.847259521484375, 3.970703125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 10.0, 5.0, 2.0, 10.0, 10.0, 7.0, 20.0, 23.0, 30.0, 35.0, 59.0, 71.0, 121.0, 98.0, 96.0, 98.0, 82.0, 59.0, 48.0, 26.0, 28.0, 16.0, 10.0, 13.0, 2.0, 4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019800662994384766, -0.00019143521785736084, -0.00018486380577087402, -0.0001782923936843872, -0.0001717209815979004, -0.00016514956951141357, -0.00015857815742492676, -0.00015200674533843994, -0.00014543533325195312, -0.0001388639211654663, -0.0001322925090789795, -0.00012572109699249268, -0.00011914968490600586, -0.00011257827281951904, -0.00010600686073303223, -9.943544864654541e-05, -9.28640365600586e-05, -8.629262447357178e-05, -7.972121238708496e-05, -7.314980030059814e-05, -6.657838821411133e-05, -6.000697612762451e-05, -5.3435564041137695e-05, -4.686415195465088e-05, -4.029273986816406e-05, -3.3721327781677246e-05, -2.714991569519043e-05, -2.0578503608703613e-05, -1.4007091522216797e-05, -7.4356794357299805e-06, -8.642673492431641e-07, 5.707144737243652e-06, 1.2278556823730469e-05, 1.8849968910217285e-05, 2.54213809967041e-05, 3.199279308319092e-05, 3.8564205169677734e-05, 4.513561725616455e-05, 5.170702934265137e-05, 5.8278441429138184e-05, 6.4849853515625e-05, 7.142126560211182e-05, 7.799267768859863e-05, 8.456408977508545e-05, 9.113550186157227e-05, 9.770691394805908e-05, 0.0001042783260345459, 0.00011084973812103271, 0.00011742115020751953, 0.00012399256229400635, 0.00013056397438049316, 0.00013713538646697998, 0.0001437067985534668, 0.0001502782106399536, 0.00015684962272644043, 0.00016342103481292725, 0.00016999244689941406, 0.00017656385898590088, 0.0001831352710723877, 0.0001897066831588745, 0.00019627809524536133, 0.00020284950733184814, 0.00020942091941833496, 0.00021599233150482178, 0.0002225637435913086]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 6.0, 9.0, 16.0, 17.0, 22.0, 31.0, 32.0, 46.0, 57.0, 94.0, 122.0, 170.0, 232.0, 331.0, 486.0, 645.0, 1064.0, 1582.0, 2499.0, 4238.0, 6954.0, 12337.0, 23325.0, 49283.0, 126656.0, 429231.0, 238963.0, 75533.0, 33750.0, 17028.0, 9350.0, 5200.0, 3248.0, 1897.0, 1265.0, 822.0, 614.0, 392.0, 258.0, 208.0, 127.0, 109.0, 77.0, 70.0, 41.0, 25.0, 32.0, 15.0, 17.0, 9.0, 6.0, 7.0, 3.0, 1.0, 5.0, 1.0], "bins": [-4.38671875, -4.256744384765625, -4.12677001953125, -3.996795654296875, -3.8668212890625, -3.736846923828125, -3.60687255859375, -3.476898193359375, -3.346923828125, -3.216949462890625, -3.08697509765625, -2.957000732421875, -2.8270263671875, -2.697052001953125, -2.56707763671875, -2.437103271484375, -2.30712890625, -2.177154541015625, -2.04718017578125, -1.917205810546875, -1.7872314453125, -1.657257080078125, -1.52728271484375, -1.397308349609375, -1.267333984375, -1.137359619140625, -1.00738525390625, -0.877410888671875, -0.7474365234375, -0.617462158203125, -0.48748779296875, -0.357513427734375, -0.2275390625, -0.097564697265625, 0.03240966796875, 0.162384033203125, 0.2923583984375, 0.422332763671875, 0.55230712890625, 0.682281494140625, 0.812255859375, 0.942230224609375, 1.07220458984375, 1.202178955078125, 1.3321533203125, 1.462127685546875, 1.59210205078125, 1.722076416015625, 1.85205078125, 1.982025146484375, 2.11199951171875, 2.241973876953125, 2.3719482421875, 2.501922607421875, 2.63189697265625, 2.761871337890625, 2.891845703125, 3.021820068359375, 3.15179443359375, 3.281768798828125, 3.4117431640625, 3.541717529296875, 3.67169189453125, 3.801666259765625, 3.931640625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 9.0, 8.0, 16.0, 30.0, 23.0, 24.0, 37.0, 50.0, 56.0, 65.0, 99.0, 107.0, 100.0, 86.0, 53.0, 50.0, 35.0, 28.0, 17.0, 16.0, 14.0, 22.0, 9.0, 7.0, 6.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.6708984375, -1.6264190673828125, -1.581939697265625, -1.5374603271484375, -1.49298095703125, -1.4485015869140625, -1.404022216796875, -1.3595428466796875, -1.3150634765625, -1.2705841064453125, -1.226104736328125, -1.1816253662109375, -1.13714599609375, -1.0926666259765625, -1.048187255859375, -1.0037078857421875, -0.959228515625, -0.9147491455078125, -0.870269775390625, -0.8257904052734375, -0.78131103515625, -0.7368316650390625, -0.692352294921875, -0.6478729248046875, -0.6033935546875, -0.5589141845703125, -0.514434814453125, -0.4699554443359375, -0.42547607421875, -0.3809967041015625, -0.336517333984375, -0.2920379638671875, -0.24755859375, -0.2030792236328125, -0.158599853515625, -0.1141204833984375, -0.06964111328125, -0.0251617431640625, 0.019317626953125, 0.0637969970703125, 0.1082763671875, 0.1527557373046875, 0.197235107421875, 0.2417144775390625, 0.28619384765625, 0.3306732177734375, 0.375152587890625, 0.4196319580078125, 0.464111328125, 0.5085906982421875, 0.553070068359375, 0.5975494384765625, 0.64202880859375, 0.6865081787109375, 0.730987548828125, 0.7754669189453125, 0.8199462890625, 0.8644256591796875, 0.908905029296875, 0.9533843994140625, 0.99786376953125, 1.0423431396484375, 1.086822509765625, 1.1313018798828125, 1.17578125]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 2.0, 7.0, 10.0, 14.0, 9.0, 5.0, 27.0, 22.0, 37.0, 43.0, 38.0, 53.0, 62.0, 71.0, 86.0, 74.0, 77.0, 69.0, 57.0, 50.0, 35.0, 35.0, 21.0, 18.0, 16.0, 10.0, 17.0, 9.0, 5.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.365230560302734, -5.123898983001709, -4.882567405700684, -4.6412353515625, -4.399903774261475, -4.158572196960449, -3.917240619659424, -3.6759088039398193, -3.434576988220215, -3.1932454109191895, -2.951913595199585, -2.7105820178985596, -2.469250202178955, -2.2279186248779297, -1.9865869283676147, -1.7452552318572998, -1.5039236545562744, -1.2625919580459595, -1.0212602615356445, -0.7799286246299744, -0.5385969281196594, -0.29726529121398926, -0.055933594703674316, 0.18539810180664062, 0.42672979831695557, 0.6680614948272705, 0.9093931913375854, 1.1507248878479004, 1.3920564651489258, 1.6333881616592407, 1.8747198581695557, 2.11605167388916, 2.3573832511901855, 2.598714828491211, 2.8400466442108154, 3.081378221511841, 3.3227100372314453, 3.5640416145324707, 3.805373191833496, 4.04670524597168, 4.288036823272705, 4.5293684005737305, 4.770699977874756, 5.0120320320129395, 5.253363609313965, 5.49469518661499, 5.736026763916016, 5.977358818054199, 6.218689918518066, 6.460021495819092, 6.701353073120117, 6.942685127258301, 7.184016704559326, 7.425348281860352, 7.666679859161377, 7.908011436462402, 8.149343490600586, 8.39067554473877, 8.632006645202637, 8.87333869934082, 9.114669799804688, 9.356001853942871, 9.597333908081055, 9.838665008544922, 10.079997062683105]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 8.0, 4.0, 6.0, 4.0, 7.0, 7.0, 5.0, 15.0, 17.0, 10.0, 18.0, 20.0, 22.0, 28.0, 29.0, 38.0, 40.0, 27.0, 32.0, 37.0, 46.0, 49.0, 44.0, 45.0, 48.0, 35.0, 36.0, 21.0, 40.0, 34.0, 23.0, 22.0, 30.0, 19.0, 20.0, 20.0, 16.0, 16.0, 10.0, 11.0, 9.0, 12.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.173847198486328, -5.9748101234436035, -5.775773048400879, -5.5767364501953125, -5.377699375152588, -5.178662300109863, -4.979625701904297, -4.780588626861572, -4.581551551818848, -4.382514476776123, -4.183477401733398, -3.984440803527832, -3.7854037284851074, -3.586366653442383, -3.3873298168182373, -3.188292980194092, -2.989255905151367, -2.7902188301086426, -2.591181993484497, -2.3921451568603516, -2.193108081817627, -1.994071125984192, -1.7950341701507568, -1.5959972143173218, -1.3969602584838867, -1.1979233026504517, -0.9988863468170166, -0.7998493909835815, -0.6008124351501465, -0.4017754793167114, -0.20273852348327637, -0.0037015676498413086, 0.19533491134643555, 0.3943718671798706, 0.5934088230133057, 0.7924457788467407, 0.9914827346801758, 1.1905196905136108, 1.389556646347046, 1.588593602180481, 1.787630558013916, 1.986667513847351, 2.185704469680786, 2.3847413063049316, 2.5837783813476562, 2.782815456390381, 2.9818522930145264, 3.180889129638672, 3.3799262046813965, 3.578963279724121, 3.7780001163482666, 3.977036952972412, 4.176074028015137, 4.375111103057861, 4.574148178100586, 4.773184776306152, 4.972221851348877, 5.171258926391602, 5.370295524597168, 5.569332599639893, 5.768369674682617, 5.967406749725342, 6.166443824768066, 6.365480422973633, 6.564517498016357]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 9.0, 14.0, 20.0, 42.0, 63.0, 86.0, 137.0, 218.0, 348.0, 518.0, 824.0, 1352.0, 2254.0, 3883.0, 6521.0, 11626.0, 20760.0, 39471.0, 79079.0, 173070.0, 465438.0, 1386882.0, 1273456.0, 411807.0, 158600.0, 74551.0, 38369.0, 19983.0, 10743.0, 6054.0, 3406.0, 1888.0, 1132.0, 635.0, 403.0, 217.0, 152.0, 121.0, 46.0, 42.0, 27.0, 15.0, 9.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.8734130859375, -9.543701171875, -9.2139892578125, -8.88427734375, -8.5545654296875, -8.224853515625, -7.8951416015625, -7.5654296875, -7.2357177734375, -6.906005859375, -6.5762939453125, -6.24658203125, -5.9168701171875, -5.587158203125, -5.2574462890625, -4.927734375, -4.5980224609375, -4.268310546875, -3.9385986328125, -3.60888671875, -3.2791748046875, -2.949462890625, -2.6197509765625, -2.2900390625, -1.9603271484375, -1.630615234375, -1.3009033203125, -0.97119140625, -0.6414794921875, -0.311767578125, 0.0179443359375, 0.34765625, 0.6773681640625, 1.007080078125, 1.3367919921875, 1.66650390625, 1.9962158203125, 2.325927734375, 2.6556396484375, 2.9853515625, 3.3150634765625, 3.644775390625, 3.9744873046875, 4.30419921875, 4.6339111328125, 4.963623046875, 5.2933349609375, 5.623046875, 5.9527587890625, 6.282470703125, 6.6121826171875, 6.94189453125, 7.2716064453125, 7.601318359375, 7.9310302734375, 8.2607421875, 8.5904541015625, 8.920166015625, 9.2498779296875, 9.57958984375, 9.9093017578125, 10.239013671875, 10.5687255859375, 10.8984375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 4.0, 5.0, 8.0, 5.0, 3.0, 8.0, 15.0, 15.0, 16.0, 22.0, 22.0, 22.0, 43.0, 21.0, 39.0, 40.0, 48.0, 39.0, 47.0, 50.0, 43.0, 48.0, 48.0, 38.0, 35.0, 39.0, 37.0, 31.0, 25.0, 23.0, 31.0, 27.0, 17.0, 12.0, 19.0, 11.0, 8.0, 9.0, 9.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5859375, -5.4024658203125, -5.218994140625, -5.0355224609375, -4.85205078125, -4.6685791015625, -4.485107421875, -4.3016357421875, -4.1181640625, -3.9346923828125, -3.751220703125, -3.5677490234375, -3.38427734375, -3.2008056640625, -3.017333984375, -2.8338623046875, -2.650390625, -2.4669189453125, -2.283447265625, -2.0999755859375, -1.91650390625, -1.7330322265625, -1.549560546875, -1.3660888671875, -1.1826171875, -0.9991455078125, -0.815673828125, -0.6322021484375, -0.44873046875, -0.2652587890625, -0.081787109375, 0.1016845703125, 0.28515625, 0.4686279296875, 0.652099609375, 0.8355712890625, 1.01904296875, 1.2025146484375, 1.385986328125, 1.5694580078125, 1.7529296875, 1.9364013671875, 2.119873046875, 2.3033447265625, 2.48681640625, 2.6702880859375, 2.853759765625, 3.0372314453125, 3.220703125, 3.4041748046875, 3.587646484375, 3.7711181640625, 3.95458984375, 4.1380615234375, 4.321533203125, 4.5050048828125, 4.6884765625, 4.8719482421875, 5.055419921875, 5.2388916015625, 5.42236328125, 5.6058349609375, 5.789306640625, 5.9727783203125, 6.15625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 9.0, 23.0, 39.0, 42.0, 87.0, 120.0, 141.0, 234.0, 414.0, 656.0, 946.0, 1515.0, 2524.0, 4203.0, 6931.0, 12356.0, 21391.0, 39408.0, 75807.0, 150346.0, 318010.0, 701650.0, 1253209.0, 843616.0, 386245.0, 179941.0, 88998.0, 45863.0, 24984.0, 14057.0, 8053.0, 4791.0, 2946.0, 1705.0, 1118.0, 655.0, 443.0, 272.0, 194.0, 115.0, 90.0, 53.0, 31.0, 17.0, 15.0, 12.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.337890625, -8.07421875, -7.810546875, -7.546875, -7.283203125, -7.01953125, -6.755859375, -6.4921875, -6.228515625, -5.96484375, -5.701171875, -5.4375, -5.173828125, -4.91015625, -4.646484375, -4.3828125, -4.119140625, -3.85546875, -3.591796875, -3.328125, -3.064453125, -2.80078125, -2.537109375, -2.2734375, -2.009765625, -1.74609375, -1.482421875, -1.21875, -0.955078125, -0.69140625, -0.427734375, -0.1640625, 0.099609375, 0.36328125, 0.626953125, 0.890625, 1.154296875, 1.41796875, 1.681640625, 1.9453125, 2.208984375, 2.47265625, 2.736328125, 3.0, 3.263671875, 3.52734375, 3.791015625, 4.0546875, 4.318359375, 4.58203125, 4.845703125, 5.109375, 5.373046875, 5.63671875, 5.900390625, 6.1640625, 6.427734375, 6.69140625, 6.955078125, 7.21875, 7.482421875, 7.74609375, 8.009765625, 8.2734375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 7.0, 10.0, 18.0, 20.0, 26.0, 29.0, 26.0, 49.0, 46.0, 65.0, 73.0, 109.0, 139.0, 151.0, 160.0, 201.0, 213.0, 240.0, 297.0, 290.0, 277.0, 245.0, 222.0, 209.0, 165.0, 134.0, 114.0, 99.0, 82.0, 71.0, 36.0, 47.0, 38.0, 31.0, 23.0, 17.0, 12.0, 12.0, 10.0, 11.0, 9.0, 5.0, 2.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0], "bins": [-2.76953125, -2.683929443359375, -2.59832763671875, -2.512725830078125, -2.4271240234375, -2.341522216796875, -2.25592041015625, -2.170318603515625, -2.084716796875, -1.999114990234375, -1.91351318359375, -1.827911376953125, -1.7423095703125, -1.656707763671875, -1.57110595703125, -1.485504150390625, -1.39990234375, -1.314300537109375, -1.22869873046875, -1.143096923828125, -1.0574951171875, -0.971893310546875, -0.88629150390625, -0.800689697265625, -0.715087890625, -0.629486083984375, -0.54388427734375, -0.458282470703125, -0.3726806640625, -0.287078857421875, -0.20147705078125, -0.115875244140625, -0.0302734375, 0.055328369140625, 0.14093017578125, 0.226531982421875, 0.3121337890625, 0.397735595703125, 0.48333740234375, 0.568939208984375, 0.654541015625, 0.740142822265625, 0.82574462890625, 0.911346435546875, 0.9969482421875, 1.082550048828125, 1.16815185546875, 1.253753662109375, 1.33935546875, 1.424957275390625, 1.51055908203125, 1.596160888671875, 1.6817626953125, 1.767364501953125, 1.85296630859375, 1.938568115234375, 2.024169921875, 2.109771728515625, 2.19537353515625, 2.280975341796875, 2.3665771484375, 2.452178955078125, 2.53778076171875, 2.623382568359375, 2.708984375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 11.0, 13.0, 14.0, 19.0, 26.0, 26.0, 38.0, 51.0, 62.0, 74.0, 95.0, 81.0, 71.0, 89.0, 69.0, 52.0, 40.0, 42.0, 24.0, 18.0, 16.0, 12.0, 11.0, 11.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.727033615112305, -6.4767656326293945, -6.226497650146484, -5.976229667663574, -5.725961685180664, -5.475693702697754, -5.225426197052002, -4.975158214569092, -4.724890232086182, -4.4746222496032715, -4.224354267120361, -3.9740865230560303, -3.72381854057312, -3.47355055809021, -3.223282814025879, -2.9730148315429688, -2.7227468490600586, -2.4724788665771484, -2.2222108840942383, -1.9719431400299072, -1.721675157546997, -1.471407175064087, -1.2211393117904663, -0.9708714485168457, -0.7206034660339355, -0.47033554315567017, -0.22006762027740479, 0.030200302600860596, 0.280468225479126, 0.5307362079620361, 0.7810040712356567, 1.0312719345092773, 1.281540870666504, 1.531808853149414, 1.7820767164230347, 2.0323445796966553, 2.2826125621795654, 2.5328805446624756, 2.7831482887268066, 3.033416271209717, 3.283684253692627, 3.533952236175537, 3.7842202186584473, 4.034488201141357, 4.284755706787109, 4.5350236892700195, 4.78529167175293, 5.03555965423584, 5.28582763671875, 5.53609561920166, 5.78636360168457, 6.0366315841674805, 6.286899566650391, 6.537167549133301, 6.787435054779053, 7.037703037261963, 7.287971019744873, 7.538239002227783, 7.788506984710693, 8.038774490356445, 8.289042472839355, 8.539310455322266, 8.789578437805176, 9.039846420288086, 9.290114402770996]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 3.0, 9.0, 3.0, 6.0, 11.0, 8.0, 17.0, 15.0, 17.0, 25.0, 21.0, 24.0, 30.0, 24.0, 33.0, 33.0, 37.0, 45.0, 31.0, 53.0, 49.0, 30.0, 38.0, 44.0, 46.0, 29.0, 35.0, 40.0, 27.0, 22.0, 36.0, 14.0, 34.0, 18.0, 20.0, 17.0, 16.0, 8.0, 6.0, 6.0, 8.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.462332248687744, -5.268728256225586, -5.075124263763428, -4.8815202713012695, -4.6879167556762695, -4.494312763214111, -4.300708770751953, -4.107104778289795, -3.913501024246216, -3.7198970317840576, -3.5262932777404785, -3.3326892852783203, -3.139085292816162, -2.945481538772583, -2.751877546310425, -2.5582737922668457, -2.3646697998046875, -2.1710658073425293, -1.9774620532989502, -1.783858060836792, -1.5902541875839233, -1.3966503143310547, -1.2030463218688965, -1.0094424486160278, -0.8158385753631592, -0.6222347021102905, -0.4286307692527771, -0.23502683639526367, -0.04142296314239502, 0.15218091011047363, 0.34578490257263184, 0.5393887758255005, 0.7329921722412109, 0.9265960454940796, 1.1201999187469482, 1.3138039112091064, 1.507407784461975, 1.7010116577148438, 1.894615650177002, 2.08821964263916, 2.2818233966827393, 2.4754273891448975, 2.6690311431884766, 2.8626351356506348, 3.056239128112793, 3.249842882156372, 3.4434468746185303, 3.6370506286621094, 3.8306546211242676, 4.024258613586426, 4.217862606048584, 4.411466598510742, 4.605070114135742, 4.7986741065979, 4.992278099060059, 5.185882091522217, 5.379486083984375, 5.573090076446533, 5.766694068908691, 5.960297584533691, 6.15390157699585, 6.347505569458008, 6.541109561920166, 6.734713554382324, 6.928317070007324]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 11.0, 11.0, 11.0, 16.0, 26.0, 48.0, 56.0, 89.0, 171.0, 220.0, 363.0, 575.0, 790.0, 1299.0, 2007.0, 3127.0, 4861.0, 7805.0, 12179.0, 19061.0, 30216.0, 47784.0, 76370.0, 123175.0, 191309.0, 192678.0, 124929.0, 77542.0, 48367.0, 30278.0, 19110.0, 12281.0, 7875.0, 4850.0, 3350.0, 2036.0, 1332.0, 871.0, 499.0, 351.0, 233.0, 139.0, 95.0, 52.0, 42.0, 27.0, 16.0, 12.0, 5.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.48828125, -2.41290283203125, -2.3375244140625, -2.26214599609375, -2.186767578125, -2.11138916015625, -2.0360107421875, -1.96063232421875, -1.88525390625, -1.80987548828125, -1.7344970703125, -1.65911865234375, -1.583740234375, -1.50836181640625, -1.4329833984375, -1.35760498046875, -1.2822265625, -1.20684814453125, -1.1314697265625, -1.05609130859375, -0.980712890625, -0.90533447265625, -0.8299560546875, -0.75457763671875, -0.67919921875, -0.60382080078125, -0.5284423828125, -0.45306396484375, -0.377685546875, -0.30230712890625, -0.2269287109375, -0.15155029296875, -0.076171875, -0.00079345703125, 0.0745849609375, 0.14996337890625, 0.225341796875, 0.30072021484375, 0.3760986328125, 0.45147705078125, 0.52685546875, 0.60223388671875, 0.6776123046875, 0.75299072265625, 0.828369140625, 0.90374755859375, 0.9791259765625, 1.05450439453125, 1.1298828125, 1.20526123046875, 1.2806396484375, 1.35601806640625, 1.431396484375, 1.50677490234375, 1.5821533203125, 1.65753173828125, 1.73291015625, 1.80828857421875, 1.8836669921875, 1.95904541015625, 2.034423828125, 2.10980224609375, 2.1851806640625, 2.26055908203125, 2.3359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 5.0, 12.0, 11.0, 17.0, 14.0, 13.0, 18.0, 18.0, 22.0, 27.0, 30.0, 31.0, 49.0, 40.0, 44.0, 43.0, 36.0, 51.0, 45.0, 37.0, 45.0, 37.0, 38.0, 29.0, 28.0, 29.0, 32.0, 38.0, 24.0, 19.0, 17.0, 24.0, 17.0, 9.0, 13.0, 9.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.588623046875, -5.38427734375, -5.179931640625, -4.9755859375, -4.771240234375, -4.56689453125, -4.362548828125, -4.158203125, -3.953857421875, -3.74951171875, -3.545166015625, -3.3408203125, -3.136474609375, -2.93212890625, -2.727783203125, -2.5234375, -2.319091796875, -2.11474609375, -1.910400390625, -1.7060546875, -1.501708984375, -1.29736328125, -1.093017578125, -0.888671875, -0.684326171875, -0.47998046875, -0.275634765625, -0.0712890625, 0.133056640625, 0.33740234375, 0.541748046875, 0.74609375, 0.950439453125, 1.15478515625, 1.359130859375, 1.5634765625, 1.767822265625, 1.97216796875, 2.176513671875, 2.380859375, 2.585205078125, 2.78955078125, 2.993896484375, 3.1982421875, 3.402587890625, 3.60693359375, 3.811279296875, 4.015625, 4.219970703125, 4.42431640625, 4.628662109375, 4.8330078125, 5.037353515625, 5.24169921875, 5.446044921875, 5.650390625, 5.854736328125, 6.05908203125, 6.263427734375, 6.4677734375, 6.672119140625, 6.87646484375, 7.080810546875, 7.28515625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 6.0, 8.0, 8.0, 32.0, 34.0, 44.0, 95.0, 123.0, 209.0, 301.0, 516.0, 810.0, 1279.0, 2160.0, 3621.0, 6365.0, 11194.0, 20191.0, 38913.0, 77129.0, 165004.0, 339868.0, 194083.0, 89580.0, 44086.0, 23058.0, 12535.0, 7022.0, 4053.0, 2360.0, 1471.0, 912.0, 514.0, 335.0, 222.0, 138.0, 87.0, 64.0, 44.0, 28.0, 22.0, 11.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.40234375, -3.2979736328125, -3.193603515625, -3.0892333984375, -2.98486328125, -2.8804931640625, -2.776123046875, -2.6717529296875, -2.5673828125, -2.4630126953125, -2.358642578125, -2.2542724609375, -2.14990234375, -2.0455322265625, -1.941162109375, -1.8367919921875, -1.732421875, -1.6280517578125, -1.523681640625, -1.4193115234375, -1.31494140625, -1.2105712890625, -1.106201171875, -1.0018310546875, -0.8974609375, -0.7930908203125, -0.688720703125, -0.5843505859375, -0.47998046875, -0.3756103515625, -0.271240234375, -0.1668701171875, -0.0625, 0.0418701171875, 0.146240234375, 0.2506103515625, 0.35498046875, 0.4593505859375, 0.563720703125, 0.6680908203125, 0.7724609375, 0.8768310546875, 0.981201171875, 1.0855712890625, 1.18994140625, 1.2943115234375, 1.398681640625, 1.5030517578125, 1.607421875, 1.7117919921875, 1.816162109375, 1.9205322265625, 2.02490234375, 2.1292724609375, 2.233642578125, 2.3380126953125, 2.4423828125, 2.5467529296875, 2.651123046875, 2.7554931640625, 2.85986328125, 2.9642333984375, 3.068603515625, 3.1729736328125, 3.27734375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 11.0, 7.0, 11.0, 19.0, 11.0, 17.0, 6.0, 24.0, 29.0, 28.0, 32.0, 41.0, 23.0, 30.0, 48.0, 33.0, 53.0, 38.0, 45.0, 49.0, 38.0, 36.0, 32.0, 36.0, 31.0, 32.0, 27.0, 25.0, 21.0, 24.0, 19.0, 17.0, 19.0, 15.0, 11.0, 6.0, 12.0, 6.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.966796875, -3.850921630859375, -3.73504638671875, -3.619171142578125, -3.5032958984375, -3.387420654296875, -3.27154541015625, -3.155670166015625, -3.039794921875, -2.923919677734375, -2.80804443359375, -2.692169189453125, -2.5762939453125, -2.460418701171875, -2.34454345703125, -2.228668212890625, -2.11279296875, -1.996917724609375, -1.88104248046875, -1.765167236328125, -1.6492919921875, -1.533416748046875, -1.41754150390625, -1.301666259765625, -1.185791015625, -1.069915771484375, -0.95404052734375, -0.838165283203125, -0.7222900390625, -0.606414794921875, -0.49053955078125, -0.374664306640625, -0.2587890625, -0.142913818359375, -0.02703857421875, 0.088836669921875, 0.2047119140625, 0.320587158203125, 0.43646240234375, 0.552337646484375, 0.668212890625, 0.784088134765625, 0.89996337890625, 1.015838623046875, 1.1317138671875, 1.247589111328125, 1.36346435546875, 1.479339599609375, 1.59521484375, 1.711090087890625, 1.82696533203125, 1.942840576171875, 2.0587158203125, 2.174591064453125, 2.29046630859375, 2.406341552734375, 2.522216796875, 2.638092041015625, 2.75396728515625, 2.869842529296875, 2.9857177734375, 3.101593017578125, 3.21746826171875, 3.333343505859375, 3.44921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 11.0, 10.0, 9.0, 23.0, 44.0, 52.0, 79.0, 130.0, 196.0, 315.0, 541.0, 922.0, 1713.0, 3291.0, 6436.0, 14299.0, 35566.0, 114287.0, 468169.0, 284717.0, 71492.0, 24936.0, 10572.0, 4915.0, 2500.0, 1393.0, 757.0, 422.0, 282.0, 163.0, 100.0, 72.0, 51.0, 19.0, 29.0, 12.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03912353515625, -0.03803110122680664, -0.03693866729736328, -0.03584623336791992, -0.03475379943847656, -0.0336613655090332, -0.032568931579589844, -0.031476497650146484, -0.030384063720703125, -0.029291629791259766, -0.028199195861816406, -0.027106761932373047, -0.026014328002929688, -0.024921894073486328, -0.02382946014404297, -0.02273702621459961, -0.02164459228515625, -0.02055215835571289, -0.01945972442626953, -0.018367290496826172, -0.017274856567382812, -0.016182422637939453, -0.015089988708496094, -0.013997554779052734, -0.012905120849609375, -0.011812686920166016, -0.010720252990722656, -0.009627819061279297, -0.008535385131835938, -0.007442951202392578, -0.006350517272949219, -0.005258083343505859, -0.0041656494140625, -0.0030732154846191406, -0.0019807815551757812, -0.0008883476257324219, 0.0002040863037109375, 0.0012965202331542969, 0.0023889541625976562, 0.0034813880920410156, 0.004573822021484375, 0.005666255950927734, 0.006758689880371094, 0.007851123809814453, 0.008943557739257812, 0.010035991668701172, 0.011128425598144531, 0.01222085952758789, 0.01331329345703125, 0.01440572738647461, 0.015498161315917969, 0.016590595245361328, 0.017683029174804688, 0.018775463104248047, 0.019867897033691406, 0.020960330963134766, 0.022052764892578125, 0.023145198822021484, 0.024237632751464844, 0.025330066680908203, 0.026422500610351562, 0.027514934539794922, 0.02860736846923828, 0.02969980239868164, 0.030792236328125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 8.0, 1.0, 8.0, 8.0, 6.0, 11.0, 17.0, 11.0, 26.0, 22.0, 40.0, 38.0, 63.0, 66.0, 90.0, 100.0, 95.0, 69.0, 61.0, 64.0, 39.0, 36.0, 21.0, 20.0, 23.0, 9.0, 7.0, 8.0, 8.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.046627044677734e-06, -7.758848369121552e-06, -7.471069693565369e-06, -7.183291018009186e-06, -6.895512342453003e-06, -6.60773366689682e-06, -6.319954991340637e-06, -6.032176315784454e-06, -5.7443976402282715e-06, -5.456618964672089e-06, -5.168840289115906e-06, -4.881061613559723e-06, -4.59328293800354e-06, -4.305504262447357e-06, -4.017725586891174e-06, -3.7299469113349915e-06, -3.4421682357788086e-06, -3.1543895602226257e-06, -2.866610884666443e-06, -2.57883220911026e-06, -2.291053533554077e-06, -2.0032748579978943e-06, -1.7154961824417114e-06, -1.4277175068855286e-06, -1.1399388313293457e-06, -8.521601557731628e-07, -5.6438148021698e-07, -2.766028046607971e-07, 1.1175870895385742e-08, 2.989545464515686e-07, 5.867332220077515e-07, 8.745118975639343e-07, 1.1622905731201172e-06, 1.4500692486763e-06, 1.737847924232483e-06, 2.0256265997886658e-06, 2.3134052753448486e-06, 2.6011839509010315e-06, 2.8889626264572144e-06, 3.1767413020133972e-06, 3.46451997756958e-06, 3.752298653125763e-06, 4.040077328681946e-06, 4.327856004238129e-06, 4.6156346797943115e-06, 4.903413355350494e-06, 5.191192030906677e-06, 5.47897070646286e-06, 5.766749382019043e-06, 6.054528057575226e-06, 6.342306733131409e-06, 6.6300854086875916e-06, 6.917864084243774e-06, 7.205642759799957e-06, 7.49342143535614e-06, 7.781200110912323e-06, 8.068978786468506e-06, 8.356757462024689e-06, 8.644536137580872e-06, 8.932314813137054e-06, 9.220093488693237e-06, 9.50787216424942e-06, 9.795650839805603e-06, 1.0083429515361786e-05, 1.0371208190917969e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 6.0, 7.0, 14.0, 14.0, 22.0, 27.0, 45.0, 60.0, 68.0, 142.0, 224.0, 275.0, 412.0, 661.0, 962.0, 1469.0, 2116.0, 3408.0, 4963.0, 7807.0, 12185.0, 20114.0, 34836.0, 62086.0, 119906.0, 243720.0, 251486.0, 124553.0, 64184.0, 35734.0, 21051.0, 12767.0, 8004.0, 5168.0, 3264.0, 2248.0, 1464.0, 1039.0, 693.0, 437.0, 296.0, 204.0, 131.0, 91.0, 67.0, 41.0, 35.0, 17.0, 15.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.020477294921875, -0.019875526428222656, -0.019273757934570312, -0.01867198944091797, -0.018070220947265625, -0.01746845245361328, -0.016866683959960938, -0.016264915466308594, -0.01566314697265625, -0.015061378479003906, -0.014459609985351562, -0.013857841491699219, -0.013256072998046875, -0.012654304504394531, -0.012052536010742188, -0.011450767517089844, -0.0108489990234375, -0.010247230529785156, -0.009645462036132812, -0.009043693542480469, -0.008441925048828125, -0.007840156555175781, -0.0072383880615234375, -0.006636619567871094, -0.00603485107421875, -0.005433082580566406, -0.0048313140869140625, -0.004229545593261719, -0.003627777099609375, -0.0030260086059570312, -0.0024242401123046875, -0.0018224716186523438, -0.001220703125, -0.0006189346313476562, -1.71661376953125e-05, 0.0005846023559570312, 0.001186370849609375, 0.0017881393432617188, 0.0023899078369140625, 0.0029916763305664062, 0.00359344482421875, 0.004195213317871094, 0.0047969818115234375, 0.005398750305175781, 0.006000518798828125, 0.006602287292480469, 0.0072040557861328125, 0.007805824279785156, 0.0084075927734375, 0.009009361267089844, 0.009611129760742188, 0.010212898254394531, 0.010814666748046875, 0.011416435241699219, 0.012018203735351562, 0.012619972229003906, 0.01322174072265625, 0.013823509216308594, 0.014425277709960938, 0.015027046203613281, 0.015628814697265625, 0.01623058319091797, 0.016832351684570312, 0.017434120178222656, 0.018035888671875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 1.0, 12.0, 11.0, 15.0, 18.0, 23.0, 24.0, 21.0, 25.0, 39.0, 44.0, 42.0, 53.0, 49.0, 62.0, 56.0, 59.0, 55.0, 46.0, 49.0, 55.0, 32.0, 39.0, 16.0, 24.0, 16.0, 17.0, 12.0, 16.0, 14.0, 7.0, 1.0, 7.0, 5.0, 6.0, 2.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0050506591796875, -0.004868268966674805, -0.004685878753662109, -0.004503488540649414, -0.004321098327636719, -0.0041387081146240234, -0.003956317901611328, -0.003773927688598633, -0.0035915374755859375, -0.003409147262573242, -0.003226757049560547, -0.0030443668365478516, -0.0028619766235351562, -0.002679586410522461, -0.0024971961975097656, -0.0023148059844970703, -0.002132415771484375, -0.0019500255584716797, -0.0017676353454589844, -0.001585245132446289, -0.0014028549194335938, -0.0012204647064208984, -0.0010380744934082031, -0.0008556842803955078, -0.0006732940673828125, -0.0004909038543701172, -0.0003085136413574219, -0.00012612342834472656, 5.626678466796875e-05, 0.00023865699768066406, 0.0004210472106933594, 0.0006034374237060547, 0.00078582763671875, 0.0009682178497314453, 0.0011506080627441406, 0.001332998275756836, 0.0015153884887695312, 0.0016977787017822266, 0.0018801689147949219, 0.002062559127807617, 0.0022449493408203125, 0.002427339553833008, 0.002609729766845703, 0.0027921199798583984, 0.0029745101928710938, 0.003156900405883789, 0.0033392906188964844, 0.0035216808319091797, 0.003704071044921875, 0.0038864612579345703, 0.004068851470947266, 0.004251241683959961, 0.004433631896972656, 0.0046160221099853516, 0.004798412322998047, 0.004980802536010742, 0.0051631927490234375, 0.005345582962036133, 0.005527973175048828, 0.0057103633880615234, 0.005892753601074219, 0.006075143814086914, 0.006257534027099609, 0.006439924240112305, 0.006622314453125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 14.0, 12.0, 11.0, 29.0, 22.0, 33.0, 36.0, 56.0, 71.0, 95.0, 90.0, 78.0, 84.0, 80.0, 58.0, 54.0, 37.0, 34.0, 16.0, 17.0, 20.0, 6.0, 10.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.582271575927734, -6.323905944824219, -6.065540790557861, -5.807175159454346, -5.548810005187988, -5.290444374084473, -5.032078742980957, -4.7737135887146, -4.515348434448242, -4.256982803344727, -3.998617649078369, -3.7402520179748535, -3.481886863708496, -3.2235212326049805, -2.965155839920044, -2.7067904472351074, -2.448424816131592, -2.1900594234466553, -1.9316940307617188, -1.6733285188674927, -1.4149631261825562, -1.1565977334976196, -0.8982322216033936, -0.639866828918457, -0.3815014362335205, -0.1231360137462616, 0.13522940874099731, 0.3935948610305786, 0.6519602537155151, 0.9103256464004517, 1.1686911582946777, 1.4270565509796143, 1.6854219436645508, 1.9437873363494873, 2.202152729034424, 2.4605183601379395, 2.718883514404297, 2.9772491455078125, 3.235614538192749, 3.4939799308776855, 3.752345323562622, 4.010710716247559, 4.269076347351074, 4.527441501617432, 4.785807132720947, 5.044172286987305, 5.30253791809082, 5.560903549194336, 5.819268703460693, 6.077634334564209, 6.335999488830566, 6.594365119934082, 6.8527302742004395, 7.111095905303955, 7.3694610595703125, 7.627826690673828, 7.886192321777344, 8.14455795288086, 8.402923583984375, 8.661288261413574, 8.91965389251709, 9.178019523620605, 9.436385154724121, 9.69474983215332, 9.953115463256836]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 9.0, 2.0, 9.0, 3.0, 6.0, 11.0, 8.0, 17.0, 16.0, 19.0, 23.0, 23.0, 21.0, 30.0, 25.0, 35.0, 32.0, 36.0, 44.0, 35.0, 51.0, 51.0, 28.0, 36.0, 45.0, 46.0, 31.0, 34.0, 38.0, 26.0, 23.0, 36.0, 14.0, 34.0, 20.0, 18.0, 19.0, 14.0, 8.0, 6.0, 6.0, 8.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.406991481781006, -5.215378284454346, -5.0237650871276855, -4.832151889801025, -4.640538692474365, -4.448925495147705, -4.257312774658203, -4.065699577331543, -3.8740861415863037, -3.6824729442596436, -3.4908597469329834, -3.2992467880249023, -3.107633590698242, -2.916020393371582, -2.724407196044922, -2.5327939987182617, -2.3411808013916016, -2.1495676040649414, -1.9579544067382812, -1.7663413286209106, -1.5747281312942505, -1.3831149339675903, -1.1915018558502197, -0.9998886585235596, -0.8082754611968994, -0.6166622638702393, -0.4250491261482239, -0.2334359884262085, -0.04182279109954834, 0.14979040622711182, 0.3414034843444824, 0.5330166816711426, 0.7246298789978027, 0.9162430763244629, 1.107856273651123, 1.2994693517684937, 1.4910825490951538, 1.682695746421814, 1.8743088245391846, 2.0659220218658447, 2.257535219192505, 2.449148416519165, 2.640761613845825, 2.8323745727539062, 3.0239877700805664, 3.2156009674072266, 3.4072141647338867, 3.598827362060547, 3.790440559387207, 3.982053756713867, 4.173666954040527, 4.3652801513671875, 4.556893348693848, 4.748506546020508, 4.940119743347168, 5.131732940673828, 5.323346138000488, 5.514959335327148, 5.706572532653809, 5.898185729980469, 6.089798927307129, 6.281412124633789, 6.473025321960449, 6.664638519287109, 6.856251239776611]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 11.0, 15.0, 22.0, 29.0, 63.0, 108.0, 128.0, 195.0, 285.0, 413.0, 684.0, 1025.0, 1554.0, 2397.0, 3627.0, 5385.0, 8281.0, 12893.0, 20032.0, 31193.0, 48920.0, 76654.0, 116229.0, 155347.0, 166364.0, 135715.0, 93290.0, 59773.0, 38273.0, 24443.0, 15665.0, 10196.0, 6780.0, 4276.0, 2848.0, 1810.0, 1275.0, 787.0, 566.0, 325.0, 215.0, 148.0, 98.0, 78.0, 47.0, 34.0, 21.0, 10.0, 7.0, 8.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.16796875, -6.93841552734375, -6.7088623046875, -6.47930908203125, -6.249755859375, -6.02020263671875, -5.7906494140625, -5.56109619140625, -5.33154296875, -5.10198974609375, -4.8724365234375, -4.64288330078125, -4.413330078125, -4.18377685546875, -3.9542236328125, -3.72467041015625, -3.4951171875, -3.26556396484375, -3.0360107421875, -2.80645751953125, -2.576904296875, -2.34735107421875, -2.1177978515625, -1.88824462890625, -1.65869140625, -1.42913818359375, -1.1995849609375, -0.97003173828125, -0.740478515625, -0.51092529296875, -0.2813720703125, -0.05181884765625, 0.177734375, 0.40728759765625, 0.6368408203125, 0.86639404296875, 1.095947265625, 1.32550048828125, 1.5550537109375, 1.78460693359375, 2.01416015625, 2.24371337890625, 2.4732666015625, 2.70281982421875, 2.932373046875, 3.16192626953125, 3.3914794921875, 3.62103271484375, 3.8505859375, 4.08013916015625, 4.3096923828125, 4.53924560546875, 4.768798828125, 4.99835205078125, 5.2279052734375, 5.45745849609375, 5.68701171875, 5.91656494140625, 6.1461181640625, 6.37567138671875, 6.605224609375, 6.83477783203125, 7.0643310546875, 7.29388427734375, 7.5234375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 5.0, 12.0, 13.0, 16.0, 14.0, 22.0, 21.0, 26.0, 25.0, 23.0, 39.0, 34.0, 36.0, 42.0, 38.0, 48.0, 54.0, 45.0, 42.0, 36.0, 41.0, 41.0, 45.0, 31.0, 32.0, 33.0, 22.0, 32.0, 23.0, 16.0, 18.0, 15.0, 6.0, 11.0, 7.0, 4.0, 7.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.20703125, -5.01654052734375, -4.8260498046875, -4.63555908203125, -4.445068359375, -4.25457763671875, -4.0640869140625, -3.87359619140625, -3.68310546875, -3.49261474609375, -3.3021240234375, -3.11163330078125, -2.921142578125, -2.73065185546875, -2.5401611328125, -2.34967041015625, -2.1591796875, -1.96868896484375, -1.7781982421875, -1.58770751953125, -1.397216796875, -1.20672607421875, -1.0162353515625, -0.82574462890625, -0.63525390625, -0.44476318359375, -0.2542724609375, -0.06378173828125, 0.126708984375, 0.31719970703125, 0.5076904296875, 0.69818115234375, 0.888671875, 1.07916259765625, 1.2696533203125, 1.46014404296875, 1.650634765625, 1.84112548828125, 2.0316162109375, 2.22210693359375, 2.41259765625, 2.60308837890625, 2.7935791015625, 2.98406982421875, 3.174560546875, 3.36505126953125, 3.5555419921875, 3.74603271484375, 3.9365234375, 4.12701416015625, 4.3175048828125, 4.50799560546875, 4.698486328125, 4.88897705078125, 5.0794677734375, 5.26995849609375, 5.46044921875, 5.65093994140625, 5.8414306640625, 6.03192138671875, 6.222412109375, 6.41290283203125, 6.6033935546875, 6.79388427734375, 6.984375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 11.0, 17.0, 26.0, 43.0, 49.0, 100.0, 151.0, 188.0, 338.0, 484.0, 799.0, 1179.0, 1856.0, 2844.0, 4404.0, 6773.0, 10523.0, 16438.0, 26019.0, 41894.0, 67328.0, 105438.0, 150762.0, 174930.0, 150525.0, 104771.0, 67099.0, 41760.0, 25988.0, 16342.0, 10539.0, 6663.0, 4271.0, 2844.0, 1761.0, 1198.0, 760.0, 483.0, 318.0, 216.0, 134.0, 89.0, 61.0, 48.0, 33.0, 15.0, 16.0, 13.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0], "bins": [-7.97265625, -7.734619140625, -7.49658203125, -7.258544921875, -7.0205078125, -6.782470703125, -6.54443359375, -6.306396484375, -6.068359375, -5.830322265625, -5.59228515625, -5.354248046875, -5.1162109375, -4.878173828125, -4.64013671875, -4.402099609375, -4.1640625, -3.926025390625, -3.68798828125, -3.449951171875, -3.2119140625, -2.973876953125, -2.73583984375, -2.497802734375, -2.259765625, -2.021728515625, -1.78369140625, -1.545654296875, -1.3076171875, -1.069580078125, -0.83154296875, -0.593505859375, -0.35546875, -0.117431640625, 0.12060546875, 0.358642578125, 0.5966796875, 0.834716796875, 1.07275390625, 1.310791015625, 1.548828125, 1.786865234375, 2.02490234375, 2.262939453125, 2.5009765625, 2.739013671875, 2.97705078125, 3.215087890625, 3.453125, 3.691162109375, 3.92919921875, 4.167236328125, 4.4052734375, 4.643310546875, 4.88134765625, 5.119384765625, 5.357421875, 5.595458984375, 5.83349609375, 6.071533203125, 6.3095703125, 6.547607421875, 6.78564453125, 7.023681640625, 7.26171875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 11.0, 9.0, 12.0, 10.0, 17.0, 14.0, 17.0, 21.0, 25.0, 25.0, 19.0, 32.0, 31.0, 31.0, 29.0, 38.0, 31.0, 29.0, 50.0, 51.0, 46.0, 41.0, 54.0, 33.0, 39.0, 30.0, 33.0, 21.0, 20.0, 30.0, 26.0, 21.0, 16.0, 13.0, 10.0, 14.0, 12.0, 9.0, 11.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.947265625, -3.837066650390625, -3.72686767578125, -3.616668701171875, -3.5064697265625, -3.396270751953125, -3.28607177734375, -3.175872802734375, -3.065673828125, -2.955474853515625, -2.84527587890625, -2.735076904296875, -2.6248779296875, -2.514678955078125, -2.40447998046875, -2.294281005859375, -2.18408203125, -2.073883056640625, -1.96368408203125, -1.853485107421875, -1.7432861328125, -1.633087158203125, -1.52288818359375, -1.412689208984375, -1.302490234375, -1.192291259765625, -1.08209228515625, -0.971893310546875, -0.8616943359375, -0.751495361328125, -0.64129638671875, -0.531097412109375, -0.4208984375, -0.310699462890625, -0.20050048828125, -0.090301513671875, 0.0198974609375, 0.130096435546875, 0.24029541015625, 0.350494384765625, 0.460693359375, 0.570892333984375, 0.68109130859375, 0.791290283203125, 0.9014892578125, 1.011688232421875, 1.12188720703125, 1.232086181640625, 1.34228515625, 1.452484130859375, 1.56268310546875, 1.672882080078125, 1.7830810546875, 1.893280029296875, 2.00347900390625, 2.113677978515625, 2.223876953125, 2.334075927734375, 2.44427490234375, 2.554473876953125, 2.6646728515625, 2.774871826171875, 2.88507080078125, 2.995269775390625, 3.10546875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 13.0, 12.0, 15.0, 27.0, 38.0, 48.0, 70.0, 123.0, 141.0, 191.0, 317.0, 402.0, 590.0, 879.0, 1236.0, 1888.0, 3129.0, 4883.0, 8517.0, 16646.0, 41240.0, 172064.0, 603826.0, 123210.0, 34012.0, 14417.0, 7673.0, 4494.0, 2815.0, 1770.0, 1176.0, 821.0, 554.0, 355.0, 286.0, 198.0, 130.0, 109.0, 70.0, 54.0, 38.0, 18.0, 26.0, 13.0, 4.0, 6.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.06640625, -4.90509033203125, -4.7437744140625, -4.58245849609375, -4.421142578125, -4.25982666015625, -4.0985107421875, -3.93719482421875, -3.77587890625, -3.61456298828125, -3.4532470703125, -3.29193115234375, -3.130615234375, -2.96929931640625, -2.8079833984375, -2.64666748046875, -2.4853515625, -2.32403564453125, -2.1627197265625, -2.00140380859375, -1.840087890625, -1.67877197265625, -1.5174560546875, -1.35614013671875, -1.19482421875, -1.03350830078125, -0.8721923828125, -0.71087646484375, -0.549560546875, -0.38824462890625, -0.2269287109375, -0.06561279296875, 0.095703125, 0.25701904296875, 0.4183349609375, 0.57965087890625, 0.740966796875, 0.90228271484375, 1.0635986328125, 1.22491455078125, 1.38623046875, 1.54754638671875, 1.7088623046875, 1.87017822265625, 2.031494140625, 2.19281005859375, 2.3541259765625, 2.51544189453125, 2.6767578125, 2.83807373046875, 2.9993896484375, 3.16070556640625, 3.322021484375, 3.48333740234375, 3.6446533203125, 3.80596923828125, 3.96728515625, 4.12860107421875, 4.2899169921875, 4.45123291015625, 4.612548828125, 4.77386474609375, 4.9351806640625, 5.09649658203125, 5.2578125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 3.0, 5.0, 11.0, 29.0, 20.0, 40.0, 70.0, 99.0, 159.0, 207.0, 130.0, 89.0, 57.0, 24.0, 20.0, 12.0, 8.0, 12.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004024505615234375, -0.000392913818359375, -0.0003833770751953125, -0.00037384033203125, -0.0003643035888671875, -0.000354766845703125, -0.0003452301025390625, -0.000335693359375, -0.0003261566162109375, -0.000316619873046875, -0.0003070831298828125, -0.00029754638671875, -0.0002880096435546875, -0.000278472900390625, -0.0002689361572265625, -0.0002593994140625, -0.0002498626708984375, -0.000240325927734375, -0.0002307891845703125, -0.00022125244140625, -0.0002117156982421875, -0.000202178955078125, -0.0001926422119140625, -0.00018310546875, -0.0001735687255859375, -0.000164031982421875, -0.0001544952392578125, -0.00014495849609375, -0.0001354217529296875, -0.000125885009765625, -0.0001163482666015625, -0.0001068115234375, -9.72747802734375e-05, -8.7738037109375e-05, -7.82012939453125e-05, -6.866455078125e-05, -5.91278076171875e-05, -4.9591064453125e-05, -4.00543212890625e-05, -3.0517578125e-05, -2.09808349609375e-05, -1.1444091796875e-05, -1.9073486328125e-06, 7.62939453125e-06, 1.71661376953125e-05, 2.6702880859375e-05, 3.62396240234375e-05, 4.57763671875e-05, 5.53131103515625e-05, 6.4849853515625e-05, 7.43865966796875e-05, 8.392333984375e-05, 9.34600830078125e-05, 0.000102996826171875, 0.0001125335693359375, 0.0001220703125, 0.0001316070556640625, 0.000141143798828125, 0.0001506805419921875, 0.00016021728515625, 0.0001697540283203125, 0.000179290771484375, 0.0001888275146484375, 0.0001983642578125, 0.0002079010009765625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 2.0, 7.0, 6.0, 7.0, 9.0, 8.0, 9.0, 19.0, 31.0, 39.0, 37.0, 67.0, 102.0, 165.0, 220.0, 297.0, 467.0, 708.0, 1136.0, 1942.0, 3306.0, 6261.0, 13291.0, 32966.0, 122298.0, 618517.0, 173179.0, 41119.0, 15477.0, 7316.0, 3797.0, 2155.0, 1222.0, 780.0, 517.0, 315.0, 215.0, 156.0, 85.0, 86.0, 57.0, 46.0, 26.0, 15.0, 21.0, 13.0, 9.0, 7.0, 11.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.640625, -5.46759033203125, -5.2945556640625, -5.12152099609375, -4.948486328125, -4.77545166015625, -4.6024169921875, -4.42938232421875, -4.25634765625, -4.08331298828125, -3.9102783203125, -3.73724365234375, -3.564208984375, -3.39117431640625, -3.2181396484375, -3.04510498046875, -2.8720703125, -2.69903564453125, -2.5260009765625, -2.35296630859375, -2.179931640625, -2.00689697265625, -1.8338623046875, -1.66082763671875, -1.48779296875, -1.31475830078125, -1.1417236328125, -0.96868896484375, -0.795654296875, -0.62261962890625, -0.4495849609375, -0.27655029296875, -0.103515625, 0.06951904296875, 0.2425537109375, 0.41558837890625, 0.588623046875, 0.76165771484375, 0.9346923828125, 1.10772705078125, 1.28076171875, 1.45379638671875, 1.6268310546875, 1.79986572265625, 1.972900390625, 2.14593505859375, 2.3189697265625, 2.49200439453125, 2.6650390625, 2.83807373046875, 3.0111083984375, 3.18414306640625, 3.357177734375, 3.53021240234375, 3.7032470703125, 3.87628173828125, 4.04931640625, 4.22235107421875, 4.3953857421875, 4.56842041015625, 4.741455078125, 4.91448974609375, 5.0875244140625, 5.26055908203125, 5.43359375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 3.0, 15.0, 15.0, 25.0, 20.0, 49.0, 60.0, 106.0, 175.0, 200.0, 106.0, 55.0, 33.0, 26.0, 19.0, 18.0, 16.0, 11.0, 8.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.236328125, -1.18255615234375, -1.1287841796875, -1.07501220703125, -1.021240234375, -0.96746826171875, -0.9136962890625, -0.85992431640625, -0.80615234375, -0.75238037109375, -0.6986083984375, -0.64483642578125, -0.591064453125, -0.53729248046875, -0.4835205078125, -0.42974853515625, -0.3759765625, -0.32220458984375, -0.2684326171875, -0.21466064453125, -0.160888671875, -0.10711669921875, -0.0533447265625, 0.00042724609375, 0.05419921875, 0.10797119140625, 0.1617431640625, 0.21551513671875, 0.269287109375, 0.32305908203125, 0.3768310546875, 0.43060302734375, 0.484375, 0.53814697265625, 0.5919189453125, 0.64569091796875, 0.699462890625, 0.75323486328125, 0.8070068359375, 0.86077880859375, 0.91455078125, 0.96832275390625, 1.0220947265625, 1.07586669921875, 1.129638671875, 1.18341064453125, 1.2371826171875, 1.29095458984375, 1.3447265625, 1.39849853515625, 1.4522705078125, 1.50604248046875, 1.559814453125, 1.61358642578125, 1.6673583984375, 1.72113037109375, 1.77490234375, 1.82867431640625, 1.8824462890625, 1.93621826171875, 1.989990234375, 2.04376220703125, 2.0975341796875, 2.15130615234375, 2.205078125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 11.0, 7.0, 11.0, 16.0, 18.0, 28.0, 40.0, 39.0, 51.0, 75.0, 95.0, 95.0, 90.0, 77.0, 82.0, 45.0, 53.0, 34.0, 29.0, 21.0, 15.0, 15.0, 10.0, 12.0, 8.0, 3.0, 3.0, 3.0, 3.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.612399578094482, -6.362186431884766, -6.111973285675049, -5.861760139465332, -5.611547470092773, -5.361333847045898, -5.11112117767334, -4.860908031463623, -4.610694885253906, -4.3604817390441895, -4.110268592834473, -3.860055685043335, -3.609842538833618, -3.3596293926239014, -3.1094164848327637, -2.859203338623047, -2.60899019241333, -2.3587770462036133, -2.1085638999938965, -1.8583509922027588, -1.608137845993042, -1.3579246997833252, -1.107711672782898, -0.8574986457824707, -0.6072854995727539, -0.3570724129676819, -0.10685932636260986, 0.14335376024246216, 0.3935668468475342, 0.643779993057251, 0.8939930200576782, 1.1442060470581055, 1.394418716430664, 1.6446318626403809, 1.894844889640808, 2.1450579166412354, 2.395271062850952, 2.645484209060669, 2.8956971168518066, 3.1459102630615234, 3.3961234092712402, 3.646336555480957, 3.896549701690674, 4.146762847900391, 4.396975517272949, 4.647189140319824, 4.897401809692383, 5.1476149559021, 5.397828102111816, 5.648041248321533, 5.89825439453125, 6.148467540740967, 6.398680686950684, 6.648893356323242, 6.899106502532959, 7.149319648742676, 7.399532794952393, 7.649745941162109, 7.899959087371826, 8.150172233581543, 8.400384902954102, 8.650598526000977, 8.900811195373535, 9.151023864746094, 9.401237487792969]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 2.0, 10.0, 6.0, 11.0, 17.0, 7.0, 14.0, 18.0, 18.0, 22.0, 23.0, 23.0, 30.0, 32.0, 33.0, 32.0, 39.0, 35.0, 33.0, 48.0, 52.0, 38.0, 30.0, 37.0, 47.0, 39.0, 31.0, 39.0, 27.0, 37.0, 24.0, 23.0, 18.0, 19.0, 13.0, 11.0, 15.0, 10.0, 11.0, 9.0, 3.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8031721115112305, -5.610118865966797, -5.417065620422363, -5.22401237487793, -5.030959129333496, -4.837906360626221, -4.644853115081787, -4.4517998695373535, -4.25874662399292, -4.065693378448486, -3.8726401329040527, -3.6795871257781982, -3.4865338802337646, -3.293480634689331, -3.1004276275634766, -2.907374382019043, -2.7143211364746094, -2.521267890930176, -2.328214645385742, -2.1351616382598877, -1.942108392715454, -1.7490551471710205, -1.5560020208358765, -1.3629488945007324, -1.1698956489562988, -0.97684246301651, -0.7837892770767212, -0.5907360911369324, -0.39768290519714355, -0.20462971925735474, -0.011576533317565918, 0.18147659301757812, 0.3745298385620117, 0.5675830245018005, 0.7606362104415894, 0.9536893963813782, 1.146742582321167, 1.3397958278656006, 1.5328489542007446, 1.7259020805358887, 1.9189553260803223, 2.112008571624756, 2.3050618171691895, 2.498114824295044, 2.6911680698394775, 2.884221315383911, 3.0772743225097656, 3.270327568054199, 3.463380813598633, 3.6564340591430664, 3.8494873046875, 4.042540550231934, 4.235593795776367, 4.428646564483643, 4.621699810028076, 4.81475305557251, 5.007806301116943, 5.200859546661377, 5.3939127922058105, 5.586966037750244, 5.7800188064575195, 5.973072052001953, 6.166125297546387, 6.35917854309082, 6.552231788635254]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 7.0, 13.0, 20.0, 22.0, 49.0, 75.0, 99.0, 153.0, 263.0, 375.0, 597.0, 994.0, 1571.0, 2668.0, 4212.0, 7468.0, 12431.0, 22285.0, 40234.0, 75608.0, 150338.0, 353989.0, 1035795.0, 1435329.0, 606116.0, 223620.0, 102589.0, 52471.0, 28048.0, 15494.0, 8593.0, 5104.0, 3057.0, 1719.0, 1065.0, 654.0, 386.0, 267.0, 180.0, 113.0, 59.0, 52.0, 32.0, 25.0, 19.0, 14.0, 4.0, 4.0, 7.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.25848388671875, -6.9818115234375, -6.70513916015625, -6.428466796875, -6.15179443359375, -5.8751220703125, -5.59844970703125, -5.32177734375, -5.04510498046875, -4.7684326171875, -4.49176025390625, -4.215087890625, -3.93841552734375, -3.6617431640625, -3.38507080078125, -3.1083984375, -2.83172607421875, -2.5550537109375, -2.27838134765625, -2.001708984375, -1.72503662109375, -1.4483642578125, -1.17169189453125, -0.89501953125, -0.61834716796875, -0.3416748046875, -0.06500244140625, 0.211669921875, 0.48834228515625, 0.7650146484375, 1.04168701171875, 1.318359375, 1.59503173828125, 1.8717041015625, 2.14837646484375, 2.425048828125, 2.70172119140625, 2.9783935546875, 3.25506591796875, 3.53173828125, 3.80841064453125, 4.0850830078125, 4.36175537109375, 4.638427734375, 4.91510009765625, 5.1917724609375, 5.46844482421875, 5.7451171875, 6.02178955078125, 6.2984619140625, 6.57513427734375, 6.851806640625, 7.12847900390625, 7.4051513671875, 7.68182373046875, 7.95849609375, 8.23516845703125, 8.5118408203125, 8.78851318359375, 9.065185546875, 9.34185791015625, 9.6185302734375, 9.89520263671875, 10.171875]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 5.0, 11.0, 4.0, 15.0, 12.0, 8.0, 24.0, 19.0, 25.0, 16.0, 29.0, 25.0, 26.0, 37.0, 38.0, 39.0, 48.0, 49.0, 46.0, 45.0, 32.0, 53.0, 47.0, 39.0, 38.0, 36.0, 42.0, 29.0, 25.0, 28.0, 17.0, 14.0, 15.0, 14.0, 14.0, 8.0, 7.0, 8.0, 2.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.924560546875, -4.75146484375, -4.578369140625, -4.4052734375, -4.232177734375, -4.05908203125, -3.885986328125, -3.712890625, -3.539794921875, -3.36669921875, -3.193603515625, -3.0205078125, -2.847412109375, -2.67431640625, -2.501220703125, -2.328125, -2.155029296875, -1.98193359375, -1.808837890625, -1.6357421875, -1.462646484375, -1.28955078125, -1.116455078125, -0.943359375, -0.770263671875, -0.59716796875, -0.424072265625, -0.2509765625, -0.077880859375, 0.09521484375, 0.268310546875, 0.44140625, 0.614501953125, 0.78759765625, 0.960693359375, 1.1337890625, 1.306884765625, 1.47998046875, 1.653076171875, 1.826171875, 1.999267578125, 2.17236328125, 2.345458984375, 2.5185546875, 2.691650390625, 2.86474609375, 3.037841796875, 3.2109375, 3.384033203125, 3.55712890625, 3.730224609375, 3.9033203125, 4.076416015625, 4.24951171875, 4.422607421875, 4.595703125, 4.768798828125, 4.94189453125, 5.114990234375, 5.2880859375, 5.461181640625, 5.63427734375, 5.807373046875, 5.98046875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 5.0, 18.0, 16.0, 34.0, 44.0, 105.0, 146.0, 304.0, 516.0, 872.0, 1544.0, 2858.0, 5045.0, 9202.0, 18014.0, 35509.0, 73437.0, 161043.0, 376571.0, 922512.0, 1379631.0, 686971.0, 280547.0, 123065.0, 56708.0, 28132.0, 14337.0, 7631.0, 4149.0, 2249.0, 1335.0, 719.0, 423.0, 242.0, 135.0, 76.0, 51.0, 35.0, 10.0, 16.0, 11.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.9234619140625, -7.643798828125, -7.3641357421875, -7.08447265625, -6.8048095703125, -6.525146484375, -6.2454833984375, -5.9658203125, -5.6861572265625, -5.406494140625, -5.1268310546875, -4.84716796875, -4.5675048828125, -4.287841796875, -4.0081787109375, -3.728515625, -3.4488525390625, -3.169189453125, -2.8895263671875, -2.60986328125, -2.3302001953125, -2.050537109375, -1.7708740234375, -1.4912109375, -1.2115478515625, -0.931884765625, -0.6522216796875, -0.37255859375, -0.0928955078125, 0.186767578125, 0.4664306640625, 0.74609375, 1.0257568359375, 1.305419921875, 1.5850830078125, 1.86474609375, 2.1444091796875, 2.424072265625, 2.7037353515625, 2.9833984375, 3.2630615234375, 3.542724609375, 3.8223876953125, 4.10205078125, 4.3817138671875, 4.661376953125, 4.9410400390625, 5.220703125, 5.5003662109375, 5.780029296875, 6.0596923828125, 6.33935546875, 6.6190185546875, 6.898681640625, 7.1783447265625, 7.4580078125, 7.7376708984375, 8.017333984375, 8.2969970703125, 8.57666015625, 8.8563232421875, 9.135986328125, 9.4156494140625, 9.6953125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 11.0, 9.0, 7.0, 11.0, 20.0, 30.0, 31.0, 36.0, 57.0, 76.0, 88.0, 116.0, 141.0, 163.0, 186.0, 259.0, 279.0, 324.0, 334.0, 333.0, 299.0, 239.0, 194.0, 167.0, 136.0, 97.0, 81.0, 69.0, 72.0, 55.0, 26.0, 34.0, 28.0, 28.0, 7.0, 12.0, 3.0, 13.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6953125, -2.6007080078125, -2.506103515625, -2.4114990234375, -2.31689453125, -2.2222900390625, -2.127685546875, -2.0330810546875, -1.9384765625, -1.8438720703125, -1.749267578125, -1.6546630859375, -1.56005859375, -1.4654541015625, -1.370849609375, -1.2762451171875, -1.181640625, -1.0870361328125, -0.992431640625, -0.8978271484375, -0.80322265625, -0.7086181640625, -0.614013671875, -0.5194091796875, -0.4248046875, -0.3302001953125, -0.235595703125, -0.1409912109375, -0.04638671875, 0.0482177734375, 0.142822265625, 0.2374267578125, 0.33203125, 0.4266357421875, 0.521240234375, 0.6158447265625, 0.71044921875, 0.8050537109375, 0.899658203125, 0.9942626953125, 1.0888671875, 1.1834716796875, 1.278076171875, 1.3726806640625, 1.46728515625, 1.5618896484375, 1.656494140625, 1.7510986328125, 1.845703125, 1.9403076171875, 2.034912109375, 2.1295166015625, 2.22412109375, 2.3187255859375, 2.413330078125, 2.5079345703125, 2.6025390625, 2.6971435546875, 2.791748046875, 2.8863525390625, 2.98095703125, 3.0755615234375, 3.170166015625, 3.2647705078125, 3.359375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 9.0, 9.0, 11.0, 14.0, 11.0, 18.0, 18.0, 35.0, 32.0, 38.0, 57.0, 57.0, 68.0, 74.0, 75.0, 70.0, 74.0, 58.0, 48.0, 49.0, 36.0, 22.0, 20.0, 17.0, 20.0, 5.0, 6.0, 15.0, 7.0, 4.0, 3.0, 3.0, 5.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.081671714782715, -4.884668350219727, -4.687664985656738, -4.49066162109375, -4.293658256530762, -4.096654891967773, -3.899651527404785, -3.702648162841797, -3.5056447982788086, -3.3086414337158203, -3.111638069152832, -2.9146347045898438, -2.7176313400268555, -2.520627975463867, -2.323624610900879, -2.1266212463378906, -1.9296176433563232, -1.732614278793335, -1.5356109142303467, -1.3386075496673584, -1.1416041851043701, -0.9446007609367371, -0.747597336769104, -0.5505939722061157, -0.35359060764312744, -0.15658722817897797, 0.04041615128517151, 0.23741954565048218, 0.43442291021347046, 0.6314262747764587, 0.8284296989440918, 1.02543306350708, 1.2224364280700684, 1.4194397926330566, 1.616443157196045, 1.8134465217590332, 2.0104498863220215, 2.2074532508850098, 2.404456615447998, 2.6014599800109863, 2.7984633445739746, 2.995466709136963, 3.192470073699951, 3.3894734382629395, 3.5864768028259277, 3.783480167388916, 3.9804835319519043, 4.177486896514893, 4.374490737915039, 4.571494102478027, 4.768497467041016, 4.965500831604004, 5.162504196166992, 5.3595075607299805, 5.556510925292969, 5.753514289855957, 5.950517654418945, 6.147521018981934, 6.344524383544922, 6.54152774810791, 6.738531112670898, 6.935534477233887, 7.132537841796875, 7.329541206359863, 7.526544570922852]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 0.0, 4.0, 7.0, 7.0, 8.0, 7.0, 13.0, 8.0, 15.0, 17.0, 17.0, 8.0, 23.0, 23.0, 31.0, 26.0, 40.0, 32.0, 38.0, 41.0, 37.0, 26.0, 32.0, 33.0, 38.0, 35.0, 33.0, 41.0, 36.0, 43.0, 34.0, 37.0, 21.0, 26.0, 24.0, 20.0, 16.0, 14.0, 17.0, 15.0, 12.0, 8.0, 11.0, 9.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.153041362762451, -4.986894130706787, -4.820746898651123, -4.654600143432617, -4.488452911376953, -4.322305679321289, -4.156158447265625, -3.990011215209961, -3.823863983154297, -3.657716751098633, -3.491569757461548, -3.325422525405884, -3.1592752933502197, -2.9931282997131348, -2.8269810676574707, -2.6608338356018066, -2.4946868419647217, -2.3285396099090576, -2.1623926162719727, -1.9962453842163086, -1.8300981521606445, -1.66395103931427, -1.4978039264678955, -1.3316566944122314, -1.165509581565857, -0.9993624091148376, -0.8332152366638184, -0.6670681238174438, -0.5009209513664246, -0.3347737789154053, -0.16862666606903076, -0.0024794340133666992, 0.1636676788330078, 0.3298148512840271, 0.495961993932724, 0.6621091365814209, 0.8282563090324402, 0.9944034814834595, 1.160550594329834, 1.326697826385498, 1.4928449392318726, 1.658992052078247, 1.8251392841339111, 1.9912863969802856, 2.15743350982666, 2.323580741882324, 2.4897279739379883, 2.6558752059936523, 2.8220221996307373, 2.9881694316864014, 3.1543164253234863, 3.3204636573791504, 3.4866108894348145, 3.6527581214904785, 3.8189051151275635, 3.9850523471832275, 4.1511993408203125, 4.317346572875977, 4.483493804931641, 4.649641036987305, 4.8157877922058105, 4.981935024261475, 5.148082256317139, 5.314229488372803, 5.480376720428467]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 7.0, 8.0, 14.0, 18.0, 32.0, 46.0, 76.0, 108.0, 129.0, 236.0, 276.0, 401.0, 584.0, 931.0, 1332.0, 1953.0, 2914.0, 4282.0, 6344.0, 9576.0, 14217.0, 21192.0, 32279.0, 49245.0, 76094.0, 121211.0, 187840.0, 184042.0, 117395.0, 73834.0, 48160.0, 31235.0, 20470.0, 13610.0, 9246.0, 6158.0, 4247.0, 2851.0, 1853.0, 1286.0, 877.0, 629.0, 403.0, 310.0, 191.0, 146.0, 97.0, 60.0, 42.0, 23.0, 27.0, 7.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.984375, -1.9202880859375, -1.856201171875, -1.7921142578125, -1.72802734375, -1.6639404296875, -1.599853515625, -1.5357666015625, -1.4716796875, -1.4075927734375, -1.343505859375, -1.2794189453125, -1.21533203125, -1.1512451171875, -1.087158203125, -1.0230712890625, -0.958984375, -0.8948974609375, -0.830810546875, -0.7667236328125, -0.70263671875, -0.6385498046875, -0.574462890625, -0.5103759765625, -0.4462890625, -0.3822021484375, -0.318115234375, -0.2540283203125, -0.18994140625, -0.1258544921875, -0.061767578125, 0.0023193359375, 0.06640625, 0.1304931640625, 0.194580078125, 0.2586669921875, 0.32275390625, 0.3868408203125, 0.450927734375, 0.5150146484375, 0.5791015625, 0.6431884765625, 0.707275390625, 0.7713623046875, 0.83544921875, 0.8995361328125, 0.963623046875, 1.0277099609375, 1.091796875, 1.1558837890625, 1.219970703125, 1.2840576171875, 1.34814453125, 1.4122314453125, 1.476318359375, 1.5404052734375, 1.6044921875, 1.6685791015625, 1.732666015625, 1.7967529296875, 1.86083984375, 1.9249267578125, 1.989013671875, 2.0531005859375, 2.1171875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 8.0, 9.0, 6.0, 8.0, 9.0, 14.0, 15.0, 16.0, 17.0, 13.0, 22.0, 27.0, 25.0, 34.0, 40.0, 31.0, 44.0, 42.0, 33.0, 35.0, 39.0, 40.0, 36.0, 37.0, 47.0, 40.0, 40.0, 45.0, 34.0, 29.0, 21.0, 26.0, 21.0, 13.0, 19.0, 11.0, 17.0, 11.0, 10.0, 4.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.538818359375, -5.35498046875, -5.171142578125, -4.9873046875, -4.803466796875, -4.61962890625, -4.435791015625, -4.251953125, -4.068115234375, -3.88427734375, -3.700439453125, -3.5166015625, -3.332763671875, -3.14892578125, -2.965087890625, -2.78125, -2.597412109375, -2.41357421875, -2.229736328125, -2.0458984375, -1.862060546875, -1.67822265625, -1.494384765625, -1.310546875, -1.126708984375, -0.94287109375, -0.759033203125, -0.5751953125, -0.391357421875, -0.20751953125, -0.023681640625, 0.16015625, 0.343994140625, 0.52783203125, 0.711669921875, 0.8955078125, 1.079345703125, 1.26318359375, 1.447021484375, 1.630859375, 1.814697265625, 1.99853515625, 2.182373046875, 2.3662109375, 2.550048828125, 2.73388671875, 2.917724609375, 3.1015625, 3.285400390625, 3.46923828125, 3.653076171875, 3.8369140625, 4.020751953125, 4.20458984375, 4.388427734375, 4.572265625, 4.756103515625, 4.93994140625, 5.123779296875, 5.3076171875, 5.491455078125, 5.67529296875, 5.859130859375, 6.04296875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 6.0, 14.0, 20.0, 30.0, 46.0, 74.0, 96.0, 165.0, 283.0, 407.0, 697.0, 1034.0, 1794.0, 2964.0, 5242.0, 9151.0, 16908.0, 31975.0, 61849.0, 124190.0, 270444.0, 266888.0, 122663.0, 61451.0, 31650.0, 16526.0, 9234.0, 5133.0, 2949.0, 1767.0, 1064.0, 686.0, 435.0, 254.0, 152.0, 105.0, 78.0, 44.0, 29.0, 14.0, 11.0, 6.0, 8.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.3125, -3.21783447265625, -3.1231689453125, -3.02850341796875, -2.933837890625, -2.83917236328125, -2.7445068359375, -2.64984130859375, -2.55517578125, -2.46051025390625, -2.3658447265625, -2.27117919921875, -2.176513671875, -2.08184814453125, -1.9871826171875, -1.89251708984375, -1.7978515625, -1.70318603515625, -1.6085205078125, -1.51385498046875, -1.419189453125, -1.32452392578125, -1.2298583984375, -1.13519287109375, -1.04052734375, -0.94586181640625, -0.8511962890625, -0.75653076171875, -0.661865234375, -0.56719970703125, -0.4725341796875, -0.37786865234375, -0.283203125, -0.18853759765625, -0.0938720703125, 0.00079345703125, 0.095458984375, 0.19012451171875, 0.2847900390625, 0.37945556640625, 0.47412109375, 0.56878662109375, 0.6634521484375, 0.75811767578125, 0.852783203125, 0.94744873046875, 1.0421142578125, 1.13677978515625, 1.2314453125, 1.32611083984375, 1.4207763671875, 1.51544189453125, 1.610107421875, 1.70477294921875, 1.7994384765625, 1.89410400390625, 1.98876953125, 2.08343505859375, 2.1781005859375, 2.27276611328125, 2.367431640625, 2.46209716796875, 2.5567626953125, 2.65142822265625, 2.74609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 6.0, 12.0, 18.0, 19.0, 16.0, 15.0, 19.0, 26.0, 31.0, 41.0, 39.0, 40.0, 45.0, 36.0, 30.0, 46.0, 45.0, 35.0, 43.0, 41.0, 43.0, 48.0, 33.0, 36.0, 32.0, 28.0, 37.0, 24.0, 20.0, 23.0, 16.0, 13.0, 15.0, 5.0, 5.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.341796875, -3.219635009765625, -3.09747314453125, -2.975311279296875, -2.8531494140625, -2.730987548828125, -2.60882568359375, -2.486663818359375, -2.364501953125, -2.242340087890625, -2.12017822265625, -1.998016357421875, -1.8758544921875, -1.753692626953125, -1.63153076171875, -1.509368896484375, -1.38720703125, -1.265045166015625, -1.14288330078125, -1.020721435546875, -0.8985595703125, -0.776397705078125, -0.65423583984375, -0.532073974609375, -0.409912109375, -0.287750244140625, -0.16558837890625, -0.043426513671875, 0.0787353515625, 0.200897216796875, 0.32305908203125, 0.445220947265625, 0.5673828125, 0.689544677734375, 0.81170654296875, 0.933868408203125, 1.0560302734375, 1.178192138671875, 1.30035400390625, 1.422515869140625, 1.544677734375, 1.666839599609375, 1.78900146484375, 1.911163330078125, 2.0333251953125, 2.155487060546875, 2.27764892578125, 2.399810791015625, 2.52197265625, 2.644134521484375, 2.76629638671875, 2.888458251953125, 3.0106201171875, 3.132781982421875, 3.25494384765625, 3.377105712890625, 3.499267578125, 3.621429443359375, 3.74359130859375, 3.865753173828125, 3.9879150390625, 4.110076904296875, 4.23223876953125, 4.354400634765625, 4.4765625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 11.0, 15.0, 28.0, 21.0, 35.0, 78.0, 106.0, 153.0, 216.0, 353.0, 518.0, 893.0, 1298.0, 2195.0, 3752.0, 6953.0, 13257.0, 28135.0, 67303.0, 206470.0, 458602.0, 154817.0, 54236.0, 23363.0, 11199.0, 5879.0, 3360.0, 1996.0, 1136.0, 739.0, 504.0, 294.0, 212.0, 141.0, 89.0, 61.0, 42.0, 21.0, 23.0, 15.0, 8.0, 10.0, 5.0, 6.0, 1.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.02783203125, -0.027045488357543945, -0.02625894546508789, -0.025472402572631836, -0.02468585968017578, -0.023899316787719727, -0.023112773895263672, -0.022326231002807617, -0.021539688110351562, -0.020753145217895508, -0.019966602325439453, -0.0191800594329834, -0.018393516540527344, -0.01760697364807129, -0.016820430755615234, -0.01603388786315918, -0.015247344970703125, -0.01446080207824707, -0.013674259185791016, -0.012887716293334961, -0.012101173400878906, -0.011314630508422852, -0.010528087615966797, -0.009741544723510742, -0.008955001831054688, -0.008168458938598633, -0.007381916046142578, -0.0065953731536865234, -0.005808830261230469, -0.005022287368774414, -0.004235744476318359, -0.0034492015838623047, -0.00266265869140625, -0.0018761157989501953, -0.0010895729064941406, -0.00030303001403808594, 0.00048351287841796875, 0.0012700557708740234, 0.002056598663330078, 0.002843141555786133, 0.0036296844482421875, 0.004416227340698242, 0.005202770233154297, 0.0059893131256103516, 0.006775856018066406, 0.007562398910522461, 0.008348941802978516, 0.00913548469543457, 0.009922027587890625, 0.01070857048034668, 0.011495113372802734, 0.012281656265258789, 0.013068199157714844, 0.013854742050170898, 0.014641284942626953, 0.015427827835083008, 0.016214370727539062, 0.017000913619995117, 0.017787456512451172, 0.018573999404907227, 0.01936054229736328, 0.020147085189819336, 0.02093362808227539, 0.021720170974731445, 0.0225067138671875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 4.0, 5.0, 7.0, 14.0, 9.0, 22.0, 25.0, 37.0, 46.0, 57.0, 93.0, 114.0, 128.0, 128.0, 74.0, 60.0, 40.0, 29.0, 24.0, 19.0, 15.0, 7.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.043081283569336e-05, -1.0075047612190247e-05, -9.719282388687134e-06, -9.363517165184021e-06, -9.007751941680908e-06, -8.651986718177795e-06, -8.296221494674683e-06, -7.94045627117157e-06, -7.584691047668457e-06, -7.228925824165344e-06, -6.8731606006622314e-06, -6.517395377159119e-06, -6.161630153656006e-06, -5.805864930152893e-06, -5.45009970664978e-06, -5.0943344831466675e-06, -4.738569259643555e-06, -4.382804036140442e-06, -4.027038812637329e-06, -3.6712735891342163e-06, -3.3155083656311035e-06, -2.9597431421279907e-06, -2.603977918624878e-06, -2.248212695121765e-06, -1.8924474716186523e-06, -1.5366822481155396e-06, -1.1809170246124268e-06, -8.25151801109314e-07, -4.6938657760620117e-07, -1.1362135410308838e-07, 2.421438694000244e-07, 5.979090929031372e-07, 9.5367431640625e-07, 1.3094395399093628e-06, 1.6652047634124756e-06, 2.0209699869155884e-06, 2.376735210418701e-06, 2.732500433921814e-06, 3.0882656574249268e-06, 3.4440308809280396e-06, 3.7997961044311523e-06, 4.155561327934265e-06, 4.511326551437378e-06, 4.867091774940491e-06, 5.2228569984436035e-06, 5.578622221946716e-06, 5.934387445449829e-06, 6.290152668952942e-06, 6.645917892456055e-06, 7.0016831159591675e-06, 7.35744833946228e-06, 7.713213562965393e-06, 8.068978786468506e-06, 8.424744009971619e-06, 8.780509233474731e-06, 9.136274456977844e-06, 9.492039680480957e-06, 9.84780490398407e-06, 1.0203570127487183e-05, 1.0559335350990295e-05, 1.0915100574493408e-05, 1.1270865797996521e-05, 1.1626631021499634e-05, 1.1982396245002747e-05, 1.233816146850586e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 14.0, 8.0, 26.0, 26.0, 49.0, 53.0, 87.0, 110.0, 173.0, 238.0, 325.0, 466.0, 728.0, 1103.0, 1859.0, 2851.0, 4804.0, 8393.0, 14587.0, 26992.0, 53489.0, 116198.0, 273842.0, 292897.0, 125706.0, 57484.0, 28592.0, 15262.0, 8635.0, 5059.0, 3053.0, 1869.0, 1173.0, 756.0, 506.0, 335.0, 237.0, 166.0, 120.0, 77.0, 59.0, 34.0, 34.0, 27.0, 12.0, 12.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0197906494140625, -0.019191741943359375, -0.01859283447265625, -0.017993927001953125, -0.01739501953125, -0.016796112060546875, -0.01619720458984375, -0.015598297119140625, -0.0149993896484375, -0.014400482177734375, -0.01380157470703125, -0.013202667236328125, -0.012603759765625, -0.012004852294921875, -0.01140594482421875, -0.010807037353515625, -0.0102081298828125, -0.009609222412109375, -0.00901031494140625, -0.008411407470703125, -0.0078125, -0.007213592529296875, -0.00661468505859375, -0.006015777587890625, -0.0054168701171875, -0.004817962646484375, -0.00421905517578125, -0.003620147705078125, -0.003021240234375, -0.002422332763671875, -0.00182342529296875, -0.001224517822265625, -0.0006256103515625, -2.6702880859375e-05, 0.00057220458984375, 0.001171112060546875, 0.00177001953125, 0.002368927001953125, 0.00296783447265625, 0.003566741943359375, 0.0041656494140625, 0.004764556884765625, 0.00536346435546875, 0.005962371826171875, 0.006561279296875, 0.007160186767578125, 0.00775909423828125, 0.008358001708984375, 0.0089569091796875, 0.009555816650390625, 0.01015472412109375, 0.010753631591796875, 0.0113525390625, 0.011951446533203125, 0.01255035400390625, 0.013149261474609375, 0.0137481689453125, 0.014347076416015625, 0.01494598388671875, 0.015544891357421875, 0.016143798828125, 0.016742706298828125, 0.01734161376953125, 0.017940521240234375, 0.0185394287109375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 8.0, 5.0, 11.0, 25.0, 22.0, 33.0, 45.0, 51.0, 43.0, 61.0, 71.0, 159.0, 84.0, 71.0, 62.0, 47.0, 44.0, 37.0, 33.0, 14.0, 15.0, 8.0, 9.0, 9.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00791168212890625, -0.007654786109924316, -0.007397890090942383, -0.007140994071960449, -0.006884098052978516, -0.006627202033996582, -0.0063703060150146484, -0.006113409996032715, -0.005856513977050781, -0.005599617958068848, -0.005342721939086914, -0.0050858259201049805, -0.004828929901123047, -0.004572033882141113, -0.00431513786315918, -0.004058241844177246, -0.0038013458251953125, -0.003544449806213379, -0.0032875537872314453, -0.0030306577682495117, -0.002773761749267578, -0.0025168657302856445, -0.002259969711303711, -0.0020030736923217773, -0.0017461776733398438, -0.0014892816543579102, -0.0012323856353759766, -0.000975489616394043, -0.0007185935974121094, -0.0004616975784301758, -0.0002048015594482422, 5.2094459533691406e-05, 0.000308990478515625, 0.0005658864974975586, 0.0008227825164794922, 0.0010796785354614258, 0.0013365745544433594, 0.001593470573425293, 0.0018503665924072266, 0.00210726261138916, 0.0023641586303710938, 0.0026210546493530273, 0.002877950668334961, 0.0031348466873168945, 0.003391742706298828, 0.0036486387252807617, 0.0039055347442626953, 0.004162430763244629, 0.0044193267822265625, 0.004676222801208496, 0.00493311882019043, 0.005190014839172363, 0.005446910858154297, 0.0057038068771362305, 0.005960702896118164, 0.006217598915100098, 0.006474494934082031, 0.006731390953063965, 0.0069882869720458984, 0.007245182991027832, 0.007502079010009766, 0.007758975028991699, 0.008015871047973633, 0.008272767066955566, 0.0085296630859375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 12.0, 13.0, 6.0, 14.0, 11.0, 20.0, 28.0, 32.0, 39.0, 51.0, 54.0, 66.0, 74.0, 83.0, 53.0, 83.0, 59.0, 45.0, 62.0, 36.0, 30.0, 18.0, 16.0, 18.0, 9.0, 10.0, 11.0, 7.0, 3.0, 8.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.1085710525512695, -4.913647174835205, -4.718723773956299, -4.523799896240234, -4.328876495361328, -4.133952617645264, -3.9390289783477783, -3.744105339050293, -3.5491816997528076, -3.3542580604553223, -3.159334421157837, -2.9644107818603516, -2.769486904144287, -2.574563503265381, -2.3796396255493164, -2.184715986251831, -1.9897923469543457, -1.7948687076568604, -1.599945068359375, -1.4050213098526, -1.2100976705551147, -1.0151740312576294, -0.8202502727508545, -0.6253266334533691, -0.4304029941558838, -0.23547932505607605, -0.04055565595626831, 0.15436804294586182, 0.34929168224334717, 0.5442153215408325, 0.7391390800476074, 0.9340627193450928, 1.1289863586425781, 1.3239099979400635, 1.5188336372375488, 1.7137573957443237, 1.908681035041809, 2.103604793548584, 2.2985284328460693, 2.4934520721435547, 2.68837571144104, 2.8832993507385254, 3.0782229900360107, 3.273146629333496, 3.4680705070495605, 3.662993907928467, 3.8579177856445312, 4.0528411865234375, 4.247765064239502, 4.442688941955566, 4.637612342834473, 4.832536220550537, 5.027459621429443, 5.222383499145508, 5.417306900024414, 5.6122307777404785, 5.807154655456543, 6.002078533172607, 6.197001934051514, 6.391925811767578, 6.586849212646484, 6.781773090362549, 6.976696968078613, 7.1716203689575195, 7.366543769836426]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 4.0, 9.0, 6.0, 9.0, 7.0, 11.0, 12.0, 13.0, 16.0, 16.0, 11.0, 23.0, 27.0, 27.0, 30.0, 35.0, 32.0, 41.0, 37.0, 39.0, 27.0, 31.0, 36.0, 36.0, 33.0, 36.0, 40.0, 36.0, 40.0, 36.0, 35.0, 24.0, 24.0, 25.0, 18.0, 18.0, 12.0, 17.0, 14.0, 12.0, 9.0, 11.0, 8.0, 9.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0820136070251465, -4.916803359985352, -4.751592636108398, -4.5863823890686035, -4.421172142028809, -4.255961894989014, -4.0907511711120605, -3.9255409240722656, -3.7603306770324707, -3.5951201915740967, -3.4299099445343018, -3.2646994590759277, -3.099489212036133, -2.934278726577759, -2.7690682411193848, -2.60385799407959, -2.438647508621216, -2.273437023162842, -2.108226776123047, -1.9430162906646729, -1.777806043624878, -1.612595558166504, -1.4473851919174194, -1.282174825668335, -1.1169644594192505, -0.951754093170166, -0.7865437269210815, -0.6213333010673523, -0.4561229348182678, -0.29091256856918335, -0.1257021427154541, 0.03950822353363037, 0.20471858978271484, 0.3699289560317993, 0.5351393222808838, 0.700349748134613, 0.8655601143836975, 1.0307705402374268, 1.1959809064865112, 1.3611912727355957, 1.5264016389846802, 1.6916120052337646, 1.8568223714828491, 2.0220327377319336, 2.1872432231903076, 2.3524534702301025, 2.5176639556884766, 2.6828742027282715, 2.8480846881866455, 3.0132951736450195, 3.1785054206848145, 3.3437159061431885, 3.5089261531829834, 3.6741366386413574, 3.8393468856811523, 4.0045576095581055, 4.1697678565979, 4.334978103637695, 4.500188827514648, 4.665399074554443, 4.830609321594238, 4.995819568634033, 5.161030292510986, 5.326240539550781, 5.491450786590576]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 5.0, 4.0, 6.0, 12.0, 23.0, 41.0, 72.0, 78.0, 129.0, 209.0, 252.0, 349.0, 578.0, 796.0, 1255.0, 1819.0, 2646.0, 3858.0, 5759.0, 8698.0, 13245.0, 19811.0, 30507.0, 46482.0, 70866.0, 104866.0, 142916.0, 160619.0, 137458.0, 99210.0, 67292.0, 43747.0, 28606.0, 18601.0, 12526.0, 8289.0, 5498.0, 3671.0, 2516.0, 1688.0, 1195.0, 800.0, 507.0, 365.0, 240.0, 163.0, 98.0, 68.0, 41.0, 25.0, 26.0, 10.0, 14.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.30859375, -6.10125732421875, -5.8939208984375, -5.68658447265625, -5.479248046875, -5.27191162109375, -5.0645751953125, -4.85723876953125, -4.64990234375, -4.44256591796875, -4.2352294921875, -4.02789306640625, -3.820556640625, -3.61322021484375, -3.4058837890625, -3.19854736328125, -2.9912109375, -2.78387451171875, -2.5765380859375, -2.36920166015625, -2.161865234375, -1.95452880859375, -1.7471923828125, -1.53985595703125, -1.33251953125, -1.12518310546875, -0.9178466796875, -0.71051025390625, -0.503173828125, -0.29583740234375, -0.0885009765625, 0.11883544921875, 0.326171875, 0.53350830078125, 0.7408447265625, 0.94818115234375, 1.155517578125, 1.36285400390625, 1.5701904296875, 1.77752685546875, 1.98486328125, 2.19219970703125, 2.3995361328125, 2.60687255859375, 2.814208984375, 3.02154541015625, 3.2288818359375, 3.43621826171875, 3.6435546875, 3.85089111328125, 4.0582275390625, 4.26556396484375, 4.472900390625, 4.68023681640625, 4.8875732421875, 5.09490966796875, 5.30224609375, 5.50958251953125, 5.7169189453125, 5.92425537109375, 6.131591796875, 6.33892822265625, 6.5462646484375, 6.75360107421875, 6.9609375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 2.0, 6.0, 8.0, 6.0, 7.0, 12.0, 15.0, 12.0, 16.0, 14.0, 21.0, 21.0, 23.0, 36.0, 33.0, 27.0, 30.0, 43.0, 34.0, 38.0, 35.0, 41.0, 34.0, 45.0, 25.0, 35.0, 34.0, 44.0, 34.0, 26.0, 35.0, 29.0, 25.0, 27.0, 19.0, 19.0, 19.0, 22.0, 7.0, 10.0, 8.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.5125732421875, -4.353271484375, -4.1939697265625, -4.03466796875, -3.8753662109375, -3.716064453125, -3.5567626953125, -3.3974609375, -3.2381591796875, -3.078857421875, -2.9195556640625, -2.76025390625, -2.6009521484375, -2.441650390625, -2.2823486328125, -2.123046875, -1.9637451171875, -1.804443359375, -1.6451416015625, -1.48583984375, -1.3265380859375, -1.167236328125, -1.0079345703125, -0.8486328125, -0.6893310546875, -0.530029296875, -0.3707275390625, -0.21142578125, -0.0521240234375, 0.107177734375, 0.2664794921875, 0.42578125, 0.5850830078125, 0.744384765625, 0.9036865234375, 1.06298828125, 1.2222900390625, 1.381591796875, 1.5408935546875, 1.7001953125, 1.8594970703125, 2.018798828125, 2.1781005859375, 2.33740234375, 2.4967041015625, 2.656005859375, 2.8153076171875, 2.974609375, 3.1339111328125, 3.293212890625, 3.4525146484375, 3.61181640625, 3.7711181640625, 3.930419921875, 4.0897216796875, 4.2490234375, 4.4083251953125, 4.567626953125, 4.7269287109375, 4.88623046875, 5.0455322265625, 5.204833984375, 5.3641357421875, 5.5234375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 9.0, 5.0, 8.0, 22.0, 16.0, 27.0, 43.0, 47.0, 71.0, 126.0, 162.0, 252.0, 356.0, 584.0, 800.0, 1272.0, 1993.0, 2749.0, 4365.0, 6614.0, 10407.0, 16347.0, 25203.0, 39243.0, 60590.0, 92087.0, 130319.0, 159635.0, 152009.0, 116589.0, 79899.0, 52344.0, 33111.0, 21359.0, 13709.0, 9091.0, 5873.0, 3794.0, 2497.0, 1617.0, 1117.0, 730.0, 444.0, 340.0, 220.0, 159.0, 93.0, 60.0, 52.0, 32.0, 14.0, 19.0, 16.0, 5.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-6.44140625, -6.232421875, -6.0234375, -5.814453125, -5.60546875, -5.396484375, -5.1875, -4.978515625, -4.76953125, -4.560546875, -4.3515625, -4.142578125, -3.93359375, -3.724609375, -3.515625, -3.306640625, -3.09765625, -2.888671875, -2.6796875, -2.470703125, -2.26171875, -2.052734375, -1.84375, -1.634765625, -1.42578125, -1.216796875, -1.0078125, -0.798828125, -0.58984375, -0.380859375, -0.171875, 0.037109375, 0.24609375, 0.455078125, 0.6640625, 0.873046875, 1.08203125, 1.291015625, 1.5, 1.708984375, 1.91796875, 2.126953125, 2.3359375, 2.544921875, 2.75390625, 2.962890625, 3.171875, 3.380859375, 3.58984375, 3.798828125, 4.0078125, 4.216796875, 4.42578125, 4.634765625, 4.84375, 5.052734375, 5.26171875, 5.470703125, 5.6796875, 5.888671875, 6.09765625, 6.306640625, 6.515625, 6.724609375, 6.93359375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 7.0, 16.0, 21.0, 17.0, 10.0, 22.0, 26.0, 24.0, 30.0, 36.0, 32.0, 30.0, 41.0, 31.0, 41.0, 36.0, 50.0, 43.0, 44.0, 40.0, 30.0, 46.0, 41.0, 26.0, 30.0, 34.0, 23.0, 20.0, 27.0, 19.0, 13.0, 19.0, 15.0, 8.0, 6.0, 8.0, 8.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.46484375, -3.3577880859375, -3.250732421875, -3.1436767578125, -3.03662109375, -2.9295654296875, -2.822509765625, -2.7154541015625, -2.6083984375, -2.5013427734375, -2.394287109375, -2.2872314453125, -2.18017578125, -2.0731201171875, -1.966064453125, -1.8590087890625, -1.751953125, -1.6448974609375, -1.537841796875, -1.4307861328125, -1.32373046875, -1.2166748046875, -1.109619140625, -1.0025634765625, -0.8955078125, -0.7884521484375, -0.681396484375, -0.5743408203125, -0.46728515625, -0.3602294921875, -0.253173828125, -0.1461181640625, -0.0390625, 0.0679931640625, 0.175048828125, 0.2821044921875, 0.38916015625, 0.4962158203125, 0.603271484375, 0.7103271484375, 0.8173828125, 0.9244384765625, 1.031494140625, 1.1385498046875, 1.24560546875, 1.3526611328125, 1.459716796875, 1.5667724609375, 1.673828125, 1.7808837890625, 1.887939453125, 1.9949951171875, 2.10205078125, 2.2091064453125, 2.316162109375, 2.4232177734375, 2.5302734375, 2.6373291015625, 2.744384765625, 2.8514404296875, 2.95849609375, 3.0655517578125, 3.172607421875, 3.2796630859375, 3.38671875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 4.0, 6.0, 7.0, 15.0, 14.0, 25.0, 39.0, 56.0, 92.0, 130.0, 211.0, 317.0, 464.0, 661.0, 1080.0, 1676.0, 2840.0, 5129.0, 9315.0, 18795.0, 43532.0, 125902.0, 523072.0, 204002.0, 59558.0, 24610.0, 11790.0, 6167.0, 3422.0, 2083.0, 1282.0, 767.0, 485.0, 279.0, 201.0, 151.0, 99.0, 79.0, 59.0, 37.0, 36.0, 13.0, 11.0, 6.0, 10.0, 8.0, 3.0, 0.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.3125, -4.18048095703125, -4.0484619140625, -3.91644287109375, -3.784423828125, -3.65240478515625, -3.5203857421875, -3.38836669921875, -3.25634765625, -3.12432861328125, -2.9923095703125, -2.86029052734375, -2.728271484375, -2.59625244140625, -2.4642333984375, -2.33221435546875, -2.2001953125, -2.06817626953125, -1.9361572265625, -1.80413818359375, -1.672119140625, -1.54010009765625, -1.4080810546875, -1.27606201171875, -1.14404296875, -1.01202392578125, -0.8800048828125, -0.74798583984375, -0.615966796875, -0.48394775390625, -0.3519287109375, -0.21990966796875, -0.087890625, 0.04412841796875, 0.1761474609375, 0.30816650390625, 0.440185546875, 0.57220458984375, 0.7042236328125, 0.83624267578125, 0.96826171875, 1.10028076171875, 1.2322998046875, 1.36431884765625, 1.496337890625, 1.62835693359375, 1.7603759765625, 1.89239501953125, 2.0244140625, 2.15643310546875, 2.2884521484375, 2.42047119140625, 2.552490234375, 2.68450927734375, 2.8165283203125, 2.94854736328125, 3.08056640625, 3.21258544921875, 3.3446044921875, 3.47662353515625, 3.608642578125, 3.74066162109375, 3.8726806640625, 4.00469970703125, 4.13671875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 4.0, 17.0, 11.0, 17.0, 20.0, 28.0, 56.0, 52.0, 56.0, 89.0, 122.0, 142.0, 93.0, 68.0, 52.0, 39.0, 24.0, 20.0, 12.0, 10.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00022363662719726562, -0.00021772831678390503, -0.00021182000637054443, -0.00020591169595718384, -0.00020000338554382324, -0.00019409507513046265, -0.00018818676471710205, -0.00018227845430374146, -0.00017637014389038086, -0.00017046183347702026, -0.00016455352306365967, -0.00015864521265029907, -0.00015273690223693848, -0.00014682859182357788, -0.00014092028141021729, -0.0001350119709968567, -0.0001291036605834961, -0.0001231953501701355, -0.0001172870397567749, -0.0001113787293434143, -0.00010547041893005371, -9.956210851669312e-05, -9.365379810333252e-05, -8.774548768997192e-05, -8.183717727661133e-05, -7.592886686325073e-05, -7.002055644989014e-05, -6.411224603652954e-05, -5.8203935623168945e-05, -5.229562520980835e-05, -4.6387314796447754e-05, -4.047900438308716e-05, -3.457069396972656e-05, -2.8662383556365967e-05, -2.275407314300537e-05, -1.6845762729644775e-05, -1.093745231628418e-05, -5.029141902923584e-06, 8.791685104370117e-07, 6.787478923797607e-06, 1.2695789337158203e-05, 1.86040997505188e-05, 2.4512410163879395e-05, 3.042072057723999e-05, 3.6329030990600586e-05, 4.223734140396118e-05, 4.814565181732178e-05, 5.405396223068237e-05, 5.996227264404297e-05, 6.587058305740356e-05, 7.177889347076416e-05, 7.768720388412476e-05, 8.359551429748535e-05, 8.950382471084595e-05, 9.541213512420654e-05, 0.00010132044553756714, 0.00010722875595092773, 0.00011313706636428833, 0.00011904537677764893, 0.00012495368719100952, 0.00013086199760437012, 0.0001367703080177307, 0.0001426786184310913, 0.0001485869288444519, 0.0001544952392578125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 9.0, 16.0, 24.0, 33.0, 58.0, 78.0, 75.0, 133.0, 144.0, 202.0, 271.0, 366.0, 453.0, 705.0, 932.0, 1194.0, 1757.0, 2614.0, 4356.0, 7404.0, 13560.0, 27130.0, 63125.0, 203184.0, 487651.0, 133806.0, 48239.0, 21724.0, 11154.0, 6260.0, 3742.0, 2339.0, 1606.0, 1119.0, 760.0, 576.0, 437.0, 354.0, 231.0, 196.0, 125.0, 123.0, 72.0, 56.0, 36.0, 32.0, 27.0, 16.0, 16.0, 12.0, 8.0, 6.0, 2.0, 1.0], "bins": [-3.95703125, -3.841827392578125, -3.72662353515625, -3.611419677734375, -3.4962158203125, -3.381011962890625, -3.26580810546875, -3.150604248046875, -3.035400390625, -2.920196533203125, -2.80499267578125, -2.689788818359375, -2.5745849609375, -2.459381103515625, -2.34417724609375, -2.228973388671875, -2.11376953125, -1.998565673828125, -1.88336181640625, -1.768157958984375, -1.6529541015625, -1.537750244140625, -1.42254638671875, -1.307342529296875, -1.192138671875, -1.076934814453125, -0.96173095703125, -0.846527099609375, -0.7313232421875, -0.616119384765625, -0.50091552734375, -0.385711669921875, -0.2705078125, -0.155303955078125, -0.04010009765625, 0.075103759765625, 0.1903076171875, 0.305511474609375, 0.42071533203125, 0.535919189453125, 0.651123046875, 0.766326904296875, 0.88153076171875, 0.996734619140625, 1.1119384765625, 1.227142333984375, 1.34234619140625, 1.457550048828125, 1.57275390625, 1.687957763671875, 1.80316162109375, 1.918365478515625, 2.0335693359375, 2.148773193359375, 2.26397705078125, 2.379180908203125, 2.494384765625, 2.609588623046875, 2.72479248046875, 2.839996337890625, 2.9552001953125, 3.070404052734375, 3.18560791015625, 3.300811767578125, 3.416015625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 8.0, 7.0, 8.0, 7.0, 8.0, 24.0, 26.0, 30.0, 43.0, 54.0, 91.0, 112.0, 135.0, 105.0, 77.0, 55.0, 45.0, 37.0, 29.0, 20.0, 23.0, 10.0, 8.0, 6.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.34765625, -1.3076019287109375, -1.267547607421875, -1.2274932861328125, -1.18743896484375, -1.1473846435546875, -1.107330322265625, -1.0672760009765625, -1.0272216796875, -0.9871673583984375, -0.947113037109375, -0.9070587158203125, -0.86700439453125, -0.8269500732421875, -0.786895751953125, -0.7468414306640625, -0.706787109375, -0.6667327880859375, -0.626678466796875, -0.5866241455078125, -0.54656982421875, -0.5065155029296875, -0.466461181640625, -0.4264068603515625, -0.3863525390625, -0.3462982177734375, -0.306243896484375, -0.2661895751953125, -0.22613525390625, -0.1860809326171875, -0.146026611328125, -0.1059722900390625, -0.06591796875, -0.0258636474609375, 0.014190673828125, 0.0542449951171875, 0.09429931640625, 0.1343536376953125, 0.174407958984375, 0.2144622802734375, 0.2545166015625, 0.2945709228515625, 0.334625244140625, 0.3746795654296875, 0.41473388671875, 0.4547882080078125, 0.494842529296875, 0.5348968505859375, 0.574951171875, 0.6150054931640625, 0.655059814453125, 0.6951141357421875, 0.73516845703125, 0.7752227783203125, 0.815277099609375, 0.8553314208984375, 0.8953857421875, 0.9354400634765625, 0.975494384765625, 1.0155487060546875, 1.05560302734375, 1.0956573486328125, 1.135711669921875, 1.1757659912109375, 1.2158203125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 3.0, 7.0, 3.0, 6.0, 11.0, 18.0, 15.0, 19.0, 37.0, 34.0, 43.0, 36.0, 59.0, 69.0, 76.0, 84.0, 63.0, 71.0, 67.0, 50.0, 35.0, 35.0, 27.0, 24.0, 20.0, 21.0, 9.0, 13.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.812544822692871, -5.61854887008667, -5.424552917480469, -5.230556964874268, -5.036561012268066, -4.842564582824707, -4.648569107055664, -4.454572677612305, -4.2605767250061035, -4.066580772399902, -3.872584819793701, -3.6785888671875, -3.4845926761627197, -3.2905967235565186, -3.0966007709503174, -2.902604579925537, -2.708608865737915, -2.514612913131714, -2.3206169605255127, -2.1266207695007324, -1.9326248168945312, -1.73862886428833, -1.544632911682129, -1.3506368398666382, -1.156640887260437, -0.9626448750495911, -0.7686488628387451, -0.574652910232544, -0.380656898021698, -0.18666088581085205, 0.007335066795349121, 0.20133113861083984, 0.395327091217041, 0.589323103427887, 0.7833191156387329, 0.9773150682449341, 1.1713111400604248, 1.365307092666626, 1.5593030452728271, 1.7532991170883179, 1.947295069694519, 2.1412911415100098, 2.335287094116211, 2.529283046722412, 2.7232789993286133, 2.9172749519348145, 3.1112709045410156, 3.305267095565796, 3.499263048171997, 3.6932590007781982, 3.8872549533843994, 4.08125114440918, 4.275247097015381, 4.469243049621582, 4.663239002227783, 4.857234954833984, 5.0512309074401855, 5.245226860046387, 5.439222812652588, 5.633218765258789, 5.82721471786499, 6.021210670471191, 6.215207099914551, 6.409203052520752, 6.603199005126953]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 2.0, 6.0, 6.0, 10.0, 13.0, 15.0, 14.0, 16.0, 23.0, 17.0, 15.0, 18.0, 20.0, 28.0, 27.0, 34.0, 38.0, 25.0, 28.0, 37.0, 36.0, 28.0, 34.0, 34.0, 39.0, 39.0, 31.0, 30.0, 30.0, 28.0, 21.0, 30.0, 14.0, 30.0, 26.0, 14.0, 24.0, 14.0, 22.0, 6.0, 9.0, 13.0, 6.0, 8.0, 10.0, 8.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-5.00058126449585, -4.847132682800293, -4.693684101104736, -4.540235996246338, -4.386787414550781, -4.233338832855225, -4.079890251159668, -3.9264419078826904, -3.772993564605713, -3.6195449829101562, -3.4660966396331787, -3.312648057937622, -3.1591997146606445, -3.005751132965088, -2.8523025512695312, -2.6988542079925537, -2.545405626296997, -2.3919570446014404, -2.238508701324463, -2.0850601196289062, -1.9316117763519287, -1.778163194656372, -1.624714732170105, -1.471266269683838, -1.3178178071975708, -1.1643693447113037, -1.0109208822250366, -0.8574723601341248, -0.7040238976478577, -0.5505754351615906, -0.3971269130706787, -0.24367845058441162, -0.09022998809814453, 0.06321848928928375, 0.21666696667671204, 0.3701154589653015, 0.5235639214515686, 0.6770123839378357, 0.8304609060287476, 0.9839093685150146, 1.1373578310012817, 1.2908062934875488, 1.444254755973816, 1.597703218460083, 1.7511518001556396, 1.9046001434326172, 2.058048725128174, 2.2114973068237305, 2.364945650100708, 2.5183942317962646, 2.671842575073242, 2.825291156768799, 2.9787395000457764, 3.132188081741333, 3.2856364250183105, 3.439085006713867, 3.592533588409424, 3.7459821701049805, 3.899430513381958, 4.0528788566589355, 4.206327438354492, 4.359776020050049, 4.5132246017456055, 4.666672706604004, 4.8201212882995605]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 13.0, 17.0, 12.0, 20.0, 26.0, 46.0, 68.0, 109.0, 172.0, 222.0, 298.0, 524.0, 779.0, 1214.0, 1860.0, 2798.0, 4644.0, 7483.0, 12177.0, 20099.0, 34319.0, 59845.0, 109311.0, 221683.0, 559553.0, 1245002.0, 1086993.0, 431963.0, 181253.0, 91005.0, 49902.0, 28415.0, 16688.0, 9902.0, 5907.0, 3581.0, 2247.0, 1481.0, 881.0, 632.0, 365.0, 265.0, 163.0, 108.0, 72.0, 60.0, 27.0, 34.0, 14.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0], "bins": [-7.65625, -7.42333984375, -7.1904296875, -6.95751953125, -6.724609375, -6.49169921875, -6.2587890625, -6.02587890625, -5.79296875, -5.56005859375, -5.3271484375, -5.09423828125, -4.861328125, -4.62841796875, -4.3955078125, -4.16259765625, -3.9296875, -3.69677734375, -3.4638671875, -3.23095703125, -2.998046875, -2.76513671875, -2.5322265625, -2.29931640625, -2.06640625, -1.83349609375, -1.6005859375, -1.36767578125, -1.134765625, -0.90185546875, -0.6689453125, -0.43603515625, -0.203125, 0.02978515625, 0.2626953125, 0.49560546875, 0.728515625, 0.96142578125, 1.1943359375, 1.42724609375, 1.66015625, 1.89306640625, 2.1259765625, 2.35888671875, 2.591796875, 2.82470703125, 3.0576171875, 3.29052734375, 3.5234375, 3.75634765625, 3.9892578125, 4.22216796875, 4.455078125, 4.68798828125, 4.9208984375, 5.15380859375, 5.38671875, 5.61962890625, 5.8525390625, 6.08544921875, 6.318359375, 6.55126953125, 6.7841796875, 7.01708984375, 7.25]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 0.0, 4.0, 5.0, 8.0, 7.0, 4.0, 14.0, 12.0, 20.0, 16.0, 26.0, 20.0, 16.0, 23.0, 24.0, 36.0, 36.0, 36.0, 35.0, 33.0, 42.0, 31.0, 33.0, 39.0, 37.0, 33.0, 57.0, 29.0, 32.0, 33.0, 22.0, 27.0, 20.0, 31.0, 21.0, 24.0, 19.0, 13.0, 15.0, 9.0, 12.0, 9.0, 6.0, 11.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.85546875, -4.7142333984375, -4.572998046875, -4.4317626953125, -4.29052734375, -4.1492919921875, -4.008056640625, -3.8668212890625, -3.7255859375, -3.5843505859375, -3.443115234375, -3.3018798828125, -3.16064453125, -3.0194091796875, -2.878173828125, -2.7369384765625, -2.595703125, -2.4544677734375, -2.313232421875, -2.1719970703125, -2.03076171875, -1.8895263671875, -1.748291015625, -1.6070556640625, -1.4658203125, -1.3245849609375, -1.183349609375, -1.0421142578125, -0.90087890625, -0.7596435546875, -0.618408203125, -0.4771728515625, -0.3359375, -0.1947021484375, -0.053466796875, 0.0877685546875, 0.22900390625, 0.3702392578125, 0.511474609375, 0.6527099609375, 0.7939453125, 0.9351806640625, 1.076416015625, 1.2176513671875, 1.35888671875, 1.5001220703125, 1.641357421875, 1.7825927734375, 1.923828125, 2.0650634765625, 2.206298828125, 2.3475341796875, 2.48876953125, 2.6300048828125, 2.771240234375, 2.9124755859375, 3.0537109375, 3.1949462890625, 3.336181640625, 3.4774169921875, 3.61865234375, 3.7598876953125, 3.901123046875, 4.0423583984375, 4.18359375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 14.0, 13.0, 22.0, 29.0, 46.0, 67.0, 95.0, 123.0, 226.0, 345.0, 485.0, 723.0, 1131.0, 1664.0, 2459.0, 3855.0, 5830.0, 9459.0, 14778.0, 23715.0, 38296.0, 64920.0, 111400.0, 198599.0, 359709.0, 652743.0, 985381.0, 749171.0, 419651.0, 229669.0, 128552.0, 74223.0, 43623.0, 26758.0, 16566.0, 10561.0, 6783.0, 4265.0, 2793.0, 1855.0, 1205.0, 855.0, 593.0, 329.0, 230.0, 147.0, 132.0, 65.0, 49.0, 38.0, 22.0, 15.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-5.796875, -5.61920166015625, -5.4415283203125, -5.26385498046875, -5.086181640625, -4.90850830078125, -4.7308349609375, -4.55316162109375, -4.37548828125, -4.19781494140625, -4.0201416015625, -3.84246826171875, -3.664794921875, -3.48712158203125, -3.3094482421875, -3.13177490234375, -2.9541015625, -2.77642822265625, -2.5987548828125, -2.42108154296875, -2.243408203125, -2.06573486328125, -1.8880615234375, -1.71038818359375, -1.53271484375, -1.35504150390625, -1.1773681640625, -0.99969482421875, -0.822021484375, -0.64434814453125, -0.4666748046875, -0.28900146484375, -0.111328125, 0.06634521484375, 0.2440185546875, 0.42169189453125, 0.599365234375, 0.77703857421875, 0.9547119140625, 1.13238525390625, 1.31005859375, 1.48773193359375, 1.6654052734375, 1.84307861328125, 2.020751953125, 2.19842529296875, 2.3760986328125, 2.55377197265625, 2.7314453125, 2.90911865234375, 3.0867919921875, 3.26446533203125, 3.442138671875, 3.61981201171875, 3.7974853515625, 3.97515869140625, 4.15283203125, 4.33050537109375, 4.5081787109375, 4.68585205078125, 4.863525390625, 5.04119873046875, 5.2188720703125, 5.39654541015625, 5.57421875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 8.0, 6.0, 10.0, 11.0, 23.0, 19.0, 20.0, 31.0, 47.0, 51.0, 54.0, 79.0, 94.0, 97.0, 139.0, 163.0, 189.0, 232.0, 230.0, 246.0, 298.0, 271.0, 246.0, 256.0, 183.0, 189.0, 134.0, 138.0, 126.0, 107.0, 76.0, 73.0, 50.0, 42.0, 29.0, 28.0, 15.0, 17.0, 12.0, 17.0, 6.0, 5.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5703125, -2.491912841796875, -2.41351318359375, -2.335113525390625, -2.2567138671875, -2.178314208984375, -2.09991455078125, -2.021514892578125, -1.943115234375, -1.864715576171875, -1.78631591796875, -1.707916259765625, -1.6295166015625, -1.551116943359375, -1.47271728515625, -1.394317626953125, -1.31591796875, -1.237518310546875, -1.15911865234375, -1.080718994140625, -1.0023193359375, -0.923919677734375, -0.84552001953125, -0.767120361328125, -0.688720703125, -0.610321044921875, -0.53192138671875, -0.453521728515625, -0.3751220703125, -0.296722412109375, -0.21832275390625, -0.139923095703125, -0.0615234375, 0.016876220703125, 0.09527587890625, 0.173675537109375, 0.2520751953125, 0.330474853515625, 0.40887451171875, 0.487274169921875, 0.565673828125, 0.644073486328125, 0.72247314453125, 0.800872802734375, 0.8792724609375, 0.957672119140625, 1.03607177734375, 1.114471435546875, 1.19287109375, 1.271270751953125, 1.34967041015625, 1.428070068359375, 1.5064697265625, 1.584869384765625, 1.66326904296875, 1.741668701171875, 1.820068359375, 1.898468017578125, 1.97686767578125, 2.055267333984375, 2.1336669921875, 2.212066650390625, 2.29046630859375, 2.368865966796875, 2.447265625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 3.0, 6.0, 15.0, 22.0, 10.0, 16.0, 28.0, 37.0, 30.0, 51.0, 56.0, 55.0, 72.0, 82.0, 82.0, 72.0, 58.0, 46.0, 43.0, 40.0, 36.0, 23.0, 21.0, 15.0, 13.0, 15.0, 6.0, 5.0, 5.0, 7.0, 2.0, 7.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4479193687438965, -5.260849475860596, -5.073780059814453, -4.886710166931152, -4.69964075088501, -4.512570858001709, -4.325501441955566, -4.138431549072266, -3.951362133026123, -3.7642924785614014, -3.5772228240966797, -3.390153169631958, -3.2030835151672363, -3.0160138607025146, -2.828944206237793, -2.641874313354492, -2.4548046588897705, -2.267735004425049, -2.080665349960327, -1.8935956954956055, -1.7065260410308838, -1.519456386566162, -1.3323866128921509, -1.1453169584274292, -0.9582473039627075, -0.7711776494979858, -0.5841079950332642, -0.3970382809638977, -0.20996862649917603, -0.022898972034454346, 0.1641707420349121, 0.3512403964996338, 0.5383100509643555, 0.7253797054290771, 0.9124493598937988, 1.0995190143585205, 1.2865886688232422, 1.4736583232879639, 1.660728096961975, 1.8477977514266968, 2.034867286682129, 2.2219369411468506, 2.4090065956115723, 2.596076250076294, 2.7831459045410156, 2.9702155590057373, 3.157285213470459, 3.3443551063537598, 3.5314247608184814, 3.718494415283203, 3.905564069747925, 4.0926337242126465, 4.279703617095947, 4.46677303314209, 4.653842926025391, 4.840912342071533, 5.027982234954834, 5.215052127838135, 5.402121543884277, 5.589191436767578, 5.776260852813721, 5.9633307456970215, 6.150400161743164, 6.337470054626465, 6.524539470672607]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 4.0, 14.0, 15.0, 13.0, 13.0, 14.0, 21.0, 15.0, 22.0, 21.0, 23.0, 26.0, 33.0, 25.0, 25.0, 35.0, 39.0, 39.0, 35.0, 29.0, 41.0, 34.0, 42.0, 37.0, 38.0, 28.0, 28.0, 29.0, 27.0, 28.0, 25.0, 30.0, 20.0, 17.0, 17.0, 19.0, 16.0, 8.0, 12.0, 4.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.651426792144775, -4.4979047775268555, -4.344382286071777, -4.190859794616699, -4.037337779998779, -3.8838155269622803, -3.7302932739257812, -3.5767710208892822, -3.423248767852783, -3.269726514816284, -3.116204261779785, -2.962682008743286, -2.809159755706787, -2.655637502670288, -2.502115249633789, -2.34859299659729, -2.195070743560791, -2.041548490524292, -1.888026237487793, -1.734503984451294, -1.580981731414795, -1.427459478378296, -1.2739372253417969, -1.1204149723052979, -0.9668927192687988, -0.8133704662322998, -0.6598482131958008, -0.5063259601593018, -0.35280370712280273, -0.1992814540863037, -0.04575920104980469, 0.10776305198669434, 0.26128482818603516, 0.4148070812225342, 0.5683293342590332, 0.7218515872955322, 0.8753738403320312, 1.0288960933685303, 1.1824183464050293, 1.3359405994415283, 1.4894628524780273, 1.6429851055145264, 1.7965073585510254, 1.9500296115875244, 2.1035518646240234, 2.2570741176605225, 2.4105963706970215, 2.5641186237335205, 2.7176408767700195, 2.8711631298065186, 3.0246853828430176, 3.1782076358795166, 3.3317298889160156, 3.4852521419525146, 3.6387743949890137, 3.7922966480255127, 3.9458189010620117, 4.09934139251709, 4.25286340713501, 4.40638542175293, 4.559907913208008, 4.713430404663086, 4.866952419281006, 5.020474433898926, 5.173996925354004]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 5.0, 7.0, 5.0, 11.0, 11.0, 14.0, 27.0, 37.0, 66.0, 106.0, 98.0, 172.0, 259.0, 378.0, 556.0, 787.0, 1191.0, 1675.0, 2449.0, 3708.0, 5149.0, 7497.0, 11211.0, 16460.0, 24445.0, 36554.0, 55452.0, 83289.0, 124162.0, 181562.0, 162687.0, 108369.0, 72555.0, 48305.0, 32074.0, 21438.0, 14602.0, 9705.0, 6616.0, 4709.0, 3163.0, 2222.0, 1550.0, 1024.0, 732.0, 488.0, 316.0, 239.0, 152.0, 91.0, 75.0, 44.0, 21.0, 24.0, 10.0, 7.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.75390625, -1.697021484375, -1.64013671875, -1.583251953125, -1.5263671875, -1.469482421875, -1.41259765625, -1.355712890625, -1.298828125, -1.241943359375, -1.18505859375, -1.128173828125, -1.0712890625, -1.014404296875, -0.95751953125, -0.900634765625, -0.84375, -0.786865234375, -0.72998046875, -0.673095703125, -0.6162109375, -0.559326171875, -0.50244140625, -0.445556640625, -0.388671875, -0.331787109375, -0.27490234375, -0.218017578125, -0.1611328125, -0.104248046875, -0.04736328125, 0.009521484375, 0.06640625, 0.123291015625, 0.18017578125, 0.237060546875, 0.2939453125, 0.350830078125, 0.40771484375, 0.464599609375, 0.521484375, 0.578369140625, 0.63525390625, 0.692138671875, 0.7490234375, 0.805908203125, 0.86279296875, 0.919677734375, 0.9765625, 1.033447265625, 1.09033203125, 1.147216796875, 1.2041015625, 1.260986328125, 1.31787109375, 1.374755859375, 1.431640625, 1.488525390625, 1.54541015625, 1.602294921875, 1.6591796875, 1.716064453125, 1.77294921875, 1.829833984375, 1.88671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 9.0, 5.0, 6.0, 14.0, 11.0, 16.0, 18.0, 16.0, 15.0, 21.0, 22.0, 20.0, 26.0, 23.0, 32.0, 29.0, 29.0, 36.0, 34.0, 40.0, 29.0, 42.0, 36.0, 40.0, 45.0, 32.0, 39.0, 32.0, 28.0, 34.0, 22.0, 31.0, 34.0, 26.0, 15.0, 17.0, 10.0, 15.0, 11.0, 5.0, 6.0, 8.0, 9.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.82421875, -4.663330078125, -4.50244140625, -4.341552734375, -4.1806640625, -4.019775390625, -3.85888671875, -3.697998046875, -3.537109375, -3.376220703125, -3.21533203125, -3.054443359375, -2.8935546875, -2.732666015625, -2.57177734375, -2.410888671875, -2.25, -2.089111328125, -1.92822265625, -1.767333984375, -1.6064453125, -1.445556640625, -1.28466796875, -1.123779296875, -0.962890625, -0.802001953125, -0.64111328125, -0.480224609375, -0.3193359375, -0.158447265625, 0.00244140625, 0.163330078125, 0.32421875, 0.485107421875, 0.64599609375, 0.806884765625, 0.9677734375, 1.128662109375, 1.28955078125, 1.450439453125, 1.611328125, 1.772216796875, 1.93310546875, 2.093994140625, 2.2548828125, 2.415771484375, 2.57666015625, 2.737548828125, 2.8984375, 3.059326171875, 3.22021484375, 3.381103515625, 3.5419921875, 3.702880859375, 3.86376953125, 4.024658203125, 4.185546875, 4.346435546875, 4.50732421875, 4.668212890625, 4.8291015625, 4.989990234375, 5.15087890625, 5.311767578125, 5.47265625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 9.0, 10.0, 18.0, 15.0, 31.0, 57.0, 64.0, 110.0, 181.0, 296.0, 461.0, 752.0, 1242.0, 2105.0, 3676.0, 6282.0, 11081.0, 20441.0, 38167.0, 73445.0, 146183.0, 304840.0, 217586.0, 104688.0, 53307.0, 28095.0, 15155.0, 8491.0, 4785.0, 2774.0, 1601.0, 1019.0, 639.0, 323.0, 236.0, 162.0, 71.0, 52.0, 39.0, 24.0, 17.0, 11.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.98828125, -2.897064208984375, -2.80584716796875, -2.714630126953125, -2.6234130859375, -2.532196044921875, -2.44097900390625, -2.349761962890625, -2.258544921875, -2.167327880859375, -2.07611083984375, -1.984893798828125, -1.8936767578125, -1.802459716796875, -1.71124267578125, -1.620025634765625, -1.52880859375, -1.437591552734375, -1.34637451171875, -1.255157470703125, -1.1639404296875, -1.072723388671875, -0.98150634765625, -0.890289306640625, -0.799072265625, -0.707855224609375, -0.61663818359375, -0.525421142578125, -0.4342041015625, -0.342987060546875, -0.25177001953125, -0.160552978515625, -0.0693359375, 0.021881103515625, 0.11309814453125, 0.204315185546875, 0.2955322265625, 0.386749267578125, 0.47796630859375, 0.569183349609375, 0.660400390625, 0.751617431640625, 0.84283447265625, 0.934051513671875, 1.0252685546875, 1.116485595703125, 1.20770263671875, 1.298919677734375, 1.39013671875, 1.481353759765625, 1.57257080078125, 1.663787841796875, 1.7550048828125, 1.846221923828125, 1.93743896484375, 2.028656005859375, 2.119873046875, 2.211090087890625, 2.30230712890625, 2.393524169921875, 2.4847412109375, 2.575958251953125, 2.66717529296875, 2.758392333984375, 2.849609375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 8.0, 6.0, 12.0, 7.0, 8.0, 17.0, 13.0, 16.0, 21.0, 25.0, 24.0, 27.0, 33.0, 19.0, 23.0, 27.0, 49.0, 31.0, 33.0, 50.0, 36.0, 28.0, 34.0, 39.0, 35.0, 37.0, 32.0, 31.0, 29.0, 30.0, 34.0, 27.0, 21.0, 25.0, 19.0, 13.0, 15.0, 10.0, 6.0, 13.0, 8.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 5.0, 1.0, 1.0, 3.0], "bins": [-3.34375, -3.24285888671875, -3.1419677734375, -3.04107666015625, -2.940185546875, -2.83929443359375, -2.7384033203125, -2.63751220703125, -2.53662109375, -2.43572998046875, -2.3348388671875, -2.23394775390625, -2.133056640625, -2.03216552734375, -1.9312744140625, -1.83038330078125, -1.7294921875, -1.62860107421875, -1.5277099609375, -1.42681884765625, -1.325927734375, -1.22503662109375, -1.1241455078125, -1.02325439453125, -0.92236328125, -0.82147216796875, -0.7205810546875, -0.61968994140625, -0.518798828125, -0.41790771484375, -0.3170166015625, -0.21612548828125, -0.115234375, -0.01434326171875, 0.0865478515625, 0.18743896484375, 0.288330078125, 0.38922119140625, 0.4901123046875, 0.59100341796875, 0.69189453125, 0.79278564453125, 0.8936767578125, 0.99456787109375, 1.095458984375, 1.19635009765625, 1.2972412109375, 1.39813232421875, 1.4990234375, 1.59991455078125, 1.7008056640625, 1.80169677734375, 1.902587890625, 2.00347900390625, 2.1043701171875, 2.20526123046875, 2.30615234375, 2.40704345703125, 2.5079345703125, 2.60882568359375, 2.709716796875, 2.81060791015625, 2.9114990234375, 3.01239013671875, 3.11328125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 7.0, 15.0, 12.0, 20.0, 33.0, 35.0, 61.0, 90.0, 141.0, 221.0, 327.0, 541.0, 817.0, 1359.0, 2264.0, 3994.0, 7046.0, 13599.0, 27421.0, 61059.0, 156486.0, 405506.0, 217176.0, 79583.0, 34075.0, 16490.0, 8708.0, 4599.0, 2610.0, 1568.0, 956.0, 583.0, 388.0, 233.0, 161.0, 106.0, 69.0, 51.0, 46.0, 27.0, 15.0, 11.0, 12.0, 8.0, 3.0, 5.0, 6.0, 3.0, 3.0, 2.0], "bins": [-0.0269012451171875, -0.026146650314331055, -0.02539205551147461, -0.024637460708618164, -0.02388286590576172, -0.023128271102905273, -0.022373676300048828, -0.021619081497192383, -0.020864486694335938, -0.020109891891479492, -0.019355297088623047, -0.0186007022857666, -0.017846107482910156, -0.01709151268005371, -0.016336917877197266, -0.01558232307434082, -0.014827728271484375, -0.01407313346862793, -0.013318538665771484, -0.012563943862915039, -0.011809349060058594, -0.011054754257202148, -0.010300159454345703, -0.009545564651489258, -0.008790969848632812, -0.008036375045776367, -0.007281780242919922, -0.0065271854400634766, -0.005772590637207031, -0.005017995834350586, -0.004263401031494141, -0.0035088062286376953, -0.00275421142578125, -0.0019996166229248047, -0.0012450218200683594, -0.0004904270172119141, 0.00026416778564453125, 0.0010187625885009766, 0.0017733573913574219, 0.002527952194213867, 0.0032825469970703125, 0.004037141799926758, 0.004791736602783203, 0.0055463314056396484, 0.006300926208496094, 0.007055521011352539, 0.007810115814208984, 0.00856471061706543, 0.009319305419921875, 0.01007390022277832, 0.010828495025634766, 0.011583089828491211, 0.012337684631347656, 0.013092279434204102, 0.013846874237060547, 0.014601469039916992, 0.015356063842773438, 0.016110658645629883, 0.016865253448486328, 0.017619848251342773, 0.01837444305419922, 0.019129037857055664, 0.01988363265991211, 0.020638227462768555, 0.021392822265625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 5.0, 7.0, 8.0, 9.0, 13.0, 12.0, 16.0, 17.0, 40.0, 39.0, 38.0, 51.0, 72.0, 56.0, 52.0, 53.0, 73.0, 49.0, 55.0, 48.0, 34.0, 35.0, 30.0, 34.0, 17.0, 25.0, 16.0, 15.0, 10.0, 8.0, 8.0, 5.0, 7.0, 3.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.900859832763672e-06, -5.706213414669037e-06, -5.511566996574402e-06, -5.316920578479767e-06, -5.122274160385132e-06, -4.927627742290497e-06, -4.732981324195862e-06, -4.538334906101227e-06, -4.343688488006592e-06, -4.149042069911957e-06, -3.954395651817322e-06, -3.7597492337226868e-06, -3.5651028156280518e-06, -3.3704563975334167e-06, -3.1758099794387817e-06, -2.9811635613441467e-06, -2.7865171432495117e-06, -2.5918707251548767e-06, -2.3972243070602417e-06, -2.2025778889656067e-06, -2.0079314708709717e-06, -1.8132850527763367e-06, -1.6186386346817017e-06, -1.4239922165870667e-06, -1.2293457984924316e-06, -1.0346993803977966e-06, -8.400529623031616e-07, -6.454065442085266e-07, -4.507601261138916e-07, -2.561137080192566e-07, -6.146728992462158e-08, 1.3317912817001343e-07, 3.2782554626464844e-07, 5.224719643592834e-07, 7.171183824539185e-07, 9.117648005485535e-07, 1.1064112186431885e-06, 1.3010576367378235e-06, 1.4957040548324585e-06, 1.6903504729270935e-06, 1.8849968910217285e-06, 2.0796433091163635e-06, 2.2742897272109985e-06, 2.4689361453056335e-06, 2.6635825634002686e-06, 2.8582289814949036e-06, 3.0528753995895386e-06, 3.2475218176841736e-06, 3.4421682357788086e-06, 3.6368146538734436e-06, 3.831461071968079e-06, 4.026107490062714e-06, 4.220753908157349e-06, 4.415400326251984e-06, 4.610046744346619e-06, 4.804693162441254e-06, 4.999339580535889e-06, 5.193985998630524e-06, 5.388632416725159e-06, 5.583278834819794e-06, 5.777925252914429e-06, 5.972571671009064e-06, 6.167218089103699e-06, 6.361864507198334e-06, 6.556510925292969e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 8.0, 9.0, 16.0, 26.0, 40.0, 62.0, 72.0, 116.0, 192.0, 316.0, 417.0, 647.0, 1007.0, 1610.0, 2499.0, 4045.0, 6725.0, 11429.0, 20354.0, 36690.0, 71295.0, 146799.0, 313056.0, 217523.0, 99314.0, 49777.0, 27252.0, 14965.0, 8478.0, 5105.0, 3200.0, 1938.0, 1172.0, 855.0, 521.0, 361.0, 229.0, 157.0, 85.0, 64.0, 43.0, 32.0, 22.0, 12.0, 6.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185546875, -0.01793074607849121, -0.017306804656982422, -0.016682863235473633, -0.016058921813964844, -0.015434980392456055, -0.014811038970947266, -0.014187097549438477, -0.013563156127929688, -0.012939214706420898, -0.01231527328491211, -0.01169133186340332, -0.011067390441894531, -0.010443449020385742, -0.009819507598876953, -0.009195566177368164, -0.008571624755859375, -0.007947683334350586, -0.007323741912841797, -0.006699800491333008, -0.006075859069824219, -0.00545191764831543, -0.004827976226806641, -0.0042040348052978516, -0.0035800933837890625, -0.0029561519622802734, -0.0023322105407714844, -0.0017082691192626953, -0.0010843276977539062, -0.0004603862762451172, 0.00016355514526367188, 0.0007874965667724609, 0.00141143798828125, 0.002035379409790039, 0.002659320831298828, 0.003283262252807617, 0.003907203674316406, 0.004531145095825195, 0.005155086517333984, 0.0057790279388427734, 0.0064029693603515625, 0.0070269107818603516, 0.007650852203369141, 0.00827479362487793, 0.008898735046386719, 0.009522676467895508, 0.010146617889404297, 0.010770559310913086, 0.011394500732421875, 0.012018442153930664, 0.012642383575439453, 0.013266324996948242, 0.013890266418457031, 0.01451420783996582, 0.01513814926147461, 0.0157620906829834, 0.016386032104492188, 0.017009973526000977, 0.017633914947509766, 0.018257856369018555, 0.018881797790527344, 0.019505739212036133, 0.020129680633544922, 0.02075362205505371, 0.0213775634765625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 1.0, 9.0, 11.0, 14.0, 12.0, 16.0, 16.0, 18.0, 25.0, 28.0, 38.0, 56.0, 75.0, 73.0, 92.0, 91.0, 72.0, 63.0, 49.0, 41.0, 39.0, 38.0, 27.0, 15.0, 13.0, 15.0, 7.0, 8.0, 9.0, 6.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006511688232421875, -0.0062871575355529785, -0.006062626838684082, -0.0058380961418151855, -0.005613565444946289, -0.005389034748077393, -0.005164504051208496, -0.0049399733543396, -0.004715442657470703, -0.004490911960601807, -0.00426638126373291, -0.004041850566864014, -0.003817319869995117, -0.0035927891731262207, -0.0033682584762573242, -0.0031437277793884277, -0.0029191970825195312, -0.0026946663856506348, -0.0024701356887817383, -0.002245604991912842, -0.0020210742950439453, -0.0017965435981750488, -0.0015720129013061523, -0.0013474822044372559, -0.0011229515075683594, -0.0008984208106994629, -0.0006738901138305664, -0.0004493594169616699, -0.00022482872009277344, -2.980232238769531e-07, 0.00022423267364501953, 0.000448763370513916, 0.0006732940673828125, 0.000897824764251709, 0.0011223554611206055, 0.001346886157989502, 0.0015714168548583984, 0.001795947551727295, 0.0020204782485961914, 0.002245008945465088, 0.0024695396423339844, 0.002694070339202881, 0.0029186010360717773, 0.003143131732940674, 0.0033676624298095703, 0.003592193126678467, 0.0038167238235473633, 0.00404125452041626, 0.004265785217285156, 0.004490315914154053, 0.004714846611022949, 0.004939377307891846, 0.005163908004760742, 0.005388438701629639, 0.005612969398498535, 0.005837500095367432, 0.006062030792236328, 0.006286561489105225, 0.006511092185974121, 0.006735622882843018, 0.006960153579711914, 0.0071846842765808105, 0.007409214973449707, 0.0076337456703186035, 0.0078582763671875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 5.0, 11.0, 17.0, 15.0, 15.0, 16.0, 29.0, 37.0, 43.0, 49.0, 53.0, 53.0, 73.0, 84.0, 66.0, 71.0, 52.0, 45.0, 44.0, 34.0, 34.0, 24.0, 21.0, 23.0, 16.0, 6.0, 10.0, 2.0, 7.0, 3.0, 7.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.347260475158691, -5.168665885925293, -4.9900712966918945, -4.811476707458496, -4.6328816413879395, -4.454287052154541, -4.275692462921143, -4.097097873687744, -3.9185032844543457, -3.7399086952209473, -3.5613138675689697, -3.3827192783355713, -3.204124689102173, -3.0255298614501953, -2.846935272216797, -2.6683406829833984, -2.489745855331421, -2.3111512660980225, -2.132556438446045, -1.9539618492126465, -1.775367259979248, -1.59677255153656, -1.418177843093872, -1.2395832538604736, -1.0609885454177856, -0.8823938965797424, -0.7037992477416992, -0.5252045392990112, -0.346609890460968, -0.1680152416229248, 0.010579466819763184, 0.18917405605316162, 0.3677687644958496, 0.5463634133338928, 0.724958062171936, 0.903552770614624, 1.0821473598480225, 1.2607420682907104, 1.4393367767333984, 1.6179313659667969, 1.7965260744094849, 1.9751207828521729, 2.1537153720855713, 2.332310199737549, 2.5109047889709473, 2.6894993782043457, 2.868093967437744, 3.0466885566711426, 3.22528338432312, 3.4038779735565186, 3.582472801208496, 3.7610673904418945, 3.939661979675293, 4.118256568908691, 4.29685115814209, 4.475445747375488, 4.654040813446045, 4.832635402679443, 5.011229991912842, 5.189825057983398, 5.368419647216797, 5.547014236450195, 5.725608825683594, 5.904203414916992, 6.082798004150391]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 4.0, 14.0, 15.0, 13.0, 13.0, 14.0, 21.0, 14.0, 22.0, 21.0, 24.0, 26.0, 32.0, 27.0, 23.0, 37.0, 38.0, 39.0, 33.0, 32.0, 39.0, 34.0, 43.0, 36.0, 40.0, 26.0, 29.0, 29.0, 27.0, 28.0, 24.0, 31.0, 21.0, 16.0, 17.0, 19.0, 16.0, 7.0, 13.0, 4.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.641153335571289, -4.488080024719238, -4.335007190704346, -4.181933879852295, -4.028860569000244, -3.8757874965667725, -3.722714424133301, -3.56964111328125, -3.4165680408477783, -3.2634949684143066, -3.110421657562256, -2.957348585128784, -2.8042755126953125, -2.6512022018432617, -2.49812912940979, -2.3450560569763184, -2.1919827461242676, -2.038909673690796, -1.8858363628387451, -1.7327632904052734, -1.5796900987625122, -1.426616907119751, -1.2735438346862793, -1.120470643043518, -0.9673974514007568, -0.8143242597579956, -0.6612511277198792, -0.5081779956817627, -0.35510480403900146, -0.20203161239624023, -0.04895848035812378, 0.10411465167999268, 0.2571878433227539, 0.41026100516319275, 0.5633341670036316, 0.716407299041748, 0.8694804906845093, 1.0225536823272705, 1.1756267547607422, 1.3286999464035034, 1.4817731380462646, 1.6348463296890259, 1.787919521331787, 1.9409925937652588, 2.0940656661987305, 2.2471389770507812, 2.400212049484253, 2.5532851219177246, 2.7063584327697754, 2.859431505203247, 3.012504816055298, 3.1655778884887695, 3.3186511993408203, 3.471724271774292, 3.6247973442077637, 3.7778706550598145, 3.930943727493286, 4.084016799926758, 4.237090110778809, 4.390163421630859, 4.543236255645752, 4.696309566497803, 4.8493828773498535, 5.002455711364746, 5.155529022216797]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 16.0, 26.0, 27.0, 43.0, 51.0, 92.0, 125.0, 184.0, 226.0, 370.0, 522.0, 837.0, 1141.0, 1599.0, 2476.0, 3428.0, 5190.0, 7866.0, 12025.0, 17793.0, 27130.0, 40932.0, 61290.0, 89320.0, 123421.0, 148803.0, 144199.0, 114233.0, 81530.0, 54863.0, 36495.0, 24230.0, 15985.0, 10382.0, 6885.0, 4695.0, 3113.0, 2187.0, 1502.0, 1049.0, 729.0, 509.0, 346.0, 223.0, 143.0, 94.0, 84.0, 53.0, 30.0, 26.0, 14.0, 9.0, 9.0, 8.0, 2.0, 0.0, 2.0, 2.0], "bins": [-5.87109375, -5.68682861328125, -5.5025634765625, -5.31829833984375, -5.134033203125, -4.94976806640625, -4.7655029296875, -4.58123779296875, -4.39697265625, -4.21270751953125, -4.0284423828125, -3.84417724609375, -3.659912109375, -3.47564697265625, -3.2913818359375, -3.10711669921875, -2.9228515625, -2.73858642578125, -2.5543212890625, -2.37005615234375, -2.185791015625, -2.00152587890625, -1.8172607421875, -1.63299560546875, -1.44873046875, -1.26446533203125, -1.0802001953125, -0.89593505859375, -0.711669921875, -0.52740478515625, -0.3431396484375, -0.15887451171875, 0.025390625, 0.20965576171875, 0.3939208984375, 0.57818603515625, 0.762451171875, 0.94671630859375, 1.1309814453125, 1.31524658203125, 1.49951171875, 1.68377685546875, 1.8680419921875, 2.05230712890625, 2.236572265625, 2.42083740234375, 2.6051025390625, 2.78936767578125, 2.9736328125, 3.15789794921875, 3.3421630859375, 3.52642822265625, 3.710693359375, 3.89495849609375, 4.0792236328125, 4.26348876953125, 4.44775390625, 4.63201904296875, 4.8162841796875, 5.00054931640625, 5.184814453125, 5.36907958984375, 5.5533447265625, 5.73760986328125, 5.921875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 10.0, 6.0, 10.0, 12.0, 9.0, 14.0, 15.0, 14.0, 23.0, 21.0, 31.0, 27.0, 26.0, 23.0, 36.0, 35.0, 35.0, 33.0, 34.0, 39.0, 36.0, 44.0, 38.0, 37.0, 42.0, 45.0, 29.0, 26.0, 21.0, 23.0, 32.0, 20.0, 22.0, 13.0, 20.0, 19.0, 17.0, 12.0, 8.0, 6.0, 7.0, 4.0, 5.0, 2.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6875, -4.5394287109375, -4.391357421875, -4.2432861328125, -4.09521484375, -3.9471435546875, -3.799072265625, -3.6510009765625, -3.5029296875, -3.3548583984375, -3.206787109375, -3.0587158203125, -2.91064453125, -2.7625732421875, -2.614501953125, -2.4664306640625, -2.318359375, -2.1702880859375, -2.022216796875, -1.8741455078125, -1.72607421875, -1.5780029296875, -1.429931640625, -1.2818603515625, -1.1337890625, -0.9857177734375, -0.837646484375, -0.6895751953125, -0.54150390625, -0.3934326171875, -0.245361328125, -0.0972900390625, 0.05078125, 0.1988525390625, 0.346923828125, 0.4949951171875, 0.64306640625, 0.7911376953125, 0.939208984375, 1.0872802734375, 1.2353515625, 1.3834228515625, 1.531494140625, 1.6795654296875, 1.82763671875, 1.9757080078125, 2.123779296875, 2.2718505859375, 2.419921875, 2.5679931640625, 2.716064453125, 2.8641357421875, 3.01220703125, 3.1602783203125, 3.308349609375, 3.4564208984375, 3.6044921875, 3.7525634765625, 3.900634765625, 4.0487060546875, 4.19677734375, 4.3448486328125, 4.492919921875, 4.6409912109375, 4.7890625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 19.0, 14.0, 32.0, 47.0, 49.0, 106.0, 120.0, 216.0, 389.0, 566.0, 1068.0, 1670.0, 2593.0, 4458.0, 7344.0, 12247.0, 20023.0, 34058.0, 57070.0, 95255.0, 148303.0, 190033.0, 172375.0, 118973.0, 72938.0, 43655.0, 25745.0, 15635.0, 9208.0, 5695.0, 3309.0, 1991.0, 1261.0, 761.0, 514.0, 304.0, 200.0, 106.0, 71.0, 44.0, 28.0, 20.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.84375, -6.6055908203125, -6.367431640625, -6.1292724609375, -5.89111328125, -5.6529541015625, -5.414794921875, -5.1766357421875, -4.9384765625, -4.7003173828125, -4.462158203125, -4.2239990234375, -3.98583984375, -3.7476806640625, -3.509521484375, -3.2713623046875, -3.033203125, -2.7950439453125, -2.556884765625, -2.3187255859375, -2.08056640625, -1.8424072265625, -1.604248046875, -1.3660888671875, -1.1279296875, -0.8897705078125, -0.651611328125, -0.4134521484375, -0.17529296875, 0.0628662109375, 0.301025390625, 0.5391845703125, 0.77734375, 1.0155029296875, 1.253662109375, 1.4918212890625, 1.72998046875, 1.9681396484375, 2.206298828125, 2.4444580078125, 2.6826171875, 2.9207763671875, 3.158935546875, 3.3970947265625, 3.63525390625, 3.8734130859375, 4.111572265625, 4.3497314453125, 4.587890625, 4.8260498046875, 5.064208984375, 5.3023681640625, 5.54052734375, 5.7786865234375, 6.016845703125, 6.2550048828125, 6.4931640625, 6.7313232421875, 6.969482421875, 7.2076416015625, 7.44580078125, 7.6839599609375, 7.922119140625, 8.1602783203125, 8.3984375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 6.0, 5.0, 21.0, 9.0, 10.0, 12.0, 18.0, 21.0, 16.0, 13.0, 34.0, 21.0, 27.0, 27.0, 22.0, 35.0, 47.0, 36.0, 28.0, 41.0, 47.0, 33.0, 28.0, 46.0, 41.0, 30.0, 37.0, 36.0, 28.0, 24.0, 35.0, 19.0, 25.0, 20.0, 17.0, 12.0, 13.0, 14.0, 12.0, 11.0, 7.0, 6.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.34375, -3.245330810546875, -3.14691162109375, -3.048492431640625, -2.9500732421875, -2.851654052734375, -2.75323486328125, -2.654815673828125, -2.556396484375, -2.457977294921875, -2.35955810546875, -2.261138916015625, -2.1627197265625, -2.064300537109375, -1.96588134765625, -1.867462158203125, -1.76904296875, -1.670623779296875, -1.57220458984375, -1.473785400390625, -1.3753662109375, -1.276947021484375, -1.17852783203125, -1.080108642578125, -0.981689453125, -0.883270263671875, -0.78485107421875, -0.686431884765625, -0.5880126953125, -0.489593505859375, -0.39117431640625, -0.292755126953125, -0.1943359375, -0.095916748046875, 0.00250244140625, 0.100921630859375, 0.1993408203125, 0.297760009765625, 0.39617919921875, 0.494598388671875, 0.593017578125, 0.691436767578125, 0.78985595703125, 0.888275146484375, 0.9866943359375, 1.085113525390625, 1.18353271484375, 1.281951904296875, 1.38037109375, 1.478790283203125, 1.57720947265625, 1.675628662109375, 1.7740478515625, 1.872467041015625, 1.97088623046875, 2.069305419921875, 2.167724609375, 2.266143798828125, 2.36456298828125, 2.462982177734375, 2.5614013671875, 2.659820556640625, 2.75823974609375, 2.856658935546875, 2.955078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 13.0, 21.0, 28.0, 29.0, 47.0, 56.0, 84.0, 118.0, 157.0, 207.0, 355.0, 538.0, 781.0, 1240.0, 2193.0, 3727.0, 7040.0, 14801.0, 37004.0, 125898.0, 554471.0, 208584.0, 51682.0, 19237.0, 8893.0, 4555.0, 2538.0, 1445.0, 901.0, 595.0, 382.0, 270.0, 179.0, 131.0, 110.0, 61.0, 42.0, 42.0, 24.0, 9.0, 18.0, 6.0, 7.0, 3.0, 8.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -4.00225830078125, -3.8717041015625, -3.74114990234375, -3.610595703125, -3.48004150390625, -3.3494873046875, -3.21893310546875, -3.08837890625, -2.95782470703125, -2.8272705078125, -2.69671630859375, -2.566162109375, -2.43560791015625, -2.3050537109375, -2.17449951171875, -2.0439453125, -1.91339111328125, -1.7828369140625, -1.65228271484375, -1.521728515625, -1.39117431640625, -1.2606201171875, -1.13006591796875, -0.99951171875, -0.86895751953125, -0.7384033203125, -0.60784912109375, -0.477294921875, -0.34674072265625, -0.2161865234375, -0.08563232421875, 0.044921875, 0.17547607421875, 0.3060302734375, 0.43658447265625, 0.567138671875, 0.69769287109375, 0.8282470703125, 0.95880126953125, 1.08935546875, 1.21990966796875, 1.3504638671875, 1.48101806640625, 1.611572265625, 1.74212646484375, 1.8726806640625, 2.00323486328125, 2.1337890625, 2.26434326171875, 2.3948974609375, 2.52545166015625, 2.656005859375, 2.78656005859375, 2.9171142578125, 3.04766845703125, 3.17822265625, 3.30877685546875, 3.4393310546875, 3.56988525390625, 3.700439453125, 3.83099365234375, 3.9615478515625, 4.09210205078125, 4.22265625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 1.0, 5.0, 6.0, 7.0, 13.0, 19.0, 32.0, 49.0, 62.0, 63.0, 96.0, 139.0, 125.0, 98.0, 85.0, 55.0, 46.0, 33.0, 13.0, 14.0, 13.0, 4.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00023424625396728516, -0.00022773630917072296, -0.00022122636437416077, -0.00021471641957759857, -0.00020820647478103638, -0.00020169652998447418, -0.000195186585187912, -0.0001886766403913498, -0.0001821666955947876, -0.0001756567507982254, -0.0001691468060016632, -0.000162636861205101, -0.00015612691640853882, -0.00014961697161197662, -0.00014310702681541443, -0.00013659708201885223, -0.00013008713722229004, -0.00012357719242572784, -0.00011706724762916565, -0.00011055730283260345, -0.00010404735803604126, -9.753741323947906e-05, -9.102746844291687e-05, -8.451752364635468e-05, -7.800757884979248e-05, -7.149763405323029e-05, -6.498768925666809e-05, -5.8477744460105896e-05, -5.19677996635437e-05, -4.5457854866981506e-05, -3.894791007041931e-05, -3.243796527385712e-05, -2.5928020477294922e-05, -1.9418075680732727e-05, -1.2908130884170532e-05, -6.398186087608337e-06, 1.1175870895385742e-07, 6.621703505516052e-06, 1.3131648302078247e-05, 1.9641593098640442e-05, 2.6151537895202637e-05, 3.266148269176483e-05, 3.9171427488327026e-05, 4.568137228488922e-05, 5.2191317081451416e-05, 5.870126187801361e-05, 6.52112066745758e-05, 7.1721151471138e-05, 7.82310962677002e-05, 8.474104106426239e-05, 9.125098586082458e-05, 9.776093065738678e-05, 0.00010427087545394897, 0.00011078082025051117, 0.00011729076504707336, 0.00012380070984363556, 0.00013031065464019775, 0.00013682059943675995, 0.00014333054423332214, 0.00014984048902988434, 0.00015635043382644653, 0.00016286037862300873, 0.00016937032341957092, 0.00017588026821613312, 0.0001823902130126953]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 11.0, 18.0, 12.0, 34.0, 29.0, 72.0, 93.0, 131.0, 224.0, 262.0, 402.0, 567.0, 812.0, 1161.0, 1759.0, 2635.0, 3998.0, 6711.0, 12056.0, 24931.0, 65534.0, 282996.0, 469846.0, 102534.0, 34052.0, 15419.0, 8086.0, 4776.0, 2906.0, 2007.0, 1379.0, 946.0, 636.0, 460.0, 336.0, 215.0, 171.0, 99.0, 76.0, 45.0, 38.0, 21.0, 14.0, 11.0, 12.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.6640625, -3.546539306640625, -3.42901611328125, -3.311492919921875, -3.1939697265625, -3.076446533203125, -2.95892333984375, -2.841400146484375, -2.723876953125, -2.606353759765625, -2.48883056640625, -2.371307373046875, -2.2537841796875, -2.136260986328125, -2.01873779296875, -1.901214599609375, -1.78369140625, -1.666168212890625, -1.54864501953125, -1.431121826171875, -1.3135986328125, -1.196075439453125, -1.07855224609375, -0.961029052734375, -0.843505859375, -0.725982666015625, -0.60845947265625, -0.490936279296875, -0.3734130859375, -0.255889892578125, -0.13836669921875, -0.020843505859375, 0.0966796875, 0.214202880859375, 0.33172607421875, 0.449249267578125, 0.5667724609375, 0.684295654296875, 0.80181884765625, 0.919342041015625, 1.036865234375, 1.154388427734375, 1.27191162109375, 1.389434814453125, 1.5069580078125, 1.624481201171875, 1.74200439453125, 1.859527587890625, 1.97705078125, 2.094573974609375, 2.21209716796875, 2.329620361328125, 2.4471435546875, 2.564666748046875, 2.68218994140625, 2.799713134765625, 2.917236328125, 3.034759521484375, 3.15228271484375, 3.269805908203125, 3.3873291015625, 3.504852294921875, 3.62237548828125, 3.739898681640625, 3.857421875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 9.0, 6.0, 7.0, 12.0, 24.0, 21.0, 25.0, 47.0, 67.0, 106.0, 112.0, 118.0, 112.0, 84.0, 56.0, 39.0, 25.0, 27.0, 17.0, 9.0, 16.0, 6.0, 3.0, 6.0, 5.0, 5.0, 5.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.988800048828125, -0.95123291015625, -0.913665771484375, -0.8760986328125, -0.838531494140625, -0.80096435546875, -0.763397216796875, -0.725830078125, -0.688262939453125, -0.65069580078125, -0.613128662109375, -0.5755615234375, -0.537994384765625, -0.50042724609375, -0.462860107421875, -0.42529296875, -0.387725830078125, -0.35015869140625, -0.312591552734375, -0.2750244140625, -0.237457275390625, -0.19989013671875, -0.162322998046875, -0.124755859375, -0.087188720703125, -0.04962158203125, -0.012054443359375, 0.0255126953125, 0.063079833984375, 0.10064697265625, 0.138214111328125, 0.17578125, 0.213348388671875, 0.25091552734375, 0.288482666015625, 0.3260498046875, 0.363616943359375, 0.40118408203125, 0.438751220703125, 0.476318359375, 0.513885498046875, 0.55145263671875, 0.589019775390625, 0.6265869140625, 0.664154052734375, 0.70172119140625, 0.739288330078125, 0.77685546875, 0.814422607421875, 0.85198974609375, 0.889556884765625, 0.9271240234375, 0.964691162109375, 1.00225830078125, 1.039825439453125, 1.077392578125, 1.114959716796875, 1.15252685546875, 1.190093994140625, 1.2276611328125, 1.265228271484375, 1.30279541015625, 1.340362548828125, 1.3779296875]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 9.0, 4.0, 8.0, 14.0, 21.0, 21.0, 29.0, 36.0, 40.0, 48.0, 55.0, 69.0, 72.0, 74.0, 70.0, 72.0, 62.0, 50.0, 49.0, 36.0, 28.0, 28.0, 21.0, 12.0, 9.0, 12.0, 6.0, 5.0, 9.0, 6.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.60665225982666, -5.420063018798828, -5.233473300933838, -5.046884059906006, -4.860294342041016, -4.673705101013184, -4.487115859985352, -4.300526142120361, -4.113936424255371, -3.92734694480896, -3.740757465362549, -3.554168224334717, -3.3675785064697266, -3.1809892654418945, -2.9943997859954834, -2.8078103065490723, -2.6212210655212402, -2.434631586074829, -2.248042106628418, -2.061452865600586, -1.8748632669448853, -1.6882737874984741, -1.5016844272613525, -1.3150949478149414, -1.1285054683685303, -0.9419159889221191, -0.7553265690803528, -0.5687371492385864, -0.3821476697921753, -0.19555819034576416, -0.008968830108642578, 0.17762064933776855, 0.3642096519470215, 0.5507991313934326, 0.737388551235199, 0.9239779710769653, 1.1105674505233765, 1.2971569299697876, 1.4837462902069092, 1.6703357696533203, 1.8569252490997314, 2.0435147285461426, 2.2301042079925537, 2.416693687438965, 2.603282928466797, 2.789872646331787, 2.976461887359619, 3.1630513668060303, 3.3496408462524414, 3.5362303256988525, 3.7228198051452637, 3.9094090461730957, 4.095998764038086, 4.282588005065918, 4.46917724609375, 4.65576696395874, 4.8423566818237305, 5.0289459228515625, 5.215535640716553, 5.402124881744385, 5.588714599609375, 5.775303840637207, 5.961893081665039, 6.148482799530029, 6.335072040557861]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 2.0, 7.0, 3.0, 6.0, 6.0, 8.0, 10.0, 13.0, 13.0, 27.0, 25.0, 14.0, 24.0, 23.0, 23.0, 20.0, 31.0, 32.0, 26.0, 38.0, 39.0, 28.0, 35.0, 38.0, 45.0, 36.0, 42.0, 30.0, 40.0, 23.0, 31.0, 34.0, 28.0, 35.0, 26.0, 18.0, 18.0, 19.0, 21.0, 12.0, 6.0, 6.0, 10.0, 6.0, 5.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.765174388885498, -4.6061248779296875, -4.447075366973877, -4.288025856018066, -4.128976821899414, -3.9699273109436035, -3.810877799987793, -3.6518282890319824, -3.492778778076172, -3.3337292671203613, -3.17467999458313, -3.0156304836273193, -2.856580972671509, -2.6975317001342773, -2.538482189178467, -2.3794326782226562, -2.220383405685425, -2.0613338947296143, -1.9022845029830933, -1.7432351112365723, -1.5841856002807617, -1.4251362085342407, -1.2660868167877197, -1.1070373058319092, -0.9479879140853882, -0.7889384627342224, -0.6298890113830566, -0.47083961963653564, -0.3117901682853699, -0.1527407169342041, 0.0063086748123168945, 0.16535818576812744, 0.32440757751464844, 0.4834570288658142, 0.64250648021698, 0.801555871963501, 0.9606053233146667, 1.1196547746658325, 1.2787041664123535, 1.437753677368164, 1.596803069114685, 1.755852460861206, 1.9149019718170166, 2.073951244354248, 2.2330007553100586, 2.392050266265869, 2.5510997772216797, 2.7101492881774902, 2.8691985607147217, 3.0282480716705322, 3.1872973442077637, 3.346346855163574, 3.5053963661193848, 3.6644458770751953, 3.8234951496124268, 3.9825446605682373, 4.141593933105469, 4.300643444061279, 4.45969295501709, 4.618741989135742, 4.777791500091553, 4.936841011047363, 5.095890522003174, 5.254940032958984, 5.413989543914795]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 14.0, 18.0, 30.0, 56.0, 100.0, 160.0, 261.0, 407.0, 691.0, 1232.0, 2122.0, 3821.0, 6706.0, 11856.0, 22119.0, 41616.0, 81871.0, 175807.0, 461583.0, 1309696.0, 1288706.0, 447701.0, 169417.0, 79550.0, 40486.0, 20861.0, 11703.0, 6513.0, 3824.0, 2108.0, 1244.0, 772.0, 448.0, 276.0, 174.0, 101.0, 83.0, 53.0, 31.0, 15.0, 7.0, 11.0, 10.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.4296875, -8.1661376953125, -7.902587890625, -7.6390380859375, -7.37548828125, -7.1119384765625, -6.848388671875, -6.5848388671875, -6.3212890625, -6.0577392578125, -5.794189453125, -5.5306396484375, -5.26708984375, -5.0035400390625, -4.739990234375, -4.4764404296875, -4.212890625, -3.9493408203125, -3.685791015625, -3.4222412109375, -3.15869140625, -2.8951416015625, -2.631591796875, -2.3680419921875, -2.1044921875, -1.8409423828125, -1.577392578125, -1.3138427734375, -1.05029296875, -0.7867431640625, -0.523193359375, -0.2596435546875, 0.00390625, 0.2674560546875, 0.531005859375, 0.7945556640625, 1.05810546875, 1.3216552734375, 1.585205078125, 1.8487548828125, 2.1123046875, 2.3758544921875, 2.639404296875, 2.9029541015625, 3.16650390625, 3.4300537109375, 3.693603515625, 3.9571533203125, 4.220703125, 4.4842529296875, 4.747802734375, 5.0113525390625, 5.27490234375, 5.5384521484375, 5.802001953125, 6.0655517578125, 6.3291015625, 6.5926513671875, 6.856201171875, 7.1197509765625, 7.38330078125, 7.6468505859375, 7.910400390625, 8.1739501953125, 8.4375]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 1.0, 3.0, 7.0, 5.0, 4.0, 3.0, 14.0, 6.0, 10.0, 20.0, 19.0, 23.0, 21.0, 18.0, 15.0, 20.0, 31.0, 38.0, 24.0, 29.0, 23.0, 33.0, 42.0, 36.0, 40.0, 37.0, 34.0, 48.0, 33.0, 30.0, 30.0, 32.0, 25.0, 26.0, 28.0, 27.0, 26.0, 16.0, 18.0, 22.0, 11.0, 18.0, 8.0, 9.0, 10.0, 7.0, 4.0, 1.0, 6.0, 0.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-4.296875, -4.16778564453125, -4.0386962890625, -3.90960693359375, -3.780517578125, -3.65142822265625, -3.5223388671875, -3.39324951171875, -3.26416015625, -3.13507080078125, -3.0059814453125, -2.87689208984375, -2.747802734375, -2.61871337890625, -2.4896240234375, -2.36053466796875, -2.2314453125, -2.10235595703125, -1.9732666015625, -1.84417724609375, -1.715087890625, -1.58599853515625, -1.4569091796875, -1.32781982421875, -1.19873046875, -1.06964111328125, -0.9405517578125, -0.81146240234375, -0.682373046875, -0.55328369140625, -0.4241943359375, -0.29510498046875, -0.166015625, -0.03692626953125, 0.0921630859375, 0.22125244140625, 0.350341796875, 0.47943115234375, 0.6085205078125, 0.73760986328125, 0.86669921875, 0.99578857421875, 1.1248779296875, 1.25396728515625, 1.383056640625, 1.51214599609375, 1.6412353515625, 1.77032470703125, 1.8994140625, 2.02850341796875, 2.1575927734375, 2.28668212890625, 2.415771484375, 2.54486083984375, 2.6739501953125, 2.80303955078125, 2.93212890625, 3.06121826171875, 3.1903076171875, 3.31939697265625, 3.448486328125, 3.57757568359375, 3.7066650390625, 3.83575439453125, 3.96484375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 20.0, 28.0, 47.0, 86.0, 130.0, 174.0, 303.0, 421.0, 681.0, 965.0, 1479.0, 2370.0, 3652.0, 5820.0, 9103.0, 14909.0, 24967.0, 42347.0, 74049.0, 135974.0, 254834.0, 494553.0, 911464.0, 995656.0, 567031.0, 294310.0, 154755.0, 84404.0, 47423.0, 27942.0, 16578.0, 10198.0, 6352.0, 3962.0, 2546.0, 1643.0, 1025.0, 739.0, 462.0, 315.0, 220.0, 122.0, 72.0, 57.0, 34.0, 20.0, 8.0, 15.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.921875, -5.7374267578125, -5.552978515625, -5.3685302734375, -5.18408203125, -4.9996337890625, -4.815185546875, -4.6307373046875, -4.4462890625, -4.2618408203125, -4.077392578125, -3.8929443359375, -3.70849609375, -3.5240478515625, -3.339599609375, -3.1551513671875, -2.970703125, -2.7862548828125, -2.601806640625, -2.4173583984375, -2.23291015625, -2.0484619140625, -1.864013671875, -1.6795654296875, -1.4951171875, -1.3106689453125, -1.126220703125, -0.9417724609375, -0.75732421875, -0.5728759765625, -0.388427734375, -0.2039794921875, -0.01953125, 0.1649169921875, 0.349365234375, 0.5338134765625, 0.71826171875, 0.9027099609375, 1.087158203125, 1.2716064453125, 1.4560546875, 1.6405029296875, 1.824951171875, 2.0093994140625, 2.19384765625, 2.3782958984375, 2.562744140625, 2.7471923828125, 2.931640625, 3.1160888671875, 3.300537109375, 3.4849853515625, 3.66943359375, 3.8538818359375, 4.038330078125, 4.2227783203125, 4.4072265625, 4.5916748046875, 4.776123046875, 4.9605712890625, 5.14501953125, 5.3294677734375, 5.513916015625, 5.6983642578125, 5.8828125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 8.0, 7.0, 7.0, 16.0, 15.0, 18.0, 26.0, 27.0, 53.0, 55.0, 70.0, 113.0, 102.0, 173.0, 197.0, 233.0, 288.0, 330.0, 367.0, 345.0, 275.0, 259.0, 206.0, 185.0, 160.0, 122.0, 94.0, 78.0, 55.0, 35.0, 44.0, 26.0, 14.0, 19.0, 19.0, 8.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.150390625, -3.062408447265625, -2.97442626953125, -2.886444091796875, -2.7984619140625, -2.710479736328125, -2.62249755859375, -2.534515380859375, -2.446533203125, -2.358551025390625, -2.27056884765625, -2.182586669921875, -2.0946044921875, -2.006622314453125, -1.91864013671875, -1.830657958984375, -1.74267578125, -1.654693603515625, -1.56671142578125, -1.478729248046875, -1.3907470703125, -1.302764892578125, -1.21478271484375, -1.126800537109375, -1.038818359375, -0.950836181640625, -0.86285400390625, -0.774871826171875, -0.6868896484375, -0.598907470703125, -0.51092529296875, -0.422943115234375, -0.3349609375, -0.246978759765625, -0.15899658203125, -0.071014404296875, 0.0169677734375, 0.104949951171875, 0.19293212890625, 0.280914306640625, 0.368896484375, 0.456878662109375, 0.54486083984375, 0.632843017578125, 0.7208251953125, 0.808807373046875, 0.89678955078125, 0.984771728515625, 1.07275390625, 1.160736083984375, 1.24871826171875, 1.336700439453125, 1.4246826171875, 1.512664794921875, 1.60064697265625, 1.688629150390625, 1.776611328125, 1.864593505859375, 1.95257568359375, 2.040557861328125, 2.1285400390625, 2.216522216796875, 2.30450439453125, 2.392486572265625, 2.48046875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 8.0, 8.0, 10.0, 13.0, 17.0, 14.0, 29.0, 43.0, 35.0, 37.0, 54.0, 53.0, 74.0, 67.0, 84.0, 64.0, 70.0, 58.0, 53.0, 32.0, 26.0, 25.0, 22.0, 14.0, 17.0, 12.0, 8.0, 8.0, 7.0, 8.0, 3.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.661281108856201, -5.491174221038818, -5.3210673332214355, -5.1509599685668945, -4.980853080749512, -4.810746192932129, -4.640639305114746, -4.470532417297363, -4.3004255294799805, -4.130318641662598, -3.9602115154266357, -3.790104627609253, -3.619997501373291, -3.449890613555908, -3.2797837257385254, -3.1096768379211426, -2.9395694732666016, -2.7694625854492188, -2.599355459213257, -2.429248571395874, -2.259141445159912, -2.0890345573425293, -1.9189276695251465, -1.7488206624984741, -1.5787136554718018, -1.4086066484451294, -1.238499641418457, -1.0683927536010742, -0.8982857465744019, -0.7281787395477295, -0.5580718517303467, -0.3879648447036743, -0.21785831451416016, -0.04775133728981018, 0.1223556399345398, 0.2924625873565674, 0.46256959438323975, 0.6326766014099121, 0.8027834892272949, 0.9728904962539673, 1.1429975032806396, 1.313104510307312, 1.4832115173339844, 1.6533184051513672, 1.8234254121780396, 1.993532419204712, 2.1636393070220947, 2.3337464332580566, 2.5038533210754395, 2.6739602088928223, 2.844067335128784, 3.014174222946167, 3.184281349182129, 3.3543882369995117, 3.5244951248168945, 3.6946020126342773, 3.8647091388702393, 4.034816265106201, 4.204923152923584, 4.375030040740967, 4.54513692855835, 4.715244293212891, 4.885351181030273, 5.055458068847656, 5.225564956665039]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 8.0, 12.0, 13.0, 13.0, 15.0, 11.0, 11.0, 26.0, 29.0, 25.0, 30.0, 19.0, 32.0, 41.0, 41.0, 33.0, 48.0, 39.0, 38.0, 46.0, 35.0, 31.0, 37.0, 31.0, 25.0, 35.0, 32.0, 25.0, 25.0, 29.0, 24.0, 19.0, 23.0, 15.0, 7.0, 6.0, 12.0, 6.0, 12.0, 1.0, 7.0, 0.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.86994743347168, -4.716521739959717, -4.563095569610596, -4.409669876098633, -4.25624418258667, -4.102818489074707, -3.949392318725586, -3.795966625213623, -3.642540693283081, -3.489114761352539, -3.335689067840576, -3.182263135910034, -3.028837203979492, -2.8754115104675293, -2.7219855785369873, -2.5685596466064453, -2.4151339530944824, -2.2617080211639404, -2.1082823276519775, -1.9548563957214355, -1.801430583000183, -1.6480047702789307, -1.4945788383483887, -1.3411530256271362, -1.1877272129058838, -1.0343014001846313, -0.8808755278587341, -0.7274496555328369, -0.5740238428115845, -0.42059803009033203, -0.2671721577644348, -0.1137462854385376, 0.03967905044555664, 0.19310489296913147, 0.3465307354927063, 0.49995657801628113, 0.653382420539856, 0.8068082332611084, 0.9602341055870056, 1.1136599779129028, 1.2670857906341553, 1.4205116033554077, 1.5739374160766602, 1.7273633480072021, 1.8807891607284546, 2.034214973449707, 2.187640905380249, 2.341066837310791, 2.494492530822754, 2.647918462753296, 2.801344156265259, 2.954770088195801, 3.1081957817077637, 3.2616217136383057, 3.4150476455688477, 3.5684733390808105, 3.7218992710113525, 3.8753252029418945, 4.028750896453857, 4.18217658996582, 4.335602760314941, 4.489028453826904, 4.642454147338867, 4.795880317687988, 4.949306011199951]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 12.0, 16.0, 27.0, 29.0, 68.0, 71.0, 108.0, 156.0, 231.0, 350.0, 510.0, 749.0, 1173.0, 1773.0, 2753.0, 4230.0, 6368.0, 9847.0, 14837.0, 23160.0, 35201.0, 54556.0, 84087.0, 131975.0, 204764.0, 169055.0, 105974.0, 68768.0, 44600.0, 28934.0, 18538.0, 12477.0, 7805.0, 5250.0, 3404.0, 2219.0, 1464.0, 1024.0, 678.0, 389.0, 277.0, 198.0, 139.0, 106.0, 54.0, 51.0, 26.0, 23.0, 15.0, 7.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.7978515625, -1.739410400390625, -1.68096923828125, -1.622528076171875, -1.5640869140625, -1.505645751953125, -1.44720458984375, -1.388763427734375, -1.330322265625, -1.271881103515625, -1.21343994140625, -1.154998779296875, -1.0965576171875, -1.038116455078125, -0.97967529296875, -0.921234130859375, -0.86279296875, -0.804351806640625, -0.74591064453125, -0.687469482421875, -0.6290283203125, -0.570587158203125, -0.51214599609375, -0.453704833984375, -0.395263671875, -0.336822509765625, -0.27838134765625, -0.219940185546875, -0.1614990234375, -0.103057861328125, -0.04461669921875, 0.013824462890625, 0.072265625, 0.130706787109375, 0.18914794921875, 0.247589111328125, 0.3060302734375, 0.364471435546875, 0.42291259765625, 0.481353759765625, 0.539794921875, 0.598236083984375, 0.65667724609375, 0.715118408203125, 0.7735595703125, 0.832000732421875, 0.89044189453125, 0.948883056640625, 1.00732421875, 1.065765380859375, 1.12420654296875, 1.182647705078125, 1.2410888671875, 1.299530029296875, 1.35797119140625, 1.416412353515625, 1.474853515625, 1.533294677734375, 1.59173583984375, 1.650177001953125, 1.7086181640625, 1.767059326171875, 1.82550048828125, 1.883941650390625, 1.9423828125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 8.0, 8.0, 5.0, 14.0, 7.0, 12.0, 16.0, 16.0, 21.0, 21.0, 19.0, 30.0, 23.0, 30.0, 38.0, 40.0, 54.0, 38.0, 40.0, 39.0, 47.0, 47.0, 33.0, 27.0, 37.0, 28.0, 37.0, 34.0, 35.0, 31.0, 23.0, 25.0, 22.0, 16.0, 14.0, 10.0, 10.0, 12.0, 4.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.02734375, -4.8626708984375, -4.697998046875, -4.5333251953125, -4.36865234375, -4.2039794921875, -4.039306640625, -3.8746337890625, -3.7099609375, -3.5452880859375, -3.380615234375, -3.2159423828125, -3.05126953125, -2.8865966796875, -2.721923828125, -2.5572509765625, -2.392578125, -2.2279052734375, -2.063232421875, -1.8985595703125, -1.73388671875, -1.5692138671875, -1.404541015625, -1.2398681640625, -1.0751953125, -0.9105224609375, -0.745849609375, -0.5811767578125, -0.41650390625, -0.2518310546875, -0.087158203125, 0.0775146484375, 0.2421875, 0.4068603515625, 0.571533203125, 0.7362060546875, 0.90087890625, 1.0655517578125, 1.230224609375, 1.3948974609375, 1.5595703125, 1.7242431640625, 1.888916015625, 2.0535888671875, 2.21826171875, 2.3829345703125, 2.547607421875, 2.7122802734375, 2.876953125, 3.0416259765625, 3.206298828125, 3.3709716796875, 3.53564453125, 3.7003173828125, 3.864990234375, 4.0296630859375, 4.1943359375, 4.3590087890625, 4.523681640625, 4.6883544921875, 4.85302734375, 5.0177001953125, 5.182373046875, 5.3470458984375, 5.51171875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 12.0, 12.0, 20.0, 20.0, 51.0, 74.0, 120.0, 177.0, 258.0, 407.0, 747.0, 1252.0, 2140.0, 3865.0, 6793.0, 12748.0, 24357.0, 47604.0, 96073.0, 205627.0, 326246.0, 160892.0, 76711.0, 38459.0, 19851.0, 10463.0, 5735.0, 3236.0, 1833.0, 1060.0, 669.0, 380.0, 230.0, 132.0, 99.0, 57.0, 50.0, 37.0, 20.0, 12.0, 8.0, 3.0, 1.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.79296875, -2.700927734375, -2.60888671875, -2.516845703125, -2.4248046875, -2.332763671875, -2.24072265625, -2.148681640625, -2.056640625, -1.964599609375, -1.87255859375, -1.780517578125, -1.6884765625, -1.596435546875, -1.50439453125, -1.412353515625, -1.3203125, -1.228271484375, -1.13623046875, -1.044189453125, -0.9521484375, -0.860107421875, -0.76806640625, -0.676025390625, -0.583984375, -0.491943359375, -0.39990234375, -0.307861328125, -0.2158203125, -0.123779296875, -0.03173828125, 0.060302734375, 0.15234375, 0.244384765625, 0.33642578125, 0.428466796875, 0.5205078125, 0.612548828125, 0.70458984375, 0.796630859375, 0.888671875, 0.980712890625, 1.07275390625, 1.164794921875, 1.2568359375, 1.348876953125, 1.44091796875, 1.532958984375, 1.625, 1.717041015625, 1.80908203125, 1.901123046875, 1.9931640625, 2.085205078125, 2.17724609375, 2.269287109375, 2.361328125, 2.453369140625, 2.54541015625, 2.637451171875, 2.7294921875, 2.821533203125, 2.91357421875, 3.005615234375, 3.09765625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 6.0, 15.0, 15.0, 19.0, 15.0, 14.0, 21.0, 27.0, 35.0, 36.0, 35.0, 28.0, 54.0, 52.0, 42.0, 46.0, 40.0, 47.0, 46.0, 51.0, 48.0, 48.0, 41.0, 39.0, 28.0, 30.0, 25.0, 13.0, 19.0, 11.0, 14.0, 9.0, 13.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.198638916015625, -4.07305908203125, -3.947479248046875, -3.8218994140625, -3.696319580078125, -3.57073974609375, -3.445159912109375, -3.319580078125, -3.194000244140625, -3.06842041015625, -2.942840576171875, -2.8172607421875, -2.691680908203125, -2.56610107421875, -2.440521240234375, -2.31494140625, -2.189361572265625, -2.06378173828125, -1.938201904296875, -1.8126220703125, -1.687042236328125, -1.56146240234375, -1.435882568359375, -1.310302734375, -1.184722900390625, -1.05914306640625, -0.933563232421875, -0.8079833984375, -0.682403564453125, -0.55682373046875, -0.431243896484375, -0.3056640625, -0.180084228515625, -0.05450439453125, 0.071075439453125, 0.1966552734375, 0.322235107421875, 0.44781494140625, 0.573394775390625, 0.698974609375, 0.824554443359375, 0.95013427734375, 1.075714111328125, 1.2012939453125, 1.326873779296875, 1.45245361328125, 1.578033447265625, 1.70361328125, 1.829193115234375, 1.95477294921875, 2.080352783203125, 2.2059326171875, 2.331512451171875, 2.45709228515625, 2.582672119140625, 2.708251953125, 2.833831787109375, 2.95941162109375, 3.084991455078125, 3.2105712890625, 3.336151123046875, 3.46173095703125, 3.587310791015625, 3.712890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 9.0, 12.0, 25.0, 23.0, 35.0, 45.0, 85.0, 117.0, 218.0, 318.0, 525.0, 857.0, 1507.0, 2722.0, 5173.0, 10315.0, 22403.0, 56601.0, 183532.0, 498829.0, 169280.0, 53278.0, 21490.0, 9843.0, 4926.0, 2625.0, 1472.0, 895.0, 513.0, 300.0, 167.0, 128.0, 88.0, 55.0, 40.0, 25.0, 17.0, 14.0, 12.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0], "bins": [-0.03564453125, -0.034693241119384766, -0.03374195098876953, -0.0327906608581543, -0.03183937072753906, -0.030888080596923828, -0.029936790466308594, -0.02898550033569336, -0.028034210205078125, -0.02708292007446289, -0.026131629943847656, -0.025180339813232422, -0.024229049682617188, -0.023277759552001953, -0.02232646942138672, -0.021375179290771484, -0.02042388916015625, -0.019472599029541016, -0.01852130889892578, -0.017570018768310547, -0.016618728637695312, -0.015667438507080078, -0.014716148376464844, -0.01376485824584961, -0.012813568115234375, -0.01186227798461914, -0.010910987854003906, -0.009959697723388672, -0.009008407592773438, -0.008057117462158203, -0.007105827331542969, -0.006154537200927734, -0.0052032470703125, -0.004251956939697266, -0.0033006668090820312, -0.002349376678466797, -0.0013980865478515625, -0.0004467964172363281, 0.0005044937133789062, 0.0014557838439941406, 0.002407073974609375, 0.0033583641052246094, 0.004309654235839844, 0.005260944366455078, 0.0062122344970703125, 0.007163524627685547, 0.008114814758300781, 0.009066104888916016, 0.01001739501953125, 0.010968685150146484, 0.011919975280761719, 0.012871265411376953, 0.013822555541992188, 0.014773845672607422, 0.015725135803222656, 0.01667642593383789, 0.017627716064453125, 0.01857900619506836, 0.019530296325683594, 0.020481586456298828, 0.021432876586914062, 0.022384166717529297, 0.02333545684814453, 0.024286746978759766, 0.025238037109375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 2.0, 10.0, 13.0, 14.0, 14.0, 21.0, 34.0, 41.0, 34.0, 64.0, 78.0, 69.0, 73.0, 92.0, 85.0, 68.0, 64.0, 30.0, 37.0, 37.0, 23.0, 16.0, 19.0, 9.0, 9.0, 5.0, 7.0, 7.0, 4.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.702278137207031e-06, -8.412636816501617e-06, -8.122995495796204e-06, -7.83335417509079e-06, -7.543712854385376e-06, -7.254071533679962e-06, -6.964430212974548e-06, -6.6747888922691345e-06, -6.385147571563721e-06, -6.095506250858307e-06, -5.805864930152893e-06, -5.516223609447479e-06, -5.2265822887420654e-06, -4.936940968036652e-06, -4.647299647331238e-06, -4.357658326625824e-06, -4.06801700592041e-06, -3.7783756852149963e-06, -3.4887343645095825e-06, -3.1990930438041687e-06, -2.909451723098755e-06, -2.619810402393341e-06, -2.3301690816879272e-06, -2.0405277609825134e-06, -1.7508864402770996e-06, -1.4612451195716858e-06, -1.171603798866272e-06, -8.819624781608582e-07, -5.923211574554443e-07, -3.026798367500305e-07, -1.30385160446167e-08, 2.766028046607971e-07, 5.662441253662109e-07, 8.558854460716248e-07, 1.1455267667770386e-06, 1.4351680874824524e-06, 1.7248094081878662e-06, 2.01445072889328e-06, 2.304092049598694e-06, 2.5937333703041077e-06, 2.8833746910095215e-06, 3.1730160117149353e-06, 3.462657332420349e-06, 3.752298653125763e-06, 4.041939973831177e-06, 4.3315812945365906e-06, 4.621222615242004e-06, 4.910863935947418e-06, 5.200505256652832e-06, 5.490146577358246e-06, 5.77978789806366e-06, 6.0694292187690735e-06, 6.359070539474487e-06, 6.648711860179901e-06, 6.938353180885315e-06, 7.227994501590729e-06, 7.517635822296143e-06, 7.807277143001556e-06, 8.09691846370697e-06, 8.386559784412384e-06, 8.676201105117798e-06, 8.965842425823212e-06, 9.255483746528625e-06, 9.54512506723404e-06, 9.834766387939453e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 3.0, 9.0, 7.0, 25.0, 18.0, 34.0, 54.0, 87.0, 95.0, 173.0, 233.0, 294.0, 407.0, 642.0, 820.0, 1152.0, 1682.0, 2436.0, 3502.0, 5317.0, 8301.0, 13111.0, 22704.0, 39774.0, 74404.0, 148230.0, 284067.0, 210140.0, 100768.0, 53144.0, 29282.0, 17157.0, 10320.0, 6414.0, 4206.0, 2828.0, 1907.0, 1452.0, 1011.0, 634.0, 492.0, 387.0, 236.0, 161.0, 145.0, 88.0, 56.0, 62.0, 34.0, 26.0, 19.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.015350341796875, -0.014850854873657227, -0.014351367950439453, -0.01385188102722168, -0.013352394104003906, -0.012852907180786133, -0.01235342025756836, -0.011853933334350586, -0.011354446411132812, -0.010854959487915039, -0.010355472564697266, -0.009855985641479492, -0.009356498718261719, -0.008857011795043945, -0.008357524871826172, -0.007858037948608398, -0.007358551025390625, -0.0068590641021728516, -0.006359577178955078, -0.005860090255737305, -0.005360603332519531, -0.004861116409301758, -0.004361629486083984, -0.003862142562866211, -0.0033626556396484375, -0.002863168716430664, -0.0023636817932128906, -0.0018641948699951172, -0.0013647079467773438, -0.0008652210235595703, -0.0003657341003417969, 0.00013375282287597656, 0.00063323974609375, 0.0011327266693115234, 0.0016322135925292969, 0.0021317005157470703, 0.0026311874389648438, 0.003130674362182617, 0.0036301612854003906, 0.004129648208618164, 0.0046291351318359375, 0.005128622055053711, 0.005628108978271484, 0.006127595901489258, 0.006627082824707031, 0.007126569747924805, 0.007626056671142578, 0.008125543594360352, 0.008625030517578125, 0.009124517440795898, 0.009624004364013672, 0.010123491287231445, 0.010622978210449219, 0.011122465133666992, 0.011621952056884766, 0.012121438980102539, 0.012620925903320312, 0.013120412826538086, 0.01361989974975586, 0.014119386672973633, 0.014618873596191406, 0.01511836051940918, 0.015617847442626953, 0.016117334365844727, 0.0166168212890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 9.0, 9.0, 7.0, 10.0, 23.0, 26.0, 24.0, 47.0, 27.0, 44.0, 51.0, 75.0, 82.0, 80.0, 90.0, 66.0, 45.0, 52.0, 39.0, 43.0, 19.0, 21.0, 18.0, 12.0, 11.0, 4.0, 12.0, 2.0, 3.0, 8.0, 1.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.006732940673828125, -0.00654226541519165, -0.006351590156555176, -0.006160914897918701, -0.0059702396392822266, -0.005779564380645752, -0.005588889122009277, -0.005398213863372803, -0.005207538604736328, -0.0050168633460998535, -0.004826188087463379, -0.004635512828826904, -0.00444483757019043, -0.004254162311553955, -0.0040634870529174805, -0.003872811794281006, -0.0036821365356445312, -0.0034914612770080566, -0.003300786018371582, -0.0031101107597351074, -0.002919435501098633, -0.002728760242462158, -0.0025380849838256836, -0.002347409725189209, -0.0021567344665527344, -0.0019660592079162598, -0.0017753839492797852, -0.0015847086906433105, -0.001394033432006836, -0.0012033581733703613, -0.0010126829147338867, -0.0008220076560974121, -0.0006313323974609375, -0.0004406571388244629, -0.0002499818801879883, -5.930662155151367e-05, 0.00013136863708496094, 0.00032204389572143555, 0.0005127191543579102, 0.0007033944129943848, 0.0008940696716308594, 0.001084744930267334, 0.0012754201889038086, 0.0014660954475402832, 0.0016567707061767578, 0.0018474459648132324, 0.002038121223449707, 0.0022287964820861816, 0.0024194717407226562, 0.002610146999359131, 0.0028008222579956055, 0.00299149751663208, 0.0031821727752685547, 0.0033728480339050293, 0.003563523292541504, 0.0037541985511779785, 0.003944873809814453, 0.004135549068450928, 0.004326224327087402, 0.004516899585723877, 0.0047075748443603516, 0.004898250102996826, 0.005088925361633301, 0.005279600620269775, 0.00547027587890625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 2.0, 1.0, 15.0, 7.0, 14.0, 11.0, 29.0, 22.0, 28.0, 37.0, 48.0, 50.0, 51.0, 63.0, 82.0, 74.0, 74.0, 64.0, 63.0, 50.0, 31.0, 26.0, 29.0, 20.0, 20.0, 13.0, 15.0, 8.0, 9.0, 6.0, 10.0, 3.0, 3.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4548749923706055, -5.286917209625244, -5.118958950042725, -4.951001167297363, -4.783043384552002, -4.615085601806641, -4.447127342224121, -4.27916955947876, -4.111211776733398, -3.943253755569458, -3.7752959728240967, -3.6073379516601562, -3.439380168914795, -3.2714221477508545, -3.103464126586914, -2.9355063438415527, -2.767548084259033, -2.5995900630950928, -2.4316322803497314, -2.263674259185791, -2.0957164764404297, -1.9277584552764893, -1.7598004341125488, -1.591842532157898, -1.423884630203247, -1.2559267282485962, -1.0879688262939453, -0.9200108051300049, -0.752052903175354, -0.5840950012207031, -0.4161369800567627, -0.24817907810211182, -0.08022117614746094, 0.08773675560951233, 0.2556946873664856, 0.42365264892578125, 0.5916105508804321, 0.759568452835083, 0.9275264739990234, 1.0954843759536743, 1.2634422779083252, 1.431400179862976, 1.599358081817627, 1.7673161029815674, 1.9352740049362183, 2.103231906890869, 2.2711899280548096, 2.43914794921875, 2.6071057319641113, 2.7750637531280518, 2.943021535873413, 3.1109795570373535, 3.278937339782715, 3.4468953609466553, 3.6148533821105957, 3.782811164855957, 3.9507691860198975, 4.118727207183838, 4.286684989929199, 4.454643249511719, 4.62260103225708, 4.790558815002441, 4.958517074584961, 5.126474857330322, 5.294432640075684]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 11.0, 8.0, 12.0, 12.0, 14.0, 16.0, 11.0, 11.0, 23.0, 32.0, 24.0, 29.0, 20.0, 33.0, 39.0, 42.0, 30.0, 47.0, 43.0, 37.0, 47.0, 31.0, 33.0, 40.0, 31.0, 25.0, 34.0, 32.0, 25.0, 23.0, 30.0, 24.0, 19.0, 25.0, 14.0, 7.0, 7.0, 12.0, 6.0, 11.0, 3.0, 6.0, 0.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.8671064376831055, -4.7142558097839355, -4.561405181884766, -4.4085540771484375, -4.255703449249268, -4.102852821350098, -3.9500021934509277, -3.7971513271331787, -3.6443004608154297, -3.4914498329162598, -3.3385989665985107, -3.185748338699341, -3.032897472381592, -2.880046844482422, -2.727196216583252, -2.574345350265503, -2.421494722366333, -2.268644094467163, -2.115793228149414, -1.9629426002502441, -1.8100917339324951, -1.6572411060333252, -1.5043903589248657, -1.3515396118164062, -1.1986888647079468, -1.0458381175994873, -0.8929873704910278, -0.7401366829872131, -0.5872859358787537, -0.4344351887702942, -0.2815845012664795, -0.12873375415802002, 0.024116992950439453, 0.17696772515773773, 0.329818457365036, 0.4826691746711731, 0.6355199217796326, 0.788370668888092, 0.9412213563919067, 1.0940721035003662, 1.2469228506088257, 1.3997735977172852, 1.5526243448257446, 1.705475091934204, 1.858325719833374, 2.011176586151123, 2.164027214050293, 2.316877841949463, 2.469728708267212, 2.622579336166382, 2.775430202484131, 2.928280830383301, 3.08113169670105, 3.2339823246002197, 3.3868331909179688, 3.5396838188171387, 3.6925344467163086, 3.8453850746154785, 3.9982359409332275, 4.151086807250977, 4.3039374351501465, 4.456788063049316, 4.609638690948486, 4.762489318847656, 4.915340423583984]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 11.0, 18.0, 32.0, 42.0, 67.0, 82.0, 147.0, 194.0, 301.0, 426.0, 638.0, 943.0, 1356.0, 1920.0, 2801.0, 3934.0, 5917.0, 8470.0, 12145.0, 17448.0, 25709.0, 37884.0, 55118.0, 79943.0, 111179.0, 137396.0, 141457.0, 118791.0, 88105.0, 61643.0, 42537.0, 29016.0, 19623.0, 13336.0, 9116.0, 6502.0, 4336.0, 2983.0, 2162.0, 1526.0, 1042.0, 710.0, 490.0, 356.0, 209.0, 177.0, 106.0, 74.0, 48.0, 28.0, 23.0, 13.0, 9.0, 5.0, 1.0, 5.0, 2.0, 1.0], "bins": [-5.39453125, -5.2266845703125, -5.058837890625, -4.8909912109375, -4.72314453125, -4.5552978515625, -4.387451171875, -4.2196044921875, -4.0517578125, -3.8839111328125, -3.716064453125, -3.5482177734375, -3.38037109375, -3.2125244140625, -3.044677734375, -2.8768310546875, -2.708984375, -2.5411376953125, -2.373291015625, -2.2054443359375, -2.03759765625, -1.8697509765625, -1.701904296875, -1.5340576171875, -1.3662109375, -1.1983642578125, -1.030517578125, -0.8626708984375, -0.69482421875, -0.5269775390625, -0.359130859375, -0.1912841796875, -0.0234375, 0.1444091796875, 0.312255859375, 0.4801025390625, 0.64794921875, 0.8157958984375, 0.983642578125, 1.1514892578125, 1.3193359375, 1.4871826171875, 1.655029296875, 1.8228759765625, 1.99072265625, 2.1585693359375, 2.326416015625, 2.4942626953125, 2.662109375, 2.8299560546875, 2.997802734375, 3.1656494140625, 3.33349609375, 3.5013427734375, 3.669189453125, 3.8370361328125, 4.0048828125, 4.1727294921875, 4.340576171875, 4.5084228515625, 4.67626953125, 4.8441162109375, 5.011962890625, 5.1798095703125, 5.34765625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 11.0, 9.0, 14.0, 7.0, 11.0, 8.0, 14.0, 14.0, 12.0, 15.0, 23.0, 24.0, 26.0, 28.0, 30.0, 37.0, 40.0, 39.0, 35.0, 52.0, 45.0, 42.0, 39.0, 39.0, 30.0, 31.0, 38.0, 22.0, 28.0, 23.0, 22.0, 35.0, 28.0, 21.0, 16.0, 22.0, 14.0, 13.0, 5.0, 7.0, 7.0, 5.0, 1.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.65234375, -4.50714111328125, -4.3619384765625, -4.21673583984375, -4.071533203125, -3.92633056640625, -3.7811279296875, -3.63592529296875, -3.49072265625, -3.34552001953125, -3.2003173828125, -3.05511474609375, -2.909912109375, -2.76470947265625, -2.6195068359375, -2.47430419921875, -2.3291015625, -2.18389892578125, -2.0386962890625, -1.89349365234375, -1.748291015625, -1.60308837890625, -1.4578857421875, -1.31268310546875, -1.16748046875, -1.02227783203125, -0.8770751953125, -0.73187255859375, -0.586669921875, -0.44146728515625, -0.2962646484375, -0.15106201171875, -0.005859375, 0.13934326171875, 0.2845458984375, 0.42974853515625, 0.574951171875, 0.72015380859375, 0.8653564453125, 1.01055908203125, 1.15576171875, 1.30096435546875, 1.4461669921875, 1.59136962890625, 1.736572265625, 1.88177490234375, 2.0269775390625, 2.17218017578125, 2.3173828125, 2.46258544921875, 2.6077880859375, 2.75299072265625, 2.898193359375, 3.04339599609375, 3.1885986328125, 3.33380126953125, 3.47900390625, 3.62420654296875, 3.7694091796875, 3.91461181640625, 4.059814453125, 4.20501708984375, 4.3502197265625, 4.49542236328125, 4.640625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 11.0, 8.0, 22.0, 22.0, 52.0, 56.0, 100.0, 176.0, 255.0, 412.0, 678.0, 1066.0, 1825.0, 2916.0, 4703.0, 7711.0, 12606.0, 21368.0, 36358.0, 62775.0, 107464.0, 170600.0, 206561.0, 163585.0, 101993.0, 59651.0, 34078.0, 20341.0, 12174.0, 7263.0, 4487.0, 2743.0, 1693.0, 1033.0, 678.0, 369.0, 283.0, 154.0, 102.0, 68.0, 43.0, 27.0, 14.0, 16.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.0390625, -7.79132080078125, -7.5435791015625, -7.29583740234375, -7.048095703125, -6.80035400390625, -6.5526123046875, -6.30487060546875, -6.05712890625, -5.80938720703125, -5.5616455078125, -5.31390380859375, -5.066162109375, -4.81842041015625, -4.5706787109375, -4.32293701171875, -4.0751953125, -3.82745361328125, -3.5797119140625, -3.33197021484375, -3.084228515625, -2.83648681640625, -2.5887451171875, -2.34100341796875, -2.09326171875, -1.84552001953125, -1.5977783203125, -1.35003662109375, -1.102294921875, -0.85455322265625, -0.6068115234375, -0.35906982421875, -0.111328125, 0.13641357421875, 0.3841552734375, 0.63189697265625, 0.879638671875, 1.12738037109375, 1.3751220703125, 1.62286376953125, 1.87060546875, 2.11834716796875, 2.3660888671875, 2.61383056640625, 2.861572265625, 3.10931396484375, 3.3570556640625, 3.60479736328125, 3.8525390625, 4.10028076171875, 4.3480224609375, 4.59576416015625, 4.843505859375, 5.09124755859375, 5.3389892578125, 5.58673095703125, 5.83447265625, 6.08221435546875, 6.3299560546875, 6.57769775390625, 6.825439453125, 7.07318115234375, 7.3209228515625, 7.56866455078125, 7.81640625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 10.0, 9.0, 11.0, 7.0, 6.0, 14.0, 10.0, 21.0, 15.0, 25.0, 24.0, 33.0, 19.0, 39.0, 32.0, 44.0, 43.0, 40.0, 48.0, 49.0, 33.0, 46.0, 40.0, 44.0, 36.0, 41.0, 27.0, 34.0, 22.0, 29.0, 23.0, 14.0, 16.0, 13.0, 16.0, 14.0, 5.0, 8.0, 7.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.76116943359375, -2.6590576171875, -2.55694580078125, -2.454833984375, -2.35272216796875, -2.2506103515625, -2.14849853515625, -2.04638671875, -1.94427490234375, -1.8421630859375, -1.74005126953125, -1.637939453125, -1.53582763671875, -1.4337158203125, -1.33160400390625, -1.2294921875, -1.12738037109375, -1.0252685546875, -0.92315673828125, -0.821044921875, -0.71893310546875, -0.6168212890625, -0.51470947265625, -0.41259765625, -0.31048583984375, -0.2083740234375, -0.10626220703125, -0.004150390625, 0.09796142578125, 0.2000732421875, 0.30218505859375, 0.404296875, 0.50640869140625, 0.6085205078125, 0.71063232421875, 0.812744140625, 0.91485595703125, 1.0169677734375, 1.11907958984375, 1.22119140625, 1.32330322265625, 1.4254150390625, 1.52752685546875, 1.629638671875, 1.73175048828125, 1.8338623046875, 1.93597412109375, 2.0380859375, 2.14019775390625, 2.2423095703125, 2.34442138671875, 2.446533203125, 2.54864501953125, 2.6507568359375, 2.75286865234375, 2.85498046875, 2.95709228515625, 3.0592041015625, 3.16131591796875, 3.263427734375, 3.36553955078125, 3.4676513671875, 3.56976318359375, 3.671875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 5.0, 9.0, 12.0, 13.0, 17.0, 24.0, 39.0, 57.0, 64.0, 83.0, 137.0, 172.0, 259.0, 351.0, 474.0, 609.0, 874.0, 1295.0, 1803.0, 2427.0, 3572.0, 5263.0, 8029.0, 12791.0, 21376.0, 38684.0, 78399.0, 195846.0, 355183.0, 163139.0, 68427.0, 34299.0, 19460.0, 11624.0, 7401.0, 4828.0, 3345.0, 2224.0, 1599.0, 1208.0, 868.0, 607.0, 450.0, 303.0, 249.0, 188.0, 126.0, 94.0, 72.0, 59.0, 38.0, 22.0, 19.0, 17.0, 9.0, 11.0, 2.0, 4.0, 2.0, 3.0], "bins": [-2.169921875, -2.10296630859375, -2.0360107421875, -1.96905517578125, -1.902099609375, -1.83514404296875, -1.7681884765625, -1.70123291015625, -1.63427734375, -1.56732177734375, -1.5003662109375, -1.43341064453125, -1.366455078125, -1.29949951171875, -1.2325439453125, -1.16558837890625, -1.0986328125, -1.03167724609375, -0.9647216796875, -0.89776611328125, -0.830810546875, -0.76385498046875, -0.6968994140625, -0.62994384765625, -0.56298828125, -0.49603271484375, -0.4290771484375, -0.36212158203125, -0.295166015625, -0.22821044921875, -0.1612548828125, -0.09429931640625, -0.02734375, 0.03961181640625, 0.1065673828125, 0.17352294921875, 0.240478515625, 0.30743408203125, 0.3743896484375, 0.44134521484375, 0.50830078125, 0.57525634765625, 0.6422119140625, 0.70916748046875, 0.776123046875, 0.84307861328125, 0.9100341796875, 0.97698974609375, 1.0439453125, 1.11090087890625, 1.1778564453125, 1.24481201171875, 1.311767578125, 1.37872314453125, 1.4456787109375, 1.51263427734375, 1.57958984375, 1.64654541015625, 1.7135009765625, 1.78045654296875, 1.847412109375, 1.91436767578125, 1.9813232421875, 2.04827880859375, 2.115234375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 5.0, 4.0, 4.0, 10.0, 8.0, 9.0, 14.0, 21.0, 27.0, 37.0, 63.0, 91.0, 99.0, 142.0, 106.0, 111.0, 76.0, 56.0, 27.0, 26.0, 33.0, 12.0, 4.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017499923706054688, -0.00016868487000465393, -0.00016237050294876099, -0.00015605613589286804, -0.0001497417688369751, -0.00014342740178108215, -0.0001371130347251892, -0.00013079866766929626, -0.00012448430061340332, -0.00011816993355751038, -0.00011185556650161743, -0.00010554119944572449, -9.922683238983154e-05, -9.29124653339386e-05, -8.659809827804565e-05, -8.028373122215271e-05, -7.396936416625977e-05, -6.765499711036682e-05, -6.134063005447388e-05, -5.502626299858093e-05, -4.871189594268799e-05, -4.2397528886795044e-05, -3.60831618309021e-05, -2.9768794775009155e-05, -2.345442771911621e-05, -1.7140060663223267e-05, -1.0825693607330322e-05, -4.511326551437378e-06, 1.8030405044555664e-06, 8.11740756034851e-06, 1.4431774616241455e-05, 2.07461416721344e-05, 2.7060508728027344e-05, 3.337487578392029e-05, 3.968924283981323e-05, 4.600360989570618e-05, 5.231797695159912e-05, 5.8632344007492065e-05, 6.494671106338501e-05, 7.126107811927795e-05, 7.75754451751709e-05, 8.388981223106384e-05, 9.020417928695679e-05, 9.651854634284973e-05, 0.00010283291339874268, 0.00010914728045463562, 0.00011546164751052856, 0.00012177601456642151, 0.00012809038162231445, 0.0001344047486782074, 0.00014071911573410034, 0.00014703348278999329, 0.00015334784984588623, 0.00015966221690177917, 0.00016597658395767212, 0.00017229095101356506, 0.000178605318069458, 0.00018491968512535095, 0.0001912340521812439, 0.00019754841923713684, 0.00020386278629302979, 0.00021017715334892273, 0.00021649152040481567, 0.00022280588746070862, 0.00022912025451660156]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 3.0, 3.0, 9.0, 16.0, 22.0, 12.0, 19.0, 33.0, 54.0, 62.0, 94.0, 137.0, 178.0, 252.0, 386.0, 529.0, 786.0, 1132.0, 1757.0, 2559.0, 3955.0, 5978.0, 9452.0, 15713.0, 27582.0, 54346.0, 126277.0, 352188.0, 253075.0, 90389.0, 42599.0, 22628.0, 12838.0, 8043.0, 5129.0, 3351.0, 2230.0, 1468.0, 994.0, 654.0, 489.0, 346.0, 213.0, 164.0, 120.0, 85.0, 61.0, 42.0, 37.0, 19.0, 21.0, 11.0, 4.0, 10.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.095703125, -2.0277099609375, -1.959716796875, -1.8917236328125, -1.82373046875, -1.7557373046875, -1.687744140625, -1.6197509765625, -1.5517578125, -1.4837646484375, -1.415771484375, -1.3477783203125, -1.27978515625, -1.2117919921875, -1.143798828125, -1.0758056640625, -1.0078125, -0.9398193359375, -0.871826171875, -0.8038330078125, -0.73583984375, -0.6678466796875, -0.599853515625, -0.5318603515625, -0.4638671875, -0.3958740234375, -0.327880859375, -0.2598876953125, -0.19189453125, -0.1239013671875, -0.055908203125, 0.0120849609375, 0.080078125, 0.1480712890625, 0.216064453125, 0.2840576171875, 0.35205078125, 0.4200439453125, 0.488037109375, 0.5560302734375, 0.6240234375, 0.6920166015625, 0.760009765625, 0.8280029296875, 0.89599609375, 0.9639892578125, 1.031982421875, 1.0999755859375, 1.16796875, 1.2359619140625, 1.303955078125, 1.3719482421875, 1.43994140625, 1.5079345703125, 1.575927734375, 1.6439208984375, 1.7119140625, 1.7799072265625, 1.847900390625, 1.9158935546875, 1.98388671875, 2.0518798828125, 2.119873046875, 2.1878662109375, 2.255859375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 7.0, 3.0, 6.0, 9.0, 6.0, 15.0, 11.0, 11.0, 14.0, 21.0, 26.0, 37.0, 44.0, 60.0, 55.0, 64.0, 98.0, 117.0, 82.0, 49.0, 58.0, 36.0, 41.0, 21.0, 18.0, 12.0, 18.0, 11.0, 15.0, 9.0, 5.0, 7.0, 2.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77197265625, -0.74627685546875, -0.7205810546875, -0.69488525390625, -0.669189453125, -0.64349365234375, -0.6177978515625, -0.59210205078125, -0.56640625, -0.54071044921875, -0.5150146484375, -0.48931884765625, -0.463623046875, -0.43792724609375, -0.4122314453125, -0.38653564453125, -0.36083984375, -0.33514404296875, -0.3094482421875, -0.28375244140625, -0.258056640625, -0.23236083984375, -0.2066650390625, -0.18096923828125, -0.1552734375, -0.12957763671875, -0.1038818359375, -0.07818603515625, -0.052490234375, -0.02679443359375, -0.0010986328125, 0.02459716796875, 0.05029296875, 0.07598876953125, 0.1016845703125, 0.12738037109375, 0.153076171875, 0.17877197265625, 0.2044677734375, 0.23016357421875, 0.255859375, 0.28155517578125, 0.3072509765625, 0.33294677734375, 0.358642578125, 0.38433837890625, 0.4100341796875, 0.43572998046875, 0.46142578125, 0.48712158203125, 0.5128173828125, 0.53851318359375, 0.564208984375, 0.58990478515625, 0.6156005859375, 0.64129638671875, 0.6669921875, 0.69268798828125, 0.7183837890625, 0.74407958984375, 0.769775390625, 0.79547119140625, 0.8211669921875, 0.84686279296875, 0.87255859375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 5.0, 9.0, 6.0, 15.0, 17.0, 26.0, 28.0, 31.0, 41.0, 44.0, 56.0, 65.0, 71.0, 69.0, 82.0, 83.0, 58.0, 41.0, 53.0, 32.0, 27.0, 31.0, 22.0, 12.0, 15.0, 9.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.814776420593262, -5.637646675109863, -5.460516452789307, -5.28338623046875, -5.106256484985352, -4.929126739501953, -4.7519965171813965, -4.57486629486084, -4.397736549377441, -4.220606803894043, -4.043476581573486, -3.866346597671509, -3.6892166137695312, -3.5120866298675537, -3.334956645965576, -3.1578266620635986, -2.980696678161621, -2.8035666942596436, -2.626436710357666, -2.4493067264556885, -2.272176742553711, -2.0950467586517334, -1.9179167747497559, -1.7407867908477783, -1.5636568069458008, -1.3865268230438232, -1.2093968391418457, -1.0322668552398682, -0.8551368713378906, -0.6780068874359131, -0.5008769035339355, -0.323746919631958, -0.14661693572998047, 0.03051304817199707, 0.2076430320739746, 0.38477301597595215, 0.5619029998779297, 0.7390329837799072, 0.9161629676818848, 1.0932929515838623, 1.2704229354858398, 1.4475529193878174, 1.624682903289795, 1.8018128871917725, 1.97894287109375, 2.1560728549957275, 2.333202838897705, 2.5103328227996826, 2.68746280670166, 2.8645927906036377, 3.0417227745056152, 3.2188527584075928, 3.3959827423095703, 3.573112726211548, 3.7502427101135254, 3.927372694015503, 4.1045026779174805, 4.281632423400879, 4.4587626457214355, 4.635892868041992, 4.813022613525391, 4.990152359008789, 5.167282581329346, 5.344412803649902, 5.521542549133301]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 3.0, 7.0, 12.0, 9.0, 9.0, 26.0, 16.0, 14.0, 21.0, 22.0, 26.0, 36.0, 25.0, 41.0, 40.0, 30.0, 52.0, 41.0, 38.0, 49.0, 36.0, 40.0, 53.0, 46.0, 34.0, 39.0, 25.0, 29.0, 27.0, 38.0, 18.0, 13.0, 21.0, 11.0, 10.0, 10.0, 6.0, 4.0, 1.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.505605697631836, -6.326276779174805, -6.146947860717773, -5.967618942260742, -5.788290023803711, -5.60896110534668, -5.429632186889648, -5.250303268432617, -5.070974349975586, -4.891645431518555, -4.712316513061523, -4.532987594604492, -4.353658676147461, -4.17432975769043, -3.9950008392333984, -3.815671920776367, -3.636343240737915, -3.457014322280884, -3.2776854038238525, -3.0983564853668213, -2.91902756690979, -2.739698648452759, -2.5603699684143066, -2.3810410499572754, -2.201712131500244, -2.022383213043213, -1.8430542945861816, -1.6637253761291504, -1.4843964576721191, -1.305067539215088, -1.1257387399673462, -0.9464098215103149, -0.7670807838439941, -0.5877518653869629, -0.40842297673225403, -0.22909408807754517, -0.049765169620513916, 0.12956374883651733, 0.3088926076889038, 0.48822152614593506, 0.6675504446029663, 0.8468793630599976, 1.0262082815170288, 1.2055370807647705, 1.3848659992218018, 1.564194917678833, 1.7435238361358643, 1.9228527545928955, 2.1021816730499268, 2.281510591506958, 2.4608395099639893, 2.6401684284210205, 2.8194973468780518, 2.998826265335083, 3.178154945373535, 3.3574838638305664, 3.5368127822875977, 3.716141700744629, 3.89547061920166, 4.074799537658691, 4.254128456115723, 4.433457374572754, 4.612786293029785, 4.792115211486816, 4.971444129943848]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 6.0, 19.0, 19.0, 26.0, 47.0, 52.0, 89.0, 154.0, 194.0, 278.0, 439.0, 691.0, 1001.0, 1484.0, 2287.0, 3808.0, 5844.0, 9384.0, 15115.0, 24578.0, 41068.0, 69926.0, 126993.0, 261829.0, 683580.0, 1339212.0, 900926.0, 348625.0, 155145.0, 81755.0, 46929.0, 27560.0, 16639.0, 10238.0, 6405.0, 4060.0, 2722.0, 1676.0, 1123.0, 743.0, 502.0, 358.0, 214.0, 169.0, 118.0, 71.0, 67.0, 35.0, 28.0, 15.0, 10.0, 9.0, 8.0, 5.0, 1.0, 2.0, 3.0, 2.0], "bins": [-6.8828125, -6.665283203125, -6.44775390625, -6.230224609375, -6.0126953125, -5.795166015625, -5.57763671875, -5.360107421875, -5.142578125, -4.925048828125, -4.70751953125, -4.489990234375, -4.2724609375, -4.054931640625, -3.83740234375, -3.619873046875, -3.40234375, -3.184814453125, -2.96728515625, -2.749755859375, -2.5322265625, -2.314697265625, -2.09716796875, -1.879638671875, -1.662109375, -1.444580078125, -1.22705078125, -1.009521484375, -0.7919921875, -0.574462890625, -0.35693359375, -0.139404296875, 0.078125, 0.295654296875, 0.51318359375, 0.730712890625, 0.9482421875, 1.165771484375, 1.38330078125, 1.600830078125, 1.818359375, 2.035888671875, 2.25341796875, 2.470947265625, 2.6884765625, 2.906005859375, 3.12353515625, 3.341064453125, 3.55859375, 3.776123046875, 3.99365234375, 4.211181640625, 4.4287109375, 4.646240234375, 4.86376953125, 5.081298828125, 5.298828125, 5.516357421875, 5.73388671875, 5.951416015625, 6.1689453125, 6.386474609375, 6.60400390625, 6.821533203125, 7.0390625]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 10.0, 10.0, 11.0, 13.0, 20.0, 27.0, 17.0, 16.0, 29.0, 21.0, 27.0, 41.0, 41.0, 38.0, 43.0, 44.0, 43.0, 41.0, 50.0, 46.0, 49.0, 41.0, 44.0, 34.0, 30.0, 32.0, 32.0, 27.0, 35.0, 14.0, 13.0, 13.0, 7.0, 5.0, 10.0, 1.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.6953125, -5.53515625, -5.375, -5.21484375, -5.0546875, -4.89453125, -4.734375, -4.57421875, -4.4140625, -4.25390625, -4.09375, -3.93359375, -3.7734375, -3.61328125, -3.453125, -3.29296875, -3.1328125, -2.97265625, -2.8125, -2.65234375, -2.4921875, -2.33203125, -2.171875, -2.01171875, -1.8515625, -1.69140625, -1.53125, -1.37109375, -1.2109375, -1.05078125, -0.890625, -0.73046875, -0.5703125, -0.41015625, -0.25, -0.08984375, 0.0703125, 0.23046875, 0.390625, 0.55078125, 0.7109375, 0.87109375, 1.03125, 1.19140625, 1.3515625, 1.51171875, 1.671875, 1.83203125, 1.9921875, 2.15234375, 2.3125, 2.47265625, 2.6328125, 2.79296875, 2.953125, 3.11328125, 3.2734375, 3.43359375, 3.59375, 3.75390625, 3.9140625, 4.07421875, 4.234375, 4.39453125, 4.5546875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 8.0, 9.0, 13.0, 17.0, 27.0, 43.0, 48.0, 79.0, 126.0, 150.0, 269.0, 338.0, 550.0, 779.0, 1176.0, 1780.0, 2709.0, 3911.0, 6107.0, 9522.0, 14986.0, 24653.0, 40567.0, 68967.0, 121680.0, 221093.0, 422529.0, 797823.0, 1046863.0, 643443.0, 336079.0, 180013.0, 99834.0, 57020.0, 33716.0, 20729.0, 12943.0, 8193.0, 5273.0, 3431.0, 2228.0, 1473.0, 1039.0, 668.0, 456.0, 320.0, 207.0, 128.0, 87.0, 69.0, 48.0, 27.0, 18.0, 13.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-5.81640625, -5.636474609375, -5.45654296875, -5.276611328125, -5.0966796875, -4.916748046875, -4.73681640625, -4.556884765625, -4.376953125, -4.197021484375, -4.01708984375, -3.837158203125, -3.6572265625, -3.477294921875, -3.29736328125, -3.117431640625, -2.9375, -2.757568359375, -2.57763671875, -2.397705078125, -2.2177734375, -2.037841796875, -1.85791015625, -1.677978515625, -1.498046875, -1.318115234375, -1.13818359375, -0.958251953125, -0.7783203125, -0.598388671875, -0.41845703125, -0.238525390625, -0.05859375, 0.121337890625, 0.30126953125, 0.481201171875, 0.6611328125, 0.841064453125, 1.02099609375, 1.200927734375, 1.380859375, 1.560791015625, 1.74072265625, 1.920654296875, 2.1005859375, 2.280517578125, 2.46044921875, 2.640380859375, 2.8203125, 3.000244140625, 3.18017578125, 3.360107421875, 3.5400390625, 3.719970703125, 3.89990234375, 4.079833984375, 4.259765625, 4.439697265625, 4.61962890625, 4.799560546875, 4.9794921875, 5.159423828125, 5.33935546875, 5.519287109375, 5.69921875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 9.0, 9.0, 4.0, 12.0, 18.0, 22.0, 35.0, 29.0, 38.0, 72.0, 67.0, 92.0, 119.0, 121.0, 160.0, 216.0, 234.0, 284.0, 329.0, 325.0, 308.0, 264.0, 252.0, 221.0, 144.0, 100.0, 120.0, 94.0, 83.0, 64.0, 46.0, 28.0, 37.0, 24.0, 20.0, 13.0, 16.0, 13.0, 8.0, 10.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.783203125, -2.7001953125, -2.6171875, -2.5341796875, -2.451171875, -2.3681640625, -2.28515625, -2.2021484375, -2.119140625, -2.0361328125, -1.953125, -1.8701171875, -1.787109375, -1.7041015625, -1.62109375, -1.5380859375, -1.455078125, -1.3720703125, -1.2890625, -1.2060546875, -1.123046875, -1.0400390625, -0.95703125, -0.8740234375, -0.791015625, -0.7080078125, -0.625, -0.5419921875, -0.458984375, -0.3759765625, -0.29296875, -0.2099609375, -0.126953125, -0.0439453125, 0.0390625, 0.1220703125, 0.205078125, 0.2880859375, 0.37109375, 0.4541015625, 0.537109375, 0.6201171875, 0.703125, 0.7861328125, 0.869140625, 0.9521484375, 1.03515625, 1.1181640625, 1.201171875, 1.2841796875, 1.3671875, 1.4501953125, 1.533203125, 1.6162109375, 1.69921875, 1.7822265625, 1.865234375, 1.9482421875, 2.03125, 2.1142578125, 2.197265625, 2.2802734375, 2.36328125, 2.4462890625, 2.529296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 4.0, 4.0, 9.0, 6.0, 8.0, 15.0, 24.0, 17.0, 28.0, 38.0, 43.0, 52.0, 54.0, 76.0, 60.0, 73.0, 61.0, 65.0, 50.0, 50.0, 52.0, 32.0, 26.0, 25.0, 15.0, 20.0, 23.0, 16.0, 9.0, 8.0, 10.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.343061923980713, -5.175854206085205, -5.008646011352539, -4.841438293457031, -4.674230575561523, -4.507022380828857, -4.33981466293335, -4.172606468200684, -4.005398750305176, -3.838190793991089, -3.670982837677002, -3.503775119781494, -3.3365671634674072, -3.1693592071533203, -3.0021514892578125, -2.8349435329437256, -2.6677355766296387, -2.5005276203155518, -2.333319664001465, -2.166111946105957, -1.9989039897918701, -1.8316960334777832, -1.6644881963729858, -1.4972803592681885, -1.3300724029541016, -1.1628644466400146, -0.9956566095352173, -0.8284487128257751, -0.661240816116333, -0.49403291940689087, -0.32682502269744873, -0.15961718559265137, 0.007590770721435547, 0.17479866743087769, 0.3420065641403198, 0.509214460849762, 0.6764223575592041, 0.8436302542686462, 1.0108381509780884, 1.1780459880828857, 1.3452539443969727, 1.5124619007110596, 1.679669737815857, 1.8468775749206543, 2.014085531234741, 2.181293487548828, 2.348501205444336, 2.515709161758423, 2.6829171180725098, 2.8501250743865967, 3.0173330307006836, 3.1845407485961914, 3.3517487049102783, 3.5189566612243652, 3.686164379119873, 3.85337233543396, 4.020580291748047, 4.187788009643555, 4.354996204376221, 4.5222039222717285, 4.6894121170043945, 4.856619834899902, 5.02382755279541, 5.191035270690918, 5.358243465423584]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 0.0, 5.0, 5.0, 13.0, 12.0, 13.0, 16.0, 21.0, 19.0, 28.0, 33.0, 25.0, 37.0, 33.0, 35.0, 33.0, 36.0, 37.0, 42.0, 34.0, 44.0, 37.0, 39.0, 46.0, 39.0, 34.0, 42.0, 28.0, 30.0, 29.0, 32.0, 17.0, 18.0, 17.0, 15.0, 8.0, 7.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-5.648920059204102, -5.479326248168945, -5.309732437133789, -5.140138626098633, -4.970544338226318, -4.800950527191162, -4.631356716156006, -4.46176290512085, -4.292169094085693, -4.122575283050537, -3.9529812335968018, -3.7833874225616455, -3.6137936115264893, -3.444199562072754, -3.2746057510375977, -3.1050119400024414, -2.935417890548706, -2.76582407951355, -2.5962300300598145, -2.426636219024658, -2.257042407989502, -2.0874485969543457, -1.9178545475006104, -1.748260736465454, -1.5786668062210083, -1.4090728759765625, -1.2394790649414062, -1.0698851346969604, -0.9002912640571594, -0.7306973934173584, -0.5611034631729126, -0.39150965213775635, -0.22191572189331055, -0.05232183635234833, 0.11727204918861389, 0.2868659496307373, 0.45645982027053833, 0.6260536909103394, 0.7956476211547852, 0.9652414321899414, 1.1348353624343872, 1.304429292678833, 1.4740231037139893, 1.643617033958435, 1.8132109642028809, 1.982804775238037, 2.1523985862731934, 2.3219923973083496, 2.491586446762085, 2.661180257797241, 2.8307743072509766, 3.000368118286133, 3.169961929321289, 3.3395557403564453, 3.5091497898101807, 3.678743600845337, 3.8483376502990723, 4.0179314613342285, 4.187525272369385, 4.357119560241699, 4.5267133712768555, 4.696307182312012, 4.865900993347168, 5.035494804382324, 5.2050886154174805]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 16.0, 15.0, 31.0, 32.0, 61.0, 78.0, 118.0, 182.0, 311.0, 491.0, 770.0, 1223.0, 1921.0, 3377.0, 5634.0, 9904.0, 16896.0, 29895.0, 53078.0, 95650.0, 172621.0, 258346.0, 175457.0, 96692.0, 53633.0, 30325.0, 17283.0, 9966.0, 5757.0, 3372.0, 2012.0, 1257.0, 765.0, 479.0, 336.0, 206.0, 126.0, 83.0, 59.0, 28.0, 26.0, 11.0, 14.0, 5.0, 7.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.552734375, -2.4765625, -2.400390625, -2.32421875, -2.248046875, -2.171875, -2.095703125, -2.01953125, -1.943359375, -1.8671875, -1.791015625, -1.71484375, -1.638671875, -1.5625, -1.486328125, -1.41015625, -1.333984375, -1.2578125, -1.181640625, -1.10546875, -1.029296875, -0.953125, -0.876953125, -0.80078125, -0.724609375, -0.6484375, -0.572265625, -0.49609375, -0.419921875, -0.34375, -0.267578125, -0.19140625, -0.115234375, -0.0390625, 0.037109375, 0.11328125, 0.189453125, 0.265625, 0.341796875, 0.41796875, 0.494140625, 0.5703125, 0.646484375, 0.72265625, 0.798828125, 0.875, 0.951171875, 1.02734375, 1.103515625, 1.1796875, 1.255859375, 1.33203125, 1.408203125, 1.484375, 1.560546875, 1.63671875, 1.712890625, 1.7890625, 1.865234375, 1.94140625, 2.017578125, 2.09375, 2.169921875, 2.24609375, 2.322265625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 2.0, 9.0, 7.0, 9.0, 14.0, 12.0, 22.0, 23.0, 26.0, 21.0, 34.0, 38.0, 30.0, 36.0, 34.0, 32.0, 37.0, 40.0, 43.0, 36.0, 30.0, 37.0, 35.0, 48.0, 34.0, 27.0, 40.0, 35.0, 29.0, 28.0, 25.0, 25.0, 19.0, 11.0, 10.0, 10.0, 13.0, 2.0, 7.0, 5.0, 3.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.30078125, -5.13372802734375, -4.9666748046875, -4.79962158203125, -4.632568359375, -4.46551513671875, -4.2984619140625, -4.13140869140625, -3.96435546875, -3.79730224609375, -3.6302490234375, -3.46319580078125, -3.296142578125, -3.12908935546875, -2.9620361328125, -2.79498291015625, -2.6279296875, -2.46087646484375, -2.2938232421875, -2.12677001953125, -1.959716796875, -1.79266357421875, -1.6256103515625, -1.45855712890625, -1.29150390625, -1.12445068359375, -0.9573974609375, -0.79034423828125, -0.623291015625, -0.45623779296875, -0.2891845703125, -0.12213134765625, 0.044921875, 0.21197509765625, 0.3790283203125, 0.54608154296875, 0.713134765625, 0.88018798828125, 1.0472412109375, 1.21429443359375, 1.38134765625, 1.54840087890625, 1.7154541015625, 1.88250732421875, 2.049560546875, 2.21661376953125, 2.3836669921875, 2.55072021484375, 2.7177734375, 2.88482666015625, 3.0518798828125, 3.21893310546875, 3.385986328125, 3.55303955078125, 3.7200927734375, 3.88714599609375, 4.05419921875, 4.22125244140625, 4.3883056640625, 4.55535888671875, 4.722412109375, 4.88946533203125, 5.0565185546875, 5.22357177734375, 5.390625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 3.0, 5.0, 3.0, 3.0, 16.0, 12.0, 24.0, 30.0, 53.0, 90.0, 109.0, 190.0, 230.0, 397.0, 544.0, 872.0, 1272.0, 2053.0, 3275.0, 5233.0, 8651.0, 14882.0, 26361.0, 47562.0, 88371.0, 174212.0, 303374.0, 171788.0, 87606.0, 46929.0, 26225.0, 14932.0, 8787.0, 5344.0, 3268.0, 1992.0, 1311.0, 833.0, 562.0, 395.0, 249.0, 165.0, 113.0, 67.0, 44.0, 43.0, 31.0, 11.0, 16.0, 6.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.693359375, -2.612945556640625, -2.53253173828125, -2.452117919921875, -2.3717041015625, -2.291290283203125, -2.21087646484375, -2.130462646484375, -2.050048828125, -1.969635009765625, -1.88922119140625, -1.808807373046875, -1.7283935546875, -1.647979736328125, -1.56756591796875, -1.487152099609375, -1.40673828125, -1.326324462890625, -1.24591064453125, -1.165496826171875, -1.0850830078125, -1.004669189453125, -0.92425537109375, -0.843841552734375, -0.763427734375, -0.683013916015625, -0.60260009765625, -0.522186279296875, -0.4417724609375, -0.361358642578125, -0.28094482421875, -0.200531005859375, -0.1201171875, -0.039703369140625, 0.04071044921875, 0.121124267578125, 0.2015380859375, 0.281951904296875, 0.36236572265625, 0.442779541015625, 0.523193359375, 0.603607177734375, 0.68402099609375, 0.764434814453125, 0.8448486328125, 0.925262451171875, 1.00567626953125, 1.086090087890625, 1.16650390625, 1.246917724609375, 1.32733154296875, 1.407745361328125, 1.4881591796875, 1.568572998046875, 1.64898681640625, 1.729400634765625, 1.809814453125, 1.890228271484375, 1.97064208984375, 2.051055908203125, 2.1314697265625, 2.211883544921875, 2.29229736328125, 2.372711181640625, 2.453125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 14.0, 14.0, 8.0, 11.0, 12.0, 25.0, 35.0, 15.0, 25.0, 22.0, 25.0, 32.0, 36.0, 37.0, 43.0, 30.0, 30.0, 28.0, 35.0, 47.0, 37.0, 49.0, 34.0, 48.0, 31.0, 31.0, 22.0, 31.0, 23.0, 29.0, 21.0, 18.0, 12.0, 13.0, 10.0, 7.0, 11.0, 7.0, 6.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.2578125, -3.15521240234375, -3.0526123046875, -2.95001220703125, -2.847412109375, -2.74481201171875, -2.6422119140625, -2.53961181640625, -2.43701171875, -2.33441162109375, -2.2318115234375, -2.12921142578125, -2.026611328125, -1.92401123046875, -1.8214111328125, -1.71881103515625, -1.6162109375, -1.51361083984375, -1.4110107421875, -1.30841064453125, -1.205810546875, -1.10321044921875, -1.0006103515625, -0.89801025390625, -0.79541015625, -0.69281005859375, -0.5902099609375, -0.48760986328125, -0.385009765625, -0.28240966796875, -0.1798095703125, -0.07720947265625, 0.025390625, 0.12799072265625, 0.2305908203125, 0.33319091796875, 0.435791015625, 0.53839111328125, 0.6409912109375, 0.74359130859375, 0.84619140625, 0.94879150390625, 1.0513916015625, 1.15399169921875, 1.256591796875, 1.35919189453125, 1.4617919921875, 1.56439208984375, 1.6669921875, 1.76959228515625, 1.8721923828125, 1.97479248046875, 2.077392578125, 2.17999267578125, 2.2825927734375, 2.38519287109375, 2.48779296875, 2.59039306640625, 2.6929931640625, 2.79559326171875, 2.898193359375, 3.00079345703125, 3.1033935546875, 3.20599365234375, 3.30859375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 9.0, 9.0, 9.0, 15.0, 37.0, 28.0, 68.0, 85.0, 147.0, 197.0, 326.0, 474.0, 842.0, 1419.0, 2601.0, 4897.0, 10081.0, 23067.0, 60630.0, 204557.0, 496363.0, 155377.0, 48872.0, 19625.0, 8852.0, 4330.0, 2321.0, 1300.0, 738.0, 427.0, 314.0, 197.0, 111.0, 68.0, 62.0, 32.0, 24.0, 15.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.027923583984375, -0.02706170082092285, -0.026199817657470703, -0.025337934494018555, -0.024476051330566406, -0.023614168167114258, -0.02275228500366211, -0.02189040184020996, -0.021028518676757812, -0.020166635513305664, -0.019304752349853516, -0.018442869186401367, -0.01758098602294922, -0.01671910285949707, -0.015857219696044922, -0.014995336532592773, -0.014133453369140625, -0.013271570205688477, -0.012409687042236328, -0.01154780387878418, -0.010685920715332031, -0.009824037551879883, -0.008962154388427734, -0.008100271224975586, -0.0072383880615234375, -0.006376504898071289, -0.005514621734619141, -0.004652738571166992, -0.0037908554077148438, -0.0029289722442626953, -0.002067089080810547, -0.0012052059173583984, -0.00034332275390625, 0.0005185604095458984, 0.0013804435729980469, 0.0022423267364501953, 0.0031042098999023438, 0.003966093063354492, 0.004827976226806641, 0.005689859390258789, 0.0065517425537109375, 0.007413625717163086, 0.008275508880615234, 0.009137392044067383, 0.009999275207519531, 0.01086115837097168, 0.011723041534423828, 0.012584924697875977, 0.013446807861328125, 0.014308691024780273, 0.015170574188232422, 0.01603245735168457, 0.01689434051513672, 0.017756223678588867, 0.018618106842041016, 0.019479990005493164, 0.020341873168945312, 0.02120375633239746, 0.02206563949584961, 0.022927522659301758, 0.023789405822753906, 0.024651288986206055, 0.025513172149658203, 0.02637505531311035, 0.0272369384765625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 3.0, 3.0, 6.0, 6.0, 10.0, 12.0, 17.0, 30.0, 27.0, 38.0, 59.0, 49.0, 53.0, 74.0, 95.0, 72.0, 95.0, 70.0, 51.0, 31.0, 50.0, 28.0, 25.0, 20.0, 18.0, 9.0, 4.0, 4.0, 8.0, 5.0, 2.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.761882781982422e-06, -8.531846106052399e-06, -8.301809430122375e-06, -8.071772754192352e-06, -7.841736078262329e-06, -7.611699402332306e-06, -7.381662726402283e-06, -7.1516260504722595e-06, -6.921589374542236e-06, -6.691552698612213e-06, -6.46151602268219e-06, -6.231479346752167e-06, -6.0014426708221436e-06, -5.77140599489212e-06, -5.541369318962097e-06, -5.311332643032074e-06, -5.081295967102051e-06, -4.851259291172028e-06, -4.621222615242004e-06, -4.391185939311981e-06, -4.161149263381958e-06, -3.931112587451935e-06, -3.7010759115219116e-06, -3.4710392355918884e-06, -3.2410025596618652e-06, -3.010965883731842e-06, -2.780929207801819e-06, -2.5508925318717957e-06, -2.3208558559417725e-06, -2.0908191800117493e-06, -1.860782504081726e-06, -1.6307458281517029e-06, -1.4007091522216797e-06, -1.1706724762916565e-06, -9.406358003616333e-07, -7.105991244316101e-07, -4.805624485015869e-07, -2.505257725715637e-07, -2.0489096641540527e-08, 2.0954757928848267e-07, 4.3958425521850586e-07, 6.69620931148529e-07, 8.996576070785522e-07, 1.1296942830085754e-06, 1.3597309589385986e-06, 1.5897676348686218e-06, 1.819804310798645e-06, 2.0498409867286682e-06, 2.2798776626586914e-06, 2.5099143385887146e-06, 2.739951014518738e-06, 2.969987690448761e-06, 3.200024366378784e-06, 3.4300610423088074e-06, 3.6600977182388306e-06, 3.890134394168854e-06, 4.120171070098877e-06, 4.3502077460289e-06, 4.580244421958923e-06, 4.8102810978889465e-06, 5.04031777381897e-06, 5.270354449748993e-06, 5.500391125679016e-06, 5.730427801609039e-06, 5.9604644775390625e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 14.0, 23.0, 44.0, 59.0, 75.0, 119.0, 180.0, 250.0, 350.0, 524.0, 735.0, 1115.0, 1599.0, 2369.0, 3668.0, 5601.0, 8821.0, 14304.0, 23599.0, 40701.0, 72811.0, 135402.0, 244617.0, 218738.0, 116856.0, 63530.0, 35703.0, 20807.0, 12702.0, 7880.0, 5026.0, 3300.0, 2253.0, 1449.0, 1067.0, 721.0, 466.0, 348.0, 222.0, 148.0, 108.0, 75.0, 45.0, 42.0, 26.0, 16.0, 15.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0], "bins": [-0.0150146484375, -0.014571547508239746, -0.014128446578979492, -0.013685345649719238, -0.013242244720458984, -0.01279914379119873, -0.012356042861938477, -0.011912941932678223, -0.011469841003417969, -0.011026740074157715, -0.010583639144897461, -0.010140538215637207, -0.009697437286376953, -0.0092543363571167, -0.008811235427856445, -0.008368134498596191, -0.007925033569335938, -0.007481932640075684, -0.00703883171081543, -0.006595730781555176, -0.006152629852294922, -0.005709528923034668, -0.005266427993774414, -0.00482332706451416, -0.004380226135253906, -0.003937125205993652, -0.0034940242767333984, -0.0030509233474731445, -0.0026078224182128906, -0.0021647214889526367, -0.0017216205596923828, -0.001278519630432129, -0.000835418701171875, -0.0003923177719116211, 5.078315734863281e-05, 0.0004938840866088867, 0.0009369850158691406, 0.0013800859451293945, 0.0018231868743896484, 0.0022662878036499023, 0.0027093887329101562, 0.00315248966217041, 0.003595590591430664, 0.004038691520690918, 0.004481792449951172, 0.004924893379211426, 0.00536799430847168, 0.005811095237731934, 0.0062541961669921875, 0.006697297096252441, 0.007140398025512695, 0.007583498954772949, 0.008026599884033203, 0.008469700813293457, 0.008912801742553711, 0.009355902671813965, 0.009799003601074219, 0.010242104530334473, 0.010685205459594727, 0.01112830638885498, 0.011571407318115234, 0.012014508247375488, 0.012457609176635742, 0.012900710105895996, 0.01334381103515625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 0.0, 6.0, 4.0, 12.0, 9.0, 13.0, 8.0, 17.0, 29.0, 28.0, 28.0, 30.0, 37.0, 48.0, 62.0, 85.0, 73.0, 78.0, 60.0, 73.0, 61.0, 46.0, 40.0, 22.0, 17.0, 13.0, 16.0, 16.0, 12.0, 13.0, 10.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0069122314453125, -0.006721079349517822, -0.0065299272537231445, -0.006338775157928467, -0.006147623062133789, -0.005956470966339111, -0.005765318870544434, -0.005574166774749756, -0.005383014678955078, -0.0051918625831604, -0.005000710487365723, -0.004809558391571045, -0.004618406295776367, -0.0044272541999816895, -0.004236102104187012, -0.004044950008392334, -0.0038537979125976562, -0.0036626458168029785, -0.0034714937210083008, -0.003280341625213623, -0.0030891895294189453, -0.0028980374336242676, -0.00270688533782959, -0.002515733242034912, -0.0023245811462402344, -0.0021334290504455566, -0.001942276954650879, -0.0017511248588562012, -0.0015599727630615234, -0.0013688206672668457, -0.001177668571472168, -0.0009865164756774902, -0.0007953643798828125, -0.0006042122840881348, -0.00041306018829345703, -0.0002219080924987793, -3.075599670410156e-05, 0.00016039609909057617, 0.0003515481948852539, 0.0005427002906799316, 0.0007338523864746094, 0.0009250044822692871, 0.0011161565780639648, 0.0013073086738586426, 0.0014984607696533203, 0.001689612865447998, 0.0018807649612426758, 0.0020719170570373535, 0.0022630691528320312, 0.002454221248626709, 0.0026453733444213867, 0.0028365254402160645, 0.003027677536010742, 0.00321882963180542, 0.0034099817276000977, 0.0036011338233947754, 0.003792285919189453, 0.003983438014984131, 0.004174590110778809, 0.004365742206573486, 0.004556894302368164, 0.004748046398162842, 0.0049391984939575195, 0.005130350589752197, 0.005321502685546875]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 8.0, 8.0, 5.0, 10.0, 16.0, 24.0, 21.0, 27.0, 38.0, 48.0, 54.0, 50.0, 73.0, 72.0, 73.0, 60.0, 61.0, 55.0, 52.0, 39.0, 29.0, 33.0, 19.0, 15.0, 30.0, 14.0, 13.0, 10.0, 7.0, 7.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.338839530944824, -5.170355796813965, -5.0018720626831055, -4.833388328552246, -4.664904594421387, -4.4964213371276855, -4.327937602996826, -4.159453868865967, -3.9909701347351074, -3.822486400604248, -3.6540026664733887, -3.4855191707611084, -3.317035436630249, -3.1485517024993896, -2.9800682067871094, -2.81158447265625, -2.6431007385253906, -2.4746170043945312, -2.306133270263672, -2.1376497745513916, -1.9691660404205322, -1.8006823062896729, -1.632198691368103, -1.4637150764465332, -1.2952313423156738, -1.1267476081848145, -0.9582639932632446, -0.78978031873703, -0.6212966442108154, -0.45281296968460083, -0.28432929515838623, -0.1158456802368164, 0.05263805389404297, 0.22112172842025757, 0.38960540294647217, 0.5580890774726868, 0.7265727519989014, 0.895056426525116, 1.0635401010513306, 1.2320237159729004, 1.4005074501037598, 1.5689911842346191, 1.737474799156189, 1.9059584140777588, 2.074442148208618, 2.2429258823394775, 2.411409378051758, 2.579893112182617, 2.7483768463134766, 2.916860580444336, 3.0853443145751953, 3.2538278102874756, 3.422311544418335, 3.5907952785491943, 3.7592787742614746, 3.927762508392334, 4.096246242523193, 4.264729976654053, 4.433213710784912, 4.6016974449157715, 4.770180702209473, 4.938664436340332, 5.107148170471191, 5.275631904602051, 5.44411563873291]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 0.0, 5.0, 5.0, 13.0, 11.0, 14.0, 17.0, 20.0, 19.0, 28.0, 33.0, 26.0, 36.0, 33.0, 35.0, 34.0, 35.0, 37.0, 43.0, 33.0, 43.0, 37.0, 39.0, 45.0, 41.0, 31.0, 44.0, 28.0, 31.0, 27.0, 31.0, 20.0, 17.0, 18.0, 15.0, 8.0, 6.0, 9.0, 8.0, 5.0, 5.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-5.602665901184082, -5.434182643890381, -5.2656989097595215, -5.09721565246582, -4.928732395172119, -4.76024866104126, -4.591765403747559, -4.423281669616699, -4.254798412322998, -4.086315155029297, -3.9178316593170166, -3.7493481636047363, -3.580864667892456, -3.412381172180176, -3.2438979148864746, -3.0754144191741943, -2.906931161880493, -2.738447666168213, -2.5699644088745117, -2.4014809131622314, -2.232997417449951, -2.06451416015625, -1.8960306644439697, -1.7275471687316895, -1.5590637922286987, -1.390580415725708, -1.2220969200134277, -1.053613543510437, -0.8851301074028015, -0.716646671295166, -0.5481632947921753, -0.379679799079895, -0.2111964225769043, -0.04271300137042999, 0.1257704198360443, 0.2942538261413574, 0.4627372622489929, 0.6312206983566284, 0.7997040748596191, 0.9681875705718994, 1.1366709470748901, 1.3051543235778809, 1.4736378192901611, 1.6421211957931519, 1.8106045722961426, 1.9790880680084229, 2.147571563720703, 2.3160548210144043, 2.4845383167266846, 2.653021812438965, 2.821505069732666, 2.9899885654449463, 3.1584720611572266, 3.3269553184509277, 3.495438814163208, 3.6639223098754883, 3.8324055671691895, 4.000888824462891, 4.16937255859375, 4.337855815887451, 4.506339073181152, 4.674822807312012, 4.843306064605713, 5.011789321899414, 5.180273056030273]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 10.0, 14.0, 24.0, 28.0, 38.0, 55.0, 109.0, 180.0, 234.0, 327.0, 528.0, 821.0, 1236.0, 1873.0, 2912.0, 4534.0, 7052.0, 10751.0, 16771.0, 26396.0, 41031.0, 65685.0, 101289.0, 146450.0, 173946.0, 150425.0, 105643.0, 69223.0, 43519.0, 27550.0, 17767.0, 11312.0, 7213.0, 4754.0, 3049.0, 1986.0, 1338.0, 808.0, 586.0, 401.0, 229.0, 166.0, 90.0, 67.0, 45.0, 26.0, 26.0, 13.0, 8.0, 2.0, 5.0, 4.0, 3.0, 3.0, 3.0], "bins": [-7.4140625, -7.193115234375, -6.97216796875, -6.751220703125, -6.5302734375, -6.309326171875, -6.08837890625, -5.867431640625, -5.646484375, -5.425537109375, -5.20458984375, -4.983642578125, -4.7626953125, -4.541748046875, -4.32080078125, -4.099853515625, -3.87890625, -3.657958984375, -3.43701171875, -3.216064453125, -2.9951171875, -2.774169921875, -2.55322265625, -2.332275390625, -2.111328125, -1.890380859375, -1.66943359375, -1.448486328125, -1.2275390625, -1.006591796875, -0.78564453125, -0.564697265625, -0.34375, -0.122802734375, 0.09814453125, 0.319091796875, 0.5400390625, 0.760986328125, 0.98193359375, 1.202880859375, 1.423828125, 1.644775390625, 1.86572265625, 2.086669921875, 2.3076171875, 2.528564453125, 2.74951171875, 2.970458984375, 3.19140625, 3.412353515625, 3.63330078125, 3.854248046875, 4.0751953125, 4.296142578125, 4.51708984375, 4.738037109375, 4.958984375, 5.179931640625, 5.40087890625, 5.621826171875, 5.8427734375, 6.063720703125, 6.28466796875, 6.505615234375, 6.7265625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 14.0, 7.0, 14.0, 13.0, 21.0, 16.0, 21.0, 30.0, 33.0, 29.0, 27.0, 27.0, 36.0, 36.0, 42.0, 42.0, 40.0, 53.0, 44.0, 36.0, 37.0, 46.0, 42.0, 29.0, 43.0, 41.0, 26.0, 26.0, 22.0, 17.0, 16.0, 15.0, 7.0, 7.0, 8.0, 7.0, 6.0, 8.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.69921875, -5.5350341796875, -5.370849609375, -5.2066650390625, -5.04248046875, -4.8782958984375, -4.714111328125, -4.5499267578125, -4.3857421875, -4.2215576171875, -4.057373046875, -3.8931884765625, -3.72900390625, -3.5648193359375, -3.400634765625, -3.2364501953125, -3.072265625, -2.9080810546875, -2.743896484375, -2.5797119140625, -2.41552734375, -2.2513427734375, -2.087158203125, -1.9229736328125, -1.7587890625, -1.5946044921875, -1.430419921875, -1.2662353515625, -1.10205078125, -0.9378662109375, -0.773681640625, -0.6094970703125, -0.4453125, -0.2811279296875, -0.116943359375, 0.0472412109375, 0.21142578125, 0.3756103515625, 0.539794921875, 0.7039794921875, 0.8681640625, 1.0323486328125, 1.196533203125, 1.3607177734375, 1.52490234375, 1.6890869140625, 1.853271484375, 2.0174560546875, 2.181640625, 2.3458251953125, 2.510009765625, 2.6741943359375, 2.83837890625, 3.0025634765625, 3.166748046875, 3.3309326171875, 3.4951171875, 3.6593017578125, 3.823486328125, 3.9876708984375, 4.15185546875, 4.3160400390625, 4.480224609375, 4.6444091796875, 4.80859375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 11.0, 15.0, 31.0, 27.0, 66.0, 96.0, 127.0, 202.0, 323.0, 449.0, 662.0, 1041.0, 1675.0, 2491.0, 3993.0, 6384.0, 9800.0, 15871.0, 24904.0, 39318.0, 62843.0, 97077.0, 140631.0, 170055.0, 154431.0, 113644.0, 74265.0, 47414.0, 29757.0, 18688.0, 11536.0, 7437.0, 4579.0, 3042.0, 1975.0, 1217.0, 838.0, 557.0, 356.0, 237.0, 163.0, 104.0, 69.0, 46.0, 31.0, 23.0, 21.0, 8.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.046875, -6.831298828125, -6.61572265625, -6.400146484375, -6.1845703125, -5.968994140625, -5.75341796875, -5.537841796875, -5.322265625, -5.106689453125, -4.89111328125, -4.675537109375, -4.4599609375, -4.244384765625, -4.02880859375, -3.813232421875, -3.59765625, -3.382080078125, -3.16650390625, -2.950927734375, -2.7353515625, -2.519775390625, -2.30419921875, -2.088623046875, -1.873046875, -1.657470703125, -1.44189453125, -1.226318359375, -1.0107421875, -0.795166015625, -0.57958984375, -0.364013671875, -0.1484375, 0.067138671875, 0.28271484375, 0.498291015625, 0.7138671875, 0.929443359375, 1.14501953125, 1.360595703125, 1.576171875, 1.791748046875, 2.00732421875, 2.222900390625, 2.4384765625, 2.654052734375, 2.86962890625, 3.085205078125, 3.30078125, 3.516357421875, 3.73193359375, 3.947509765625, 4.1630859375, 4.378662109375, 4.59423828125, 4.809814453125, 5.025390625, 5.240966796875, 5.45654296875, 5.672119140625, 5.8876953125, 6.103271484375, 6.31884765625, 6.534423828125, 6.75]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 5.0, 4.0, 11.0, 4.0, 16.0, 7.0, 20.0, 18.0, 13.0, 21.0, 19.0, 25.0, 28.0, 28.0, 32.0, 38.0, 47.0, 33.0, 35.0, 51.0, 43.0, 36.0, 42.0, 45.0, 35.0, 39.0, 29.0, 28.0, 30.0, 25.0, 34.0, 26.0, 14.0, 26.0, 17.0, 12.0, 14.0, 10.0, 12.0, 8.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.197265625, -3.100433349609375, -3.00360107421875, -2.906768798828125, -2.8099365234375, -2.713104248046875, -2.61627197265625, -2.519439697265625, -2.422607421875, -2.325775146484375, -2.22894287109375, -2.132110595703125, -2.0352783203125, -1.938446044921875, -1.84161376953125, -1.744781494140625, -1.64794921875, -1.551116943359375, -1.45428466796875, -1.357452392578125, -1.2606201171875, -1.163787841796875, -1.06695556640625, -0.970123291015625, -0.873291015625, -0.776458740234375, -0.67962646484375, -0.582794189453125, -0.4859619140625, -0.389129638671875, -0.29229736328125, -0.195465087890625, -0.0986328125, -0.001800537109375, 0.09503173828125, 0.191864013671875, 0.2886962890625, 0.385528564453125, 0.48236083984375, 0.579193115234375, 0.676025390625, 0.772857666015625, 0.86968994140625, 0.966522216796875, 1.0633544921875, 1.160186767578125, 1.25701904296875, 1.353851318359375, 1.45068359375, 1.547515869140625, 1.64434814453125, 1.741180419921875, 1.8380126953125, 1.934844970703125, 2.03167724609375, 2.128509521484375, 2.225341796875, 2.322174072265625, 2.41900634765625, 2.515838623046875, 2.6126708984375, 2.709503173828125, 2.80633544921875, 2.903167724609375, 3.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 18.0, 17.0, 14.0, 32.0, 50.0, 50.0, 98.0, 155.0, 191.0, 283.0, 458.0, 730.0, 1156.0, 1975.0, 3227.0, 5537.0, 9399.0, 17999.0, 39961.0, 115719.0, 500509.0, 234410.0, 61125.0, 25342.0, 12368.0, 7135.0, 4166.0, 2384.0, 1454.0, 886.0, 568.0, 395.0, 231.0, 165.0, 109.0, 73.0, 48.0, 34.0, 25.0, 14.0, 12.0, 11.0, 6.0, 2.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.955078125, -2.8619384765625, -2.768798828125, -2.6756591796875, -2.58251953125, -2.4893798828125, -2.396240234375, -2.3031005859375, -2.2099609375, -2.1168212890625, -2.023681640625, -1.9305419921875, -1.83740234375, -1.7442626953125, -1.651123046875, -1.5579833984375, -1.46484375, -1.3717041015625, -1.278564453125, -1.1854248046875, -1.09228515625, -0.9991455078125, -0.906005859375, -0.8128662109375, -0.7197265625, -0.6265869140625, -0.533447265625, -0.4403076171875, -0.34716796875, -0.2540283203125, -0.160888671875, -0.0677490234375, 0.025390625, 0.1185302734375, 0.211669921875, 0.3048095703125, 0.39794921875, 0.4910888671875, 0.584228515625, 0.6773681640625, 0.7705078125, 0.8636474609375, 0.956787109375, 1.0499267578125, 1.14306640625, 1.2362060546875, 1.329345703125, 1.4224853515625, 1.515625, 1.6087646484375, 1.701904296875, 1.7950439453125, 1.88818359375, 1.9813232421875, 2.074462890625, 2.1676025390625, 2.2607421875, 2.3538818359375, 2.447021484375, 2.5401611328125, 2.63330078125, 2.7264404296875, 2.819580078125, 2.9127197265625, 3.005859375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 11.0, 3.0, 16.0, 19.0, 22.0, 20.0, 32.0, 53.0, 92.0, 106.0, 154.0, 132.0, 97.0, 65.0, 65.0, 29.0, 24.0, 19.0, 6.0, 14.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00015354156494140625, -0.00014801695942878723, -0.0001424923539161682, -0.0001369677484035492, -0.00013144314289093018, -0.00012591853737831116, -0.00012039393186569214, -0.00011486932635307312, -0.0001093447208404541, -0.00010382011532783508, -9.829550981521606e-05, -9.277090430259705e-05, -8.724629878997803e-05, -8.172169327735901e-05, -7.619708776473999e-05, -7.067248225212097e-05, -6.514787673950195e-05, -5.9623271226882935e-05, -5.4098665714263916e-05, -4.85740602016449e-05, -4.304945468902588e-05, -3.752484917640686e-05, -3.200024366378784e-05, -2.6475638151168823e-05, -2.0951032638549805e-05, -1.5426427125930786e-05, -9.901821613311768e-06, -4.377216100692749e-06, 1.1473894119262695e-06, 6.671994924545288e-06, 1.2196600437164307e-05, 1.7721205949783325e-05, 2.3245811462402344e-05, 2.8770416975021362e-05, 3.429502248764038e-05, 3.98196280002594e-05, 4.534423351287842e-05, 5.0868839025497437e-05, 5.6393444538116455e-05, 6.191805005073547e-05, 6.744265556335449e-05, 7.296726107597351e-05, 7.849186658859253e-05, 8.401647210121155e-05, 8.954107761383057e-05, 9.506568312644958e-05, 0.0001005902886390686, 0.00010611489415168762, 0.00011163949966430664, 0.00011716410517692566, 0.00012268871068954468, 0.0001282133162021637, 0.00013373792171478271, 0.00013926252722740173, 0.00014478713274002075, 0.00015031173825263977, 0.0001558363437652588, 0.0001613609492778778, 0.00016688555479049683, 0.00017241016030311584, 0.00017793476581573486, 0.00018345937132835388, 0.0001889839768409729, 0.00019450858235359192, 0.00020003318786621094]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 10.0, 11.0, 18.0, 30.0, 43.0, 53.0, 85.0, 107.0, 135.0, 236.0, 282.0, 467.0, 685.0, 994.0, 1459.0, 2317.0, 3526.0, 5637.0, 9483.0, 16513.0, 32075.0, 73698.0, 252571.0, 429167.0, 120266.0, 44711.0, 21714.0, 12242.0, 7300.0, 4405.0, 2861.0, 1782.0, 1136.0, 819.0, 507.0, 347.0, 249.0, 185.0, 126.0, 91.0, 63.0, 57.0, 19.0, 19.0, 20.0, 14.0, 9.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-2.369140625, -2.295623779296875, -2.22210693359375, -2.148590087890625, -2.0750732421875, -2.001556396484375, -1.92803955078125, -1.854522705078125, -1.781005859375, -1.707489013671875, -1.63397216796875, -1.560455322265625, -1.4869384765625, -1.413421630859375, -1.33990478515625, -1.266387939453125, -1.19287109375, -1.119354248046875, -1.04583740234375, -0.972320556640625, -0.8988037109375, -0.825286865234375, -0.75177001953125, -0.678253173828125, -0.604736328125, -0.531219482421875, -0.45770263671875, -0.384185791015625, -0.3106689453125, -0.237152099609375, -0.16363525390625, -0.090118408203125, -0.0166015625, 0.056915283203125, 0.13043212890625, 0.203948974609375, 0.2774658203125, 0.350982666015625, 0.42449951171875, 0.498016357421875, 0.571533203125, 0.645050048828125, 0.71856689453125, 0.792083740234375, 0.8656005859375, 0.939117431640625, 1.01263427734375, 1.086151123046875, 1.15966796875, 1.233184814453125, 1.30670166015625, 1.380218505859375, 1.4537353515625, 1.527252197265625, 1.60076904296875, 1.674285888671875, 1.747802734375, 1.821319580078125, 1.89483642578125, 1.968353271484375, 2.0418701171875, 2.115386962890625, 2.18890380859375, 2.262420654296875, 2.3359375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 8.0, 4.0, 12.0, 8.0, 13.0, 18.0, 18.0, 22.0, 26.0, 33.0, 39.0, 60.0, 102.0, 120.0, 107.0, 93.0, 78.0, 57.0, 38.0, 28.0, 17.0, 10.0, 20.0, 12.0, 8.0, 9.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.94482421875, -0.9187393188476562, -0.8926544189453125, -0.8665695190429688, -0.840484619140625, -0.8143997192382812, -0.7883148193359375, -0.7622299194335938, -0.73614501953125, -0.7100601196289062, -0.6839752197265625, -0.6578903198242188, -0.631805419921875, -0.6057205200195312, -0.5796356201171875, -0.5535507202148438, -0.5274658203125, -0.5013809204101562, -0.4752960205078125, -0.44921112060546875, -0.423126220703125, -0.39704132080078125, -0.3709564208984375, -0.34487152099609375, -0.31878662109375, -0.29270172119140625, -0.2666168212890625, -0.24053192138671875, -0.214447021484375, -0.18836212158203125, -0.1622772216796875, -0.13619232177734375, -0.110107421875, -0.08402252197265625, -0.0579376220703125, -0.03185272216796875, -0.005767822265625, 0.02031707763671875, 0.0464019775390625, 0.07248687744140625, 0.09857177734375, 0.12465667724609375, 0.1507415771484375, 0.17682647705078125, 0.202911376953125, 0.22899627685546875, 0.2550811767578125, 0.28116607666015625, 0.3072509765625, 0.33333587646484375, 0.3594207763671875, 0.38550567626953125, 0.411590576171875, 0.43767547607421875, 0.4637603759765625, 0.48984527587890625, 0.51593017578125, 0.5420150756835938, 0.5680999755859375, 0.5941848754882812, 0.620269775390625, 0.6463546752929688, 0.6724395751953125, 0.6985244750976562, 0.724609375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 10.0, 7.0, 13.0, 11.0, 18.0, 26.0, 22.0, 34.0, 40.0, 41.0, 56.0, 75.0, 77.0, 79.0, 72.0, 65.0, 59.0, 55.0, 46.0, 38.0, 28.0, 25.0, 16.0, 17.0, 15.0, 12.0, 10.0, 9.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6575727462768555, -5.475069999694824, -5.292567729949951, -5.11006498336792, -4.927562713623047, -4.745059967041016, -4.562557220458984, -4.380054950714111, -4.197552680969238, -4.015049934387207, -3.832547664642334, -3.6500449180603027, -3.4675426483154297, -3.2850399017333984, -3.1025373935699463, -2.920034885406494, -2.737532138824463, -2.5550296306610107, -2.3725271224975586, -2.1900243759155273, -2.0075221061706543, -1.8250194787979126, -1.642516851425171, -1.4600143432617188, -1.2775118350982666, -1.0950093269348145, -0.9125067591667175, -0.7300041913986206, -0.5475016832351685, -0.3649991750717163, -0.1824965476989746, 5.9604644775390625e-06, 0.1825084686279297, 0.3650110065937042, 0.5475135445594788, 0.7300161123275757, 0.9125186204910278, 1.09502112865448, 1.2775237560272217, 1.4600262641906738, 1.642528772354126, 1.8250312805175781, 2.0075337886810303, 2.1900362968444824, 2.3725390434265137, 2.5550413131713867, 2.737544059753418, 2.92004656791687, 3.1025490760803223, 3.2850515842437744, 3.4675540924072266, 3.650056838989258, 3.832559108734131, 4.015061855316162, 4.197564125061035, 4.380066871643066, 4.562569618225098, 4.745072364807129, 4.927574634552002, 5.110077381134033, 5.292579650878906, 5.4750823974609375, 5.657585144042969, 5.840087413787842, 6.022589683532715]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 9.0, 9.0, 15.0, 6.0, 16.0, 24.0, 15.0, 25.0, 31.0, 26.0, 26.0, 31.0, 37.0, 40.0, 42.0, 40.0, 39.0, 34.0, 47.0, 46.0, 40.0, 44.0, 45.0, 31.0, 39.0, 33.0, 34.0, 26.0, 19.0, 21.0, 23.0, 13.0, 16.0, 9.0, 11.0, 10.0, 4.0, 9.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.743968486785889, -5.566460609436035, -5.388952255249023, -5.21144437789917, -5.033936500549316, -4.856428623199463, -4.678920745849609, -4.501412391662598, -4.323904514312744, -4.146396636962891, -3.968888521194458, -3.7913804054260254, -3.613872528076172, -3.4363646507263184, -3.2588565349578857, -3.081348419189453, -2.9038405418395996, -2.726332664489746, -2.5488245487213135, -2.371316432952881, -2.1938085556030273, -2.016300678253174, -1.8387925624847412, -1.6612845659255981, -1.483776569366455, -1.306268572807312, -1.128760576248169, -0.9512525796890259, -0.7737445831298828, -0.5962365865707397, -0.4187285900115967, -0.2412205934524536, -0.06371259689331055, 0.11379539966583252, 0.2913033962249756, 0.46881139278411865, 0.6463193893432617, 0.8238273859024048, 1.0013353824615479, 1.178843379020691, 1.356351375579834, 1.533859372138977, 1.7113673686981201, 1.8888753652572632, 2.0663833618164062, 2.2438912391662598, 2.4213993549346924, 2.598907470703125, 2.7764153480529785, 2.953923225402832, 3.1314313411712646, 3.3089394569396973, 3.486447334289551, 3.6639552116394043, 3.841463327407837, 4.0189714431762695, 4.196479320526123, 4.373987197875977, 4.551495552062988, 4.729003429412842, 4.906511306762695, 5.084019184112549, 5.261527061462402, 5.439035415649414, 5.616543292999268]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 5.0, 6.0, 7.0, 9.0, 12.0, 12.0, 16.0, 43.0, 51.0, 55.0, 92.0, 166.0, 253.0, 356.0, 546.0, 866.0, 1353.0, 2145.0, 3604.0, 5866.0, 10001.0, 17335.0, 30146.0, 54123.0, 102495.0, 216725.0, 598101.0, 1453623.0, 1037448.0, 346923.0, 143749.0, 73323.0, 39113.0, 22375.0, 13116.0, 7658.0, 4571.0, 2909.0, 1765.0, 1121.0, 676.0, 527.0, 330.0, 201.0, 168.0, 99.0, 61.0, 47.0, 28.0, 18.0, 20.0, 14.0, 10.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-7.84765625, -7.60052490234375, -7.3533935546875, -7.10626220703125, -6.859130859375, -6.61199951171875, -6.3648681640625, -6.11773681640625, -5.87060546875, -5.62347412109375, -5.3763427734375, -5.12921142578125, -4.882080078125, -4.63494873046875, -4.3878173828125, -4.14068603515625, -3.8935546875, -3.64642333984375, -3.3992919921875, -3.15216064453125, -2.905029296875, -2.65789794921875, -2.4107666015625, -2.16363525390625, -1.91650390625, -1.66937255859375, -1.4222412109375, -1.17510986328125, -0.927978515625, -0.68084716796875, -0.4337158203125, -0.18658447265625, 0.060546875, 0.30767822265625, 0.5548095703125, 0.80194091796875, 1.049072265625, 1.29620361328125, 1.5433349609375, 1.79046630859375, 2.03759765625, 2.28472900390625, 2.5318603515625, 2.77899169921875, 3.026123046875, 3.27325439453125, 3.5203857421875, 3.76751708984375, 4.0146484375, 4.26177978515625, 4.5089111328125, 4.75604248046875, 5.003173828125, 5.25030517578125, 5.4974365234375, 5.74456787109375, 5.99169921875, 6.23883056640625, 6.4859619140625, 6.73309326171875, 6.980224609375, 7.22735595703125, 7.4744873046875, 7.72161865234375, 7.96875]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 5.0, 8.0, 10.0, 9.0, 16.0, 18.0, 19.0, 16.0, 24.0, 36.0, 30.0, 33.0, 30.0, 31.0, 49.0, 43.0, 47.0, 42.0, 39.0, 45.0, 41.0, 43.0, 46.0, 36.0, 47.0, 34.0, 29.0, 26.0, 27.0, 15.0, 16.0, 16.0, 14.0, 9.0, 11.0, 4.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.67022705078125, -4.5123291015625, -4.35443115234375, -4.196533203125, -4.03863525390625, -3.8807373046875, -3.72283935546875, -3.56494140625, -3.40704345703125, -3.2491455078125, -3.09124755859375, -2.933349609375, -2.77545166015625, -2.6175537109375, -2.45965576171875, -2.3017578125, -2.14385986328125, -1.9859619140625, -1.82806396484375, -1.670166015625, -1.51226806640625, -1.3543701171875, -1.19647216796875, -1.03857421875, -0.88067626953125, -0.7227783203125, -0.56488037109375, -0.406982421875, -0.24908447265625, -0.0911865234375, 0.06671142578125, 0.224609375, 0.38250732421875, 0.5404052734375, 0.69830322265625, 0.856201171875, 1.01409912109375, 1.1719970703125, 1.32989501953125, 1.48779296875, 1.64569091796875, 1.8035888671875, 1.96148681640625, 2.119384765625, 2.27728271484375, 2.4351806640625, 2.59307861328125, 2.7509765625, 2.90887451171875, 3.0667724609375, 3.22467041015625, 3.382568359375, 3.54046630859375, 3.6983642578125, 3.85626220703125, 4.01416015625, 4.17205810546875, 4.3299560546875, 4.48785400390625, 4.645751953125, 4.80364990234375, 4.9615478515625, 5.11944580078125, 5.27734375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 11.0, 21.0, 32.0, 31.0, 51.0, 88.0, 145.0, 191.0, 293.0, 478.0, 707.0, 1135.0, 1558.0, 2383.0, 3803.0, 5602.0, 8673.0, 13440.0, 21011.0, 34398.0, 55595.0, 92523.0, 159478.0, 287121.0, 533153.0, 940268.0, 892057.0, 494532.0, 268213.0, 150026.0, 86846.0, 52100.0, 31789.0, 20065.0, 12917.0, 8126.0, 5284.0, 3505.0, 2298.0, 1476.0, 961.0, 644.0, 442.0, 297.0, 160.0, 118.0, 80.0, 60.0, 36.0, 24.0, 16.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-5.75390625, -5.5792236328125, -5.404541015625, -5.2298583984375, -5.05517578125, -4.8804931640625, -4.705810546875, -4.5311279296875, -4.3564453125, -4.1817626953125, -4.007080078125, -3.8323974609375, -3.65771484375, -3.4830322265625, -3.308349609375, -3.1336669921875, -2.958984375, -2.7843017578125, -2.609619140625, -2.4349365234375, -2.26025390625, -2.0855712890625, -1.910888671875, -1.7362060546875, -1.5615234375, -1.3868408203125, -1.212158203125, -1.0374755859375, -0.86279296875, -0.6881103515625, -0.513427734375, -0.3387451171875, -0.1640625, 0.0106201171875, 0.185302734375, 0.3599853515625, 0.53466796875, 0.7093505859375, 0.884033203125, 1.0587158203125, 1.2333984375, 1.4080810546875, 1.582763671875, 1.7574462890625, 1.93212890625, 2.1068115234375, 2.281494140625, 2.4561767578125, 2.630859375, 2.8055419921875, 2.980224609375, 3.1549072265625, 3.32958984375, 3.5042724609375, 3.678955078125, 3.8536376953125, 4.0283203125, 4.2030029296875, 4.377685546875, 4.5523681640625, 4.72705078125, 4.9017333984375, 5.076416015625, 5.2510986328125, 5.42578125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 12.0, 7.0, 16.0, 20.0, 24.0, 17.0, 25.0, 31.0, 30.0, 53.0, 56.0, 70.0, 78.0, 100.0, 115.0, 130.0, 179.0, 196.0, 235.0, 257.0, 275.0, 284.0, 251.0, 239.0, 209.0, 192.0, 149.0, 129.0, 106.0, 99.0, 93.0, 75.0, 75.0, 48.0, 41.0, 31.0, 33.0, 22.0, 15.0, 6.0, 12.0, 6.0, 4.0, 6.0, 5.0, 6.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.28125, -2.2078857421875, -2.134521484375, -2.0611572265625, -1.98779296875, -1.9144287109375, -1.841064453125, -1.7677001953125, -1.6943359375, -1.6209716796875, -1.547607421875, -1.4742431640625, -1.40087890625, -1.3275146484375, -1.254150390625, -1.1807861328125, -1.107421875, -1.0340576171875, -0.960693359375, -0.8873291015625, -0.81396484375, -0.7406005859375, -0.667236328125, -0.5938720703125, -0.5205078125, -0.4471435546875, -0.373779296875, -0.3004150390625, -0.22705078125, -0.1536865234375, -0.080322265625, -0.0069580078125, 0.06640625, 0.1397705078125, 0.213134765625, 0.2864990234375, 0.35986328125, 0.4332275390625, 0.506591796875, 0.5799560546875, 0.6533203125, 0.7266845703125, 0.800048828125, 0.8734130859375, 0.94677734375, 1.0201416015625, 1.093505859375, 1.1668701171875, 1.240234375, 1.3135986328125, 1.386962890625, 1.4603271484375, 1.53369140625, 1.6070556640625, 1.680419921875, 1.7537841796875, 1.8271484375, 1.9005126953125, 1.973876953125, 2.0472412109375, 2.12060546875, 2.1939697265625, 2.267333984375, 2.3406982421875, 2.4140625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 8.0, 9.0, 15.0, 24.0, 28.0, 42.0, 37.0, 63.0, 63.0, 61.0, 82.0, 95.0, 63.0, 73.0, 60.0, 49.0, 45.0, 36.0, 31.0, 10.0, 20.0, 11.0, 15.0, 8.0, 8.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.007071495056152, -5.811352252960205, -5.6156325340271, -5.419913291931152, -5.224194049835205, -5.028474807739258, -4.832755088806152, -4.637035846710205, -4.441316604614258, -4.2455973625183105, -4.049877643585205, -3.854158401489258, -3.6584391593933105, -3.462719678878784, -3.267000198364258, -3.0712809562683105, -2.875561475753784, -2.679841995239258, -2.4841227531433105, -2.288403272628784, -2.092684030532837, -1.8969645500183105, -1.7012451887130737, -1.505525827407837, -1.3098064661026, -1.1140871047973633, -0.9183677434921265, -0.7226483225822449, -0.5269289612770081, -0.33120959997177124, -0.13549017906188965, 0.06022918224334717, 0.255948543548584, 0.4516679048538208, 0.6473872661590576, 0.8431066870689392, 1.0388259887695312, 1.2345454692840576, 1.4302648305892944, 1.6259841918945312, 1.821703553199768, 2.017422914505005, 2.2131423950195312, 2.4088616371154785, 2.604581117630005, 2.800300359725952, 2.9960198402404785, 3.191739082336426, 3.387458562850952, 3.5831780433654785, 3.778897285461426, 3.974616765975952, 4.1703362464904785, 4.366055488586426, 4.561774730682373, 4.75749397277832, 4.953213691711426, 5.148932933807373, 5.3446526527404785, 5.540371894836426, 5.736091136932373, 5.93181037902832, 6.127530097961426, 6.323249340057373, 6.51896858215332]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 8.0, 5.0, 3.0, 9.0, 13.0, 10.0, 21.0, 14.0, 18.0, 19.0, 21.0, 20.0, 30.0, 43.0, 28.0, 34.0, 38.0, 26.0, 44.0, 40.0, 38.0, 41.0, 37.0, 40.0, 35.0, 40.0, 33.0, 39.0, 27.0, 30.0, 26.0, 19.0, 15.0, 20.0, 15.0, 18.0, 10.0, 10.0, 16.0, 15.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.049901962280273, -4.89373779296875, -4.737574100494385, -4.581409931182861, -4.425246238708496, -4.269082069396973, -4.112917900085449, -3.956754207611084, -3.8005900382995605, -3.644426107406616, -3.488262176513672, -3.3320980072021484, -3.175934076309204, -3.0197701454162598, -2.8636062145233154, -2.707442283630371, -2.5512783527374268, -2.3951144218444824, -2.238950490951538, -2.0827865600585938, -1.9266223907470703, -1.770458459854126, -1.6142945289611816, -1.4581304788589478, -1.3019665479660034, -1.145802617073059, -0.9896385669708252, -0.8334746360778809, -0.6773106455802917, -0.5211466550827026, -0.3649827241897583, -0.20881867408752441, -0.05265474319458008, 0.10350923240184784, 0.25967320799827576, 0.4158371686935425, 0.5720011591911316, 0.7281651496887207, 0.884329080581665, 1.040493130683899, 1.1966570615768433, 1.3528209924697876, 1.5089850425720215, 1.6651489734649658, 1.8213129043579102, 1.977476954460144, 2.133640766143799, 2.2898049354553223, 2.4459688663482666, 2.602132797241211, 2.7582967281341553, 2.9144606590270996, 3.070624828338623, 3.2267887592315674, 3.3829526901245117, 3.539116859436035, 3.6952805519104004, 3.8514444828033447, 4.007608413696289, 4.1637725830078125, 4.319936275482178, 4.476100444793701, 4.632264137268066, 4.78842830657959, 4.944592475891113]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 11.0, 10.0, 23.0, 37.0, 57.0, 96.0, 151.0, 262.0, 335.0, 556.0, 824.0, 1218.0, 1852.0, 2827.0, 4290.0, 6703.0, 10448.0, 16340.0, 25270.0, 40707.0, 65048.0, 105214.0, 175073.0, 224275.0, 138533.0, 84180.0, 52635.0, 32749.0, 20830.0, 13444.0, 8729.0, 5527.0, 3556.0, 2299.0, 1553.0, 971.0, 705.0, 421.0, 277.0, 179.0, 131.0, 74.0, 49.0, 29.0, 17.0, 16.0, 10.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-2.1015625, -2.0384063720703125, -1.975250244140625, -1.9120941162109375, -1.84893798828125, -1.7857818603515625, -1.722625732421875, -1.6594696044921875, -1.5963134765625, -1.5331573486328125, -1.470001220703125, -1.4068450927734375, -1.34368896484375, -1.2805328369140625, -1.217376708984375, -1.1542205810546875, -1.091064453125, -1.0279083251953125, -0.964752197265625, -0.9015960693359375, -0.83843994140625, -0.7752838134765625, -0.712127685546875, -0.6489715576171875, -0.5858154296875, -0.5226593017578125, -0.459503173828125, -0.3963470458984375, -0.33319091796875, -0.2700347900390625, -0.206878662109375, -0.1437225341796875, -0.08056640625, -0.0174102783203125, 0.045745849609375, 0.1089019775390625, 0.17205810546875, 0.2352142333984375, 0.298370361328125, 0.3615264892578125, 0.4246826171875, 0.4878387451171875, 0.550994873046875, 0.6141510009765625, 0.67730712890625, 0.7404632568359375, 0.803619384765625, 0.8667755126953125, 0.929931640625, 0.9930877685546875, 1.056243896484375, 1.1194000244140625, 1.18255615234375, 1.2457122802734375, 1.308868408203125, 1.3720245361328125, 1.4351806640625, 1.4983367919921875, 1.561492919921875, 1.6246490478515625, 1.68780517578125, 1.7509613037109375, 1.814117431640625, 1.8772735595703125, 1.9404296875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 1.0, 5.0, 8.0, 9.0, 7.0, 9.0, 14.0, 21.0, 14.0, 18.0, 18.0, 17.0, 33.0, 31.0, 35.0, 28.0, 38.0, 29.0, 40.0, 46.0, 49.0, 41.0, 39.0, 39.0, 41.0, 44.0, 38.0, 34.0, 36.0, 36.0, 28.0, 27.0, 17.0, 16.0, 14.0, 11.0, 17.0, 7.0, 13.0, 6.0, 7.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-5.671875, -5.5030517578125, -5.334228515625, -5.1654052734375, -4.99658203125, -4.8277587890625, -4.658935546875, -4.4901123046875, -4.3212890625, -4.1524658203125, -3.983642578125, -3.8148193359375, -3.64599609375, -3.4771728515625, -3.308349609375, -3.1395263671875, -2.970703125, -2.8018798828125, -2.633056640625, -2.4642333984375, -2.29541015625, -2.1265869140625, -1.957763671875, -1.7889404296875, -1.6201171875, -1.4512939453125, -1.282470703125, -1.1136474609375, -0.94482421875, -0.7760009765625, -0.607177734375, -0.4383544921875, -0.26953125, -0.1007080078125, 0.068115234375, 0.2369384765625, 0.40576171875, 0.5745849609375, 0.743408203125, 0.9122314453125, 1.0810546875, 1.2498779296875, 1.418701171875, 1.5875244140625, 1.75634765625, 1.9251708984375, 2.093994140625, 2.2628173828125, 2.431640625, 2.6004638671875, 2.769287109375, 2.9381103515625, 3.10693359375, 3.2757568359375, 3.444580078125, 3.6134033203125, 3.7822265625, 3.9510498046875, 4.119873046875, 4.2886962890625, 4.45751953125, 4.6263427734375, 4.795166015625, 4.9639892578125, 5.1328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 14.0, 26.0, 25.0, 54.0, 73.0, 116.0, 167.0, 295.0, 414.0, 779.0, 1289.0, 2091.0, 3610.0, 6452.0, 11631.0, 22093.0, 42743.0, 84831.0, 177336.0, 331200.0, 182154.0, 86900.0, 44009.0, 22533.0, 12193.0, 6509.0, 3634.0, 2100.0, 1264.0, 769.0, 446.0, 295.0, 167.0, 96.0, 86.0, 54.0, 32.0, 25.0, 15.0, 11.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.85546875, -2.76190185546875, -2.6683349609375, -2.57476806640625, -2.481201171875, -2.38763427734375, -2.2940673828125, -2.20050048828125, -2.10693359375, -2.01336669921875, -1.9197998046875, -1.82623291015625, -1.732666015625, -1.63909912109375, -1.5455322265625, -1.45196533203125, -1.3583984375, -1.26483154296875, -1.1712646484375, -1.07769775390625, -0.984130859375, -0.89056396484375, -0.7969970703125, -0.70343017578125, -0.60986328125, -0.51629638671875, -0.4227294921875, -0.32916259765625, -0.235595703125, -0.14202880859375, -0.0484619140625, 0.04510498046875, 0.138671875, 0.23223876953125, 0.3258056640625, 0.41937255859375, 0.512939453125, 0.60650634765625, 0.7000732421875, 0.79364013671875, 0.88720703125, 0.98077392578125, 1.0743408203125, 1.16790771484375, 1.261474609375, 1.35504150390625, 1.4486083984375, 1.54217529296875, 1.6357421875, 1.72930908203125, 1.8228759765625, 1.91644287109375, 2.010009765625, 2.10357666015625, 2.1971435546875, 2.29071044921875, 2.38427734375, 2.47784423828125, 2.5714111328125, 2.66497802734375, 2.758544921875, 2.85211181640625, 2.9456787109375, 3.03924560546875, 3.1328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 6.0, 7.0, 15.0, 10.0, 21.0, 18.0, 14.0, 23.0, 28.0, 24.0, 32.0, 20.0, 34.0, 26.0, 28.0, 35.0, 39.0, 45.0, 31.0, 26.0, 38.0, 50.0, 40.0, 28.0, 37.0, 25.0, 33.0, 21.0, 26.0, 26.0, 23.0, 19.0, 14.0, 16.0, 19.0, 13.0, 19.0, 12.0, 5.0, 11.0, 6.0, 6.0, 6.0, 4.0, 10.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-3.146484375, -3.05126953125, -2.9560546875, -2.86083984375, -2.765625, -2.67041015625, -2.5751953125, -2.47998046875, -2.384765625, -2.28955078125, -2.1943359375, -2.09912109375, -2.00390625, -1.90869140625, -1.8134765625, -1.71826171875, -1.623046875, -1.52783203125, -1.4326171875, -1.33740234375, -1.2421875, -1.14697265625, -1.0517578125, -0.95654296875, -0.861328125, -0.76611328125, -0.6708984375, -0.57568359375, -0.48046875, -0.38525390625, -0.2900390625, -0.19482421875, -0.099609375, -0.00439453125, 0.0908203125, 0.18603515625, 0.28125, 0.37646484375, 0.4716796875, 0.56689453125, 0.662109375, 0.75732421875, 0.8525390625, 0.94775390625, 1.04296875, 1.13818359375, 1.2333984375, 1.32861328125, 1.423828125, 1.51904296875, 1.6142578125, 1.70947265625, 1.8046875, 1.89990234375, 1.9951171875, 2.09033203125, 2.185546875, 2.28076171875, 2.3759765625, 2.47119140625, 2.56640625, 2.66162109375, 2.7568359375, 2.85205078125, 2.947265625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 9.0, 15.0, 23.0, 28.0, 67.0, 74.0, 127.0, 193.0, 303.0, 468.0, 830.0, 1416.0, 2439.0, 4430.0, 8159.0, 16518.0, 36976.0, 93899.0, 305196.0, 377477.0, 116129.0, 43780.0, 18943.0, 9401.0, 4989.0, 2719.0, 1554.0, 839.0, 564.0, 344.0, 220.0, 144.0, 76.0, 73.0, 37.0, 24.0, 17.0, 11.0, 11.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0291748046875, -0.028366565704345703, -0.027558326721191406, -0.02675008773803711, -0.025941848754882812, -0.025133609771728516, -0.02432537078857422, -0.023517131805419922, -0.022708892822265625, -0.021900653839111328, -0.02109241485595703, -0.020284175872802734, -0.019475936889648438, -0.01866769790649414, -0.017859458923339844, -0.017051219940185547, -0.01624298095703125, -0.015434741973876953, -0.014626502990722656, -0.01381826400756836, -0.013010025024414062, -0.012201786041259766, -0.011393547058105469, -0.010585308074951172, -0.009777069091796875, -0.008968830108642578, -0.008160591125488281, -0.007352352142333984, -0.0065441131591796875, -0.005735874176025391, -0.004927635192871094, -0.004119396209716797, -0.0033111572265625, -0.002502918243408203, -0.0016946792602539062, -0.0008864402770996094, -7.82012939453125e-05, 0.0007300376892089844, 0.0015382766723632812, 0.002346515655517578, 0.003154754638671875, 0.003962993621826172, 0.004771232604980469, 0.005579471588134766, 0.0063877105712890625, 0.007195949554443359, 0.008004188537597656, 0.008812427520751953, 0.00962066650390625, 0.010428905487060547, 0.011237144470214844, 0.01204538345336914, 0.012853622436523438, 0.013661861419677734, 0.014470100402832031, 0.015278339385986328, 0.016086578369140625, 0.016894817352294922, 0.01770305633544922, 0.018511295318603516, 0.019319534301757812, 0.02012777328491211, 0.020936012268066406, 0.021744251251220703, 0.022552490234375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 18.0, 8.0, 17.0, 11.0, 25.0, 28.0, 47.0, 59.0, 66.0, 69.0, 68.0, 106.0, 75.0, 92.0, 59.0, 56.0, 49.0, 26.0, 18.0, 27.0, 18.0, 12.0, 9.0, 11.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0067901611328125e-06, -4.736706614494324e-06, -4.466623067855835e-06, -4.196539521217346e-06, -3.926455974578857e-06, -3.6563724279403687e-06, -3.38628888130188e-06, -3.116205334663391e-06, -2.8461217880249023e-06, -2.5760382413864136e-06, -2.305954694747925e-06, -2.035871148109436e-06, -1.7657876014709473e-06, -1.4957040548324585e-06, -1.2256205081939697e-06, -9.55536961555481e-07, -6.854534149169922e-07, -4.153698682785034e-07, -1.4528632164001465e-07, 1.2479722499847412e-07, 3.948807716369629e-07, 6.649643182754517e-07, 9.350478649139404e-07, 1.2051314115524292e-06, 1.475214958190918e-06, 1.7452985048294067e-06, 2.0153820514678955e-06, 2.2854655981063843e-06, 2.555549144744873e-06, 2.825632691383362e-06, 3.0957162380218506e-06, 3.3657997846603394e-06, 3.635883331298828e-06, 3.905966877937317e-06, 4.176050424575806e-06, 4.4461339712142944e-06, 4.716217517852783e-06, 4.986301064491272e-06, 5.256384611129761e-06, 5.5264681577682495e-06, 5.796551704406738e-06, 6.066635251045227e-06, 6.336718797683716e-06, 6.606802344322205e-06, 6.876885890960693e-06, 7.146969437599182e-06, 7.417052984237671e-06, 7.68713653087616e-06, 7.957220077514648e-06, 8.227303624153137e-06, 8.497387170791626e-06, 8.767470717430115e-06, 9.037554264068604e-06, 9.307637810707092e-06, 9.577721357345581e-06, 9.84780490398407e-06, 1.0117888450622559e-05, 1.0387971997261047e-05, 1.0658055543899536e-05, 1.0928139090538025e-05, 1.1198222637176514e-05, 1.1468306183815002e-05, 1.1738389730453491e-05, 1.200847327709198e-05, 1.2278556823730469e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 7.0, 10.0, 20.0, 24.0, 38.0, 61.0, 88.0, 116.0, 201.0, 262.0, 463.0, 703.0, 1022.0, 1623.0, 2806.0, 4602.0, 7683.0, 13788.0, 25713.0, 50561.0, 109481.0, 264276.0, 309634.0, 130210.0, 58506.0, 29034.0, 15636.0, 8751.0, 5027.0, 2982.0, 1887.0, 1166.0, 770.0, 459.0, 345.0, 214.0, 128.0, 84.0, 55.0, 42.0, 32.0, 22.0, 11.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0176544189453125, -0.017026185989379883, -0.016397953033447266, -0.01576972007751465, -0.015141487121582031, -0.014513254165649414, -0.013885021209716797, -0.01325678825378418, -0.012628555297851562, -0.012000322341918945, -0.011372089385986328, -0.010743856430053711, -0.010115623474121094, -0.009487390518188477, -0.00885915756225586, -0.008230924606323242, -0.007602691650390625, -0.006974458694458008, -0.006346225738525391, -0.0057179927825927734, -0.005089759826660156, -0.004461526870727539, -0.003833293914794922, -0.0032050609588623047, -0.0025768280029296875, -0.0019485950469970703, -0.0013203620910644531, -0.0006921291351318359, -6.389617919921875e-05, 0.0005643367767333984, 0.0011925697326660156, 0.0018208026885986328, 0.00244903564453125, 0.003077268600463867, 0.0037055015563964844, 0.0043337345123291016, 0.004961967468261719, 0.005590200424194336, 0.006218433380126953, 0.00684666633605957, 0.0074748992919921875, 0.008103132247924805, 0.008731365203857422, 0.009359598159790039, 0.009987831115722656, 0.010616064071655273, 0.01124429702758789, 0.011872529983520508, 0.012500762939453125, 0.013128995895385742, 0.01375722885131836, 0.014385461807250977, 0.015013694763183594, 0.01564192771911621, 0.016270160675048828, 0.016898393630981445, 0.017526626586914062, 0.01815485954284668, 0.018783092498779297, 0.019411325454711914, 0.02003955841064453, 0.02066779136657715, 0.021296024322509766, 0.021924257278442383, 0.022552490234375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 2.0, 1.0, 5.0, 11.0, 4.0, 11.0, 10.0, 19.0, 16.0, 24.0, 28.0, 29.0, 45.0, 53.0, 71.0, 91.0, 99.0, 85.0, 82.0, 72.0, 55.0, 37.0, 32.0, 28.0, 16.0, 17.0, 11.0, 9.0, 5.0, 10.0, 7.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00957489013671875, -0.009306073188781738, -0.009037256240844727, -0.008768439292907715, -0.008499622344970703, -0.008230805397033691, -0.00796198844909668, -0.007693171501159668, -0.007424354553222656, -0.0071555376052856445, -0.006886720657348633, -0.006617903709411621, -0.006349086761474609, -0.006080269813537598, -0.005811452865600586, -0.005542635917663574, -0.0052738189697265625, -0.005005002021789551, -0.004736185073852539, -0.004467368125915527, -0.004198551177978516, -0.003929734230041504, -0.003660917282104492, -0.0033921003341674805, -0.0031232833862304688, -0.002854466438293457, -0.0025856494903564453, -0.0023168325424194336, -0.002048015594482422, -0.0017791986465454102, -0.0015103816986083984, -0.0012415647506713867, -0.000972747802734375, -0.0007039308547973633, -0.00043511390686035156, -0.00016629695892333984, 0.00010251998901367188, 0.0003713369369506836, 0.0006401538848876953, 0.000908970832824707, 0.0011777877807617188, 0.0014466047286987305, 0.0017154216766357422, 0.001984238624572754, 0.0022530555725097656, 0.0025218725204467773, 0.002790689468383789, 0.0030595064163208008, 0.0033283233642578125, 0.0035971403121948242, 0.003865957260131836, 0.004134774208068848, 0.004403591156005859, 0.004672408103942871, 0.004941225051879883, 0.0052100419998168945, 0.005478858947753906, 0.005747675895690918, 0.00601649284362793, 0.006285309791564941, 0.006554126739501953, 0.006822943687438965, 0.0070917606353759766, 0.007360577583312988, 0.00762939453125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 5.0, 12.0, 9.0, 13.0, 30.0, 32.0, 45.0, 44.0, 62.0, 65.0, 73.0, 88.0, 93.0, 70.0, 65.0, 61.0, 39.0, 49.0, 24.0, 21.0, 19.0, 8.0, 13.0, 11.0, 8.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.323980808258057, -6.121556758880615, -5.919132709503174, -5.716708660125732, -5.514284133911133, -5.311860084533691, -5.10943603515625, -4.907011985778809, -4.704587936401367, -4.502163887023926, -4.299739837646484, -4.097315788269043, -3.8948915004730225, -3.692467451095581, -3.4900431632995605, -3.287619113922119, -3.0851950645446777, -2.8827710151672363, -2.680346965789795, -2.4779226779937744, -2.275498628616333, -2.0730745792388916, -1.8706504106521606, -1.6682262420654297, -1.4658021926879883, -1.2633781433105469, -1.060953974723816, -0.8585298657417297, -0.6561057567596436, -0.45368170738220215, -0.2512575387954712, -0.048833370208740234, 0.15359020233154297, 0.35601431131362915, 0.5584384202957153, 0.7608625292778015, 0.9632866382598877, 1.165710687637329, 1.36813485622406, 1.570559024810791, 1.7729830741882324, 1.9754071235656738, 2.1778311729431152, 2.3802554607391357, 2.582679510116577, 2.7851035594940186, 2.987527847290039, 3.1899518966674805, 3.392375946044922, 3.5947999954223633, 3.7972240447998047, 3.999648332595825, 4.2020721435546875, 4.404496192932129, 4.6069207191467285, 4.80934476852417, 5.011768817901611, 5.214192867279053, 5.416616916656494, 5.6190409660339355, 5.821465492248535, 6.023889541625977, 6.226313591003418, 6.428737640380859, 6.631161689758301]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 5.0, 8.0, 3.0, 7.0, 15.0, 9.0, 18.0, 18.0, 17.0, 19.0, 20.0, 22.0, 27.0, 46.0, 28.0, 33.0, 38.0, 26.0, 40.0, 43.0, 39.0, 40.0, 37.0, 41.0, 37.0, 36.0, 34.0, 42.0, 26.0, 28.0, 27.0, 19.0, 15.0, 21.0, 15.0, 18.0, 9.0, 11.0, 16.0, 14.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.010387420654297, -4.854788780212402, -4.699190616607666, -4.5435919761657715, -4.387993335723877, -4.232395172119141, -4.076796531677246, -3.9211978912353516, -3.765599489212036, -3.6100010871887207, -3.454402446746826, -3.2988040447235107, -3.1432056427001953, -2.987607002258301, -2.8320086002349854, -2.67641019821167, -2.5208115577697754, -2.36521315574646, -2.2096145153045654, -2.05401611328125, -1.898417592048645, -1.74281907081604, -1.5872206687927246, -1.4316221475601196, -1.2760236263275146, -1.1204251050949097, -0.9648266434669495, -0.8092281818389893, -0.6536296606063843, -0.4980311393737793, -0.3424326777458191, -0.1868342161178589, -0.031235694885253906, 0.12436279654502869, 0.2799612879753113, 0.43555977940559387, 0.5911582708358765, 0.7467567920684814, 0.9023552536964417, 1.0579537153244019, 1.2135522365570068, 1.3691507577896118, 1.5247492790222168, 1.6803476810455322, 1.8359462022781372, 1.9915447235107422, 2.1471431255340576, 2.302741527557373, 2.4583401679992676, 2.613938570022583, 2.7695372104644775, 2.925135612487793, 3.0807342529296875, 3.236332654953003, 3.3919310569763184, 3.547529697418213, 3.7031280994415283, 3.8587265014648438, 4.014325141906738, 4.169923782348633, 4.325521945953369, 4.481120586395264, 4.636719226837158, 4.7923173904418945, 4.947916030883789]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 12.0, 27.0, 35.0, 43.0, 50.0, 93.0, 153.0, 180.0, 313.0, 484.0, 727.0, 1108.0, 1703.0, 2557.0, 4057.0, 6213.0, 9869.0, 16166.0, 26363.0, 44139.0, 74924.0, 125108.0, 184561.0, 194378.0, 140672.0, 85583.0, 50267.0, 29817.0, 18333.0, 11106.0, 6982.0, 4533.0, 2740.0, 1788.0, 1169.0, 771.0, 526.0, 344.0, 217.0, 148.0, 92.0, 54.0, 40.0, 31.0, 23.0, 17.0, 6.0, 6.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.7109375, -7.4549560546875, -7.198974609375, -6.9429931640625, -6.68701171875, -6.4310302734375, -6.175048828125, -5.9190673828125, -5.6630859375, -5.4071044921875, -5.151123046875, -4.8951416015625, -4.63916015625, -4.3831787109375, -4.127197265625, -3.8712158203125, -3.615234375, -3.3592529296875, -3.103271484375, -2.8472900390625, -2.59130859375, -2.3353271484375, -2.079345703125, -1.8233642578125, -1.5673828125, -1.3114013671875, -1.055419921875, -0.7994384765625, -0.54345703125, -0.2874755859375, -0.031494140625, 0.2244873046875, 0.48046875, 0.7364501953125, 0.992431640625, 1.2484130859375, 1.50439453125, 1.7603759765625, 2.016357421875, 2.2723388671875, 2.5283203125, 2.7843017578125, 3.040283203125, 3.2962646484375, 3.55224609375, 3.8082275390625, 4.064208984375, 4.3201904296875, 4.576171875, 4.8321533203125, 5.088134765625, 5.3441162109375, 5.60009765625, 5.8560791015625, 6.112060546875, 6.3680419921875, 6.6240234375, 6.8800048828125, 7.135986328125, 7.3919677734375, 7.64794921875, 7.9039306640625, 8.159912109375, 8.4158935546875, 8.671875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 7.0, 3.0, 9.0, 10.0, 12.0, 18.0, 16.0, 15.0, 13.0, 24.0, 29.0, 33.0, 31.0, 35.0, 35.0, 29.0, 40.0, 44.0, 45.0, 51.0, 37.0, 41.0, 36.0, 44.0, 39.0, 34.0, 34.0, 34.0, 24.0, 24.0, 18.0, 18.0, 14.0, 19.0, 10.0, 13.0, 10.0, 12.0, 10.0, 13.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.91796875, -4.75970458984375, -4.6014404296875, -4.44317626953125, -4.284912109375, -4.12664794921875, -3.9683837890625, -3.81011962890625, -3.65185546875, -3.49359130859375, -3.3353271484375, -3.17706298828125, -3.018798828125, -2.86053466796875, -2.7022705078125, -2.54400634765625, -2.3857421875, -2.22747802734375, -2.0692138671875, -1.91094970703125, -1.752685546875, -1.59442138671875, -1.4361572265625, -1.27789306640625, -1.11962890625, -0.96136474609375, -0.8031005859375, -0.64483642578125, -0.486572265625, -0.32830810546875, -0.1700439453125, -0.01177978515625, 0.146484375, 0.30474853515625, 0.4630126953125, 0.62127685546875, 0.779541015625, 0.93780517578125, 1.0960693359375, 1.25433349609375, 1.41259765625, 1.57086181640625, 1.7291259765625, 1.88739013671875, 2.045654296875, 2.20391845703125, 2.3621826171875, 2.52044677734375, 2.6787109375, 2.83697509765625, 2.9952392578125, 3.15350341796875, 3.311767578125, 3.47003173828125, 3.6282958984375, 3.78656005859375, 3.94482421875, 4.10308837890625, 4.2613525390625, 4.41961669921875, 4.577880859375, 4.73614501953125, 4.8944091796875, 5.05267333984375, 5.2109375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 9.0, 19.0, 15.0, 28.0, 39.0, 63.0, 90.0, 122.0, 198.0, 258.0, 333.0, 477.0, 645.0, 973.0, 1327.0, 1792.0, 2635.0, 3681.0, 5249.0, 7796.0, 11428.0, 16596.0, 24764.0, 37505.0, 56421.0, 83774.0, 120063.0, 149108.0, 149245.0, 119259.0, 83636.0, 55514.0, 36926.0, 24969.0, 16619.0, 11267.0, 7651.0, 5295.0, 3655.0, 2611.0, 1853.0, 1368.0, 948.0, 679.0, 505.0, 357.0, 221.0, 172.0, 136.0, 78.0, 61.0, 54.0, 32.0, 13.0, 19.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0], "bins": [-6.1328125, -5.9349365234375, -5.737060546875, -5.5391845703125, -5.34130859375, -5.1434326171875, -4.945556640625, -4.7476806640625, -4.5498046875, -4.3519287109375, -4.154052734375, -3.9561767578125, -3.75830078125, -3.5604248046875, -3.362548828125, -3.1646728515625, -2.966796875, -2.7689208984375, -2.571044921875, -2.3731689453125, -2.17529296875, -1.9774169921875, -1.779541015625, -1.5816650390625, -1.3837890625, -1.1859130859375, -0.988037109375, -0.7901611328125, -0.59228515625, -0.3944091796875, -0.196533203125, 0.0013427734375, 0.19921875, 0.3970947265625, 0.594970703125, 0.7928466796875, 0.99072265625, 1.1885986328125, 1.386474609375, 1.5843505859375, 1.7822265625, 1.9801025390625, 2.177978515625, 2.3758544921875, 2.57373046875, 2.7716064453125, 2.969482421875, 3.1673583984375, 3.365234375, 3.5631103515625, 3.760986328125, 3.9588623046875, 4.15673828125, 4.3546142578125, 4.552490234375, 4.7503662109375, 4.9482421875, 5.1461181640625, 5.343994140625, 5.5418701171875, 5.73974609375, 5.9376220703125, 6.135498046875, 6.3333740234375, 6.53125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 7.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 10.0, 8.0, 7.0, 15.0, 22.0, 11.0, 17.0, 21.0, 27.0, 26.0, 21.0, 32.0, 33.0, 19.0, 29.0, 25.0, 31.0, 31.0, 26.0, 35.0, 35.0, 28.0, 41.0, 35.0, 35.0, 40.0, 24.0, 28.0, 34.0, 33.0, 20.0, 23.0, 19.0, 24.0, 14.0, 15.0, 10.0, 15.0, 13.0, 10.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-2.669921875, -2.582489013671875, -2.49505615234375, -2.407623291015625, -2.3201904296875, -2.232757568359375, -2.14532470703125, -2.057891845703125, -1.970458984375, -1.883026123046875, -1.79559326171875, -1.708160400390625, -1.6207275390625, -1.533294677734375, -1.44586181640625, -1.358428955078125, -1.27099609375, -1.183563232421875, -1.09613037109375, -1.008697509765625, -0.9212646484375, -0.833831787109375, -0.74639892578125, -0.658966064453125, -0.571533203125, -0.484100341796875, -0.39666748046875, -0.309234619140625, -0.2218017578125, -0.134368896484375, -0.04693603515625, 0.040496826171875, 0.1279296875, 0.215362548828125, 0.30279541015625, 0.390228271484375, 0.4776611328125, 0.565093994140625, 0.65252685546875, 0.739959716796875, 0.827392578125, 0.914825439453125, 1.00225830078125, 1.089691162109375, 1.1771240234375, 1.264556884765625, 1.35198974609375, 1.439422607421875, 1.52685546875, 1.614288330078125, 1.70172119140625, 1.789154052734375, 1.8765869140625, 1.964019775390625, 2.05145263671875, 2.138885498046875, 2.226318359375, 2.313751220703125, 2.40118408203125, 2.488616943359375, 2.5760498046875, 2.663482666015625, 2.75091552734375, 2.838348388671875, 2.92578125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 7.0, 5.0, 10.0, 22.0, 27.0, 28.0, 41.0, 55.0, 83.0, 111.0, 159.0, 195.0, 299.0, 422.0, 586.0, 811.0, 1276.0, 1879.0, 2920.0, 4607.0, 7405.0, 12269.0, 21694.0, 41501.0, 99513.0, 343388.0, 321843.0, 94402.0, 40180.0, 20683.0, 11721.0, 7192.0, 4404.0, 2814.0, 1820.0, 1250.0, 877.0, 577.0, 444.0, 284.0, 238.0, 144.0, 107.0, 78.0, 54.0, 41.0, 28.0, 19.0, 19.0, 10.0, 5.0, 4.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.171875, -2.10394287109375, -2.0360107421875, -1.96807861328125, -1.900146484375, -1.83221435546875, -1.7642822265625, -1.69635009765625, -1.62841796875, -1.56048583984375, -1.4925537109375, -1.42462158203125, -1.356689453125, -1.28875732421875, -1.2208251953125, -1.15289306640625, -1.0849609375, -1.01702880859375, -0.9490966796875, -0.88116455078125, -0.813232421875, -0.74530029296875, -0.6773681640625, -0.60943603515625, -0.54150390625, -0.47357177734375, -0.4056396484375, -0.33770751953125, -0.269775390625, -0.20184326171875, -0.1339111328125, -0.06597900390625, 0.001953125, 0.06988525390625, 0.1378173828125, 0.20574951171875, 0.273681640625, 0.34161376953125, 0.4095458984375, 0.47747802734375, 0.54541015625, 0.61334228515625, 0.6812744140625, 0.74920654296875, 0.817138671875, 0.88507080078125, 0.9530029296875, 1.02093505859375, 1.0888671875, 1.15679931640625, 1.2247314453125, 1.29266357421875, 1.360595703125, 1.42852783203125, 1.4964599609375, 1.56439208984375, 1.63232421875, 1.70025634765625, 1.7681884765625, 1.83612060546875, 1.904052734375, 1.97198486328125, 2.0399169921875, 2.10784912109375, 2.17578125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 13.0, 18.0, 14.0, 16.0, 24.0, 45.0, 54.0, 85.0, 108.0, 111.0, 89.0, 82.0, 68.0, 63.0, 34.0, 27.0, 18.0, 17.0, 22.0, 12.0, 14.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0001537799835205078, -0.00014959275722503662, -0.00014540553092956543, -0.00014121830463409424, -0.00013703107833862305, -0.00013284385204315186, -0.00012865662574768066, -0.00012446939945220947, -0.00012028217315673828, -0.00011609494686126709, -0.0001119077205657959, -0.00010772049427032471, -0.00010353326797485352, -9.934604167938232e-05, -9.515881538391113e-05, -9.097158908843994e-05, -8.678436279296875e-05, -8.259713649749756e-05, -7.840991020202637e-05, -7.422268390655518e-05, -7.003545761108398e-05, -6.584823131561279e-05, -6.16610050201416e-05, -5.747377872467041e-05, -5.328655242919922e-05, -4.909932613372803e-05, -4.4912099838256836e-05, -4.0724873542785645e-05, -3.653764724731445e-05, -3.235042095184326e-05, -2.816319465637207e-05, -2.397596836090088e-05, -1.9788742065429688e-05, -1.5601515769958496e-05, -1.1414289474487305e-05, -7.227063179016113e-06, -3.039836883544922e-06, 1.1473894119262695e-06, 5.334615707397461e-06, 9.521842002868652e-06, 1.3709068298339844e-05, 1.7896294593811035e-05, 2.2083520889282227e-05, 2.6270747184753418e-05, 3.045797348022461e-05, 3.46451997756958e-05, 3.883242607116699e-05, 4.3019652366638184e-05, 4.7206878662109375e-05, 5.1394104957580566e-05, 5.558133125305176e-05, 5.976855754852295e-05, 6.395578384399414e-05, 6.814301013946533e-05, 7.233023643493652e-05, 7.651746273040771e-05, 8.07046890258789e-05, 8.48919153213501e-05, 8.907914161682129e-05, 9.326636791229248e-05, 9.745359420776367e-05, 0.00010164082050323486, 0.00010582804679870605, 0.00011001527309417725, 0.00011420249938964844]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 9.0, 11.0, 17.0, 17.0, 36.0, 37.0, 57.0, 78.0, 119.0, 160.0, 267.0, 387.0, 516.0, 806.0, 1159.0, 1824.0, 2942.0, 4638.0, 7311.0, 12537.0, 23040.0, 49315.0, 147910.0, 467283.0, 203289.0, 61321.0, 26791.0, 13930.0, 8175.0, 5157.0, 3192.0, 2060.0, 1316.0, 964.0, 549.0, 415.0, 292.0, 190.0, 131.0, 81.0, 70.0, 37.0, 34.0, 30.0, 12.0, 16.0, 10.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.314453125, -2.241241455078125, -2.16802978515625, -2.094818115234375, -2.0216064453125, -1.948394775390625, -1.87518310546875, -1.801971435546875, -1.728759765625, -1.655548095703125, -1.58233642578125, -1.509124755859375, -1.4359130859375, -1.362701416015625, -1.28948974609375, -1.216278076171875, -1.14306640625, -1.069854736328125, -0.99664306640625, -0.923431396484375, -0.8502197265625, -0.777008056640625, -0.70379638671875, -0.630584716796875, -0.557373046875, -0.484161376953125, -0.41094970703125, -0.337738037109375, -0.2645263671875, -0.191314697265625, -0.11810302734375, -0.044891357421875, 0.0283203125, 0.101531982421875, 0.17474365234375, 0.247955322265625, 0.3211669921875, 0.394378662109375, 0.46759033203125, 0.540802001953125, 0.614013671875, 0.687225341796875, 0.76043701171875, 0.833648681640625, 0.9068603515625, 0.980072021484375, 1.05328369140625, 1.126495361328125, 1.19970703125, 1.272918701171875, 1.34613037109375, 1.419342041015625, 1.4925537109375, 1.565765380859375, 1.63897705078125, 1.712188720703125, 1.785400390625, 1.858612060546875, 1.93182373046875, 2.005035400390625, 2.0782470703125, 2.151458740234375, 2.22467041015625, 2.297882080078125, 2.37109375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 9.0, 6.0, 8.0, 12.0, 10.0, 12.0, 13.0, 16.0, 37.0, 37.0, 48.0, 65.0, 97.0, 101.0, 128.0, 102.0, 51.0, 50.0, 30.0, 24.0, 25.0, 14.0, 11.0, 12.0, 13.0, 11.0, 7.0, 11.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7861328125, -0.7629928588867188, -0.7398529052734375, -0.7167129516601562, -0.693572998046875, -0.6704330444335938, -0.6472930908203125, -0.6241531372070312, -0.60101318359375, -0.5778732299804688, -0.5547332763671875, -0.5315933227539062, -0.508453369140625, -0.48531341552734375, -0.4621734619140625, -0.43903350830078125, -0.4158935546875, -0.39275360107421875, -0.3696136474609375, -0.34647369384765625, -0.323333740234375, -0.30019378662109375, -0.2770538330078125, -0.25391387939453125, -0.23077392578125, -0.20763397216796875, -0.1844940185546875, -0.16135406494140625, -0.138214111328125, -0.11507415771484375, -0.0919342041015625, -0.06879425048828125, -0.045654296875, -0.02251434326171875, 0.0006256103515625, 0.02376556396484375, 0.046905517578125, 0.07004547119140625, 0.0931854248046875, 0.11632537841796875, 0.13946533203125, 0.16260528564453125, 0.1857452392578125, 0.20888519287109375, 0.232025146484375, 0.25516510009765625, 0.2783050537109375, 0.30144500732421875, 0.3245849609375, 0.34772491455078125, 0.3708648681640625, 0.39400482177734375, 0.417144775390625, 0.44028472900390625, 0.4634246826171875, 0.48656463623046875, 0.50970458984375, 0.5328445434570312, 0.5559844970703125, 0.5791244506835938, 0.602264404296875, 0.6254043579101562, 0.6485443115234375, 0.6716842651367188, 0.69482421875]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 4.0, 7.0, 15.0, 16.0, 26.0, 24.0, 38.0, 43.0, 69.0, 67.0, 101.0, 79.0, 105.0, 76.0, 58.0, 65.0, 50.0, 25.0, 25.0, 27.0, 14.0, 14.0, 7.0, 13.0, 8.0, 8.0, 3.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79243803024292, -5.571795463562012, -5.3511528968811035, -5.130510330200195, -4.909867763519287, -4.689225196838379, -4.468583106994629, -4.2479400634765625, -4.0272979736328125, -3.8066554069519043, -3.586012840270996, -3.365370273590088, -3.1447277069091797, -2.9240851402282715, -2.7034428119659424, -2.482800245285034, -2.262157440185547, -2.0415148735046387, -1.8208723068237305, -1.6002298593521118, -1.3795872926712036, -1.1589447259902954, -0.9383022785186768, -0.7176597118377686, -0.49701714515686035, -0.27637460827827454, -0.05573207139968872, 0.1649104356765747, 0.3855530023574829, 0.6061955690383911, 0.8268380165100098, 1.047480583190918, 1.2681236267089844, 1.4887661933898926, 1.7094087600708008, 1.9300512075424194, 2.150693893432617, 2.3713364601135254, 2.5919787883758545, 2.8126213550567627, 3.033263921737671, 3.253906488418579, 3.4745490550994873, 3.6951913833618164, 3.9158339500427246, 4.136476516723633, 4.357119083404541, 4.577761650085449, 4.798404216766357, 5.019046783447266, 5.239689350128174, 5.460331916809082, 5.68097448348999, 5.901617050170898, 6.122259140014648, 6.342902183532715, 6.563544273376465, 6.784186840057373, 7.004829406738281, 7.2254719734191895, 7.446114540100098, 7.666757106781006, 7.887399673461914, 8.108041763305664, 8.32868480682373]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 6.0, 17.0, 13.0, 15.0, 14.0, 20.0, 20.0, 20.0, 22.0, 28.0, 27.0, 38.0, 30.0, 37.0, 43.0, 37.0, 49.0, 41.0, 38.0, 38.0, 35.0, 41.0, 42.0, 43.0, 40.0, 36.0, 23.0, 21.0, 25.0, 16.0, 16.0, 19.0, 18.0, 9.0, 9.0, 8.0, 12.0, 11.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.911592483520508, -5.738431930541992, -5.565271854400635, -5.392111301422119, -5.218951225280762, -5.045790672302246, -4.8726301193237305, -4.699469566345215, -4.526309490203857, -4.353148937225342, -4.179988861083984, -4.006828308105469, -3.8336679935455322, -3.6605076789855957, -3.48734712600708, -3.3141868114471436, -3.141026496887207, -2.9678661823272705, -2.794705867767334, -2.6215453147888184, -2.448385000228882, -2.2752246856689453, -2.1020641326904297, -1.9289038181304932, -1.7557435035705566, -1.5825831890106201, -1.409422755241394, -1.236262321472168, -1.0631020069122314, -0.8899416327476501, -0.7167812585830688, -0.5436208248138428, -0.37046003341674805, -0.19729965925216675, -0.02413928508758545, 0.14902108907699585, 0.32218146324157715, 0.49534183740615845, 0.6685022115707397, 0.8416626453399658, 1.0148229598999023, 1.1879832744598389, 1.361143708229065, 1.534304141998291, 1.7074644565582275, 1.880624771118164, 2.0537853240966797, 2.226945638656616, 2.4001059532165527, 2.5732662677764893, 2.746426582336426, 2.9195871353149414, 3.092747449874878, 3.2659077644348145, 3.43906831741333, 3.6122286319732666, 3.785388946533203, 3.9585492610931396, 4.131709575653076, 4.304870128631592, 4.478030204772949, 4.651190757751465, 4.8243513107299805, 4.997511863708496, 5.1706719398498535]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 5.0, 5.0, 12.0, 9.0, 20.0, 23.0, 37.0, 61.0, 76.0, 116.0, 188.0, 283.0, 400.0, 659.0, 937.0, 1497.0, 2241.0, 3535.0, 5500.0, 8566.0, 13734.0, 22349.0, 36826.0, 63641.0, 114500.0, 235645.0, 627487.0, 1344276.0, 976445.0, 363764.0, 158913.0, 86002.0, 49294.0, 29000.0, 17695.0, 11063.0, 7043.0, 4423.0, 2770.0, 1815.0, 1199.0, 750.0, 501.0, 362.0, 213.0, 143.0, 89.0, 69.0, 32.0, 26.0, 20.0, 15.0, 5.0, 9.0, 2.0, 2.0, 1.0, 2.0], "bins": [-7.60546875, -7.3800048828125, -7.154541015625, -6.9290771484375, -6.70361328125, -6.4781494140625, -6.252685546875, -6.0272216796875, -5.8017578125, -5.5762939453125, -5.350830078125, -5.1253662109375, -4.89990234375, -4.6744384765625, -4.448974609375, -4.2235107421875, -3.998046875, -3.7725830078125, -3.547119140625, -3.3216552734375, -3.09619140625, -2.8707275390625, -2.645263671875, -2.4197998046875, -2.1943359375, -1.9688720703125, -1.743408203125, -1.5179443359375, -1.29248046875, -1.0670166015625, -0.841552734375, -0.6160888671875, -0.390625, -0.1651611328125, 0.060302734375, 0.2857666015625, 0.51123046875, 0.7366943359375, 0.962158203125, 1.1876220703125, 1.4130859375, 1.6385498046875, 1.864013671875, 2.0894775390625, 2.31494140625, 2.5404052734375, 2.765869140625, 2.9913330078125, 3.216796875, 3.4422607421875, 3.667724609375, 3.8931884765625, 4.11865234375, 4.3441162109375, 4.569580078125, 4.7950439453125, 5.0205078125, 5.2459716796875, 5.471435546875, 5.6968994140625, 5.92236328125, 6.1478271484375, 6.373291015625, 6.5987548828125, 6.82421875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 8.0, 5.0, 9.0, 8.0, 15.0, 18.0, 16.0, 15.0, 19.0, 27.0, 30.0, 26.0, 30.0, 33.0, 43.0, 52.0, 46.0, 44.0, 35.0, 41.0, 44.0, 47.0, 44.0, 52.0, 25.0, 41.0, 39.0, 28.0, 27.0, 23.0, 13.0, 18.0, 17.0, 12.0, 18.0, 5.0, 10.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.5859375, -5.4224853515625, -5.259033203125, -5.0955810546875, -4.93212890625, -4.7686767578125, -4.605224609375, -4.4417724609375, -4.2783203125, -4.1148681640625, -3.951416015625, -3.7879638671875, -3.62451171875, -3.4610595703125, -3.297607421875, -3.1341552734375, -2.970703125, -2.8072509765625, -2.643798828125, -2.4803466796875, -2.31689453125, -2.1534423828125, -1.989990234375, -1.8265380859375, -1.6630859375, -1.4996337890625, -1.336181640625, -1.1727294921875, -1.00927734375, -0.8458251953125, -0.682373046875, -0.5189208984375, -0.35546875, -0.1920166015625, -0.028564453125, 0.1348876953125, 0.29833984375, 0.4617919921875, 0.625244140625, 0.7886962890625, 0.9521484375, 1.1156005859375, 1.279052734375, 1.4425048828125, 1.60595703125, 1.7694091796875, 1.932861328125, 2.0963134765625, 2.259765625, 2.4232177734375, 2.586669921875, 2.7501220703125, 2.91357421875, 3.0770263671875, 3.240478515625, 3.4039306640625, 3.5673828125, 3.7308349609375, 3.894287109375, 4.0577392578125, 4.22119140625, 4.3846435546875, 4.548095703125, 4.7115478515625, 4.875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 10.0, 9.0, 18.0, 27.0, 47.0, 66.0, 115.0, 165.0, 259.0, 397.0, 626.0, 998.0, 1493.0, 2400.0, 3915.0, 6327.0, 10324.0, 17419.0, 29308.0, 50320.0, 91918.0, 171700.0, 338948.0, 707677.0, 1236706.0, 755343.0, 359081.0, 181441.0, 97040.0, 53628.0, 30785.0, 17848.0, 10732.0, 6503.0, 3902.0, 2511.0, 1519.0, 998.0, 673.0, 409.0, 236.0, 156.0, 117.0, 64.0, 37.0, 25.0, 22.0, 14.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.599365234375, -6.39013671875, -6.180908203125, -5.9716796875, -5.762451171875, -5.55322265625, -5.343994140625, -5.134765625, -4.925537109375, -4.71630859375, -4.507080078125, -4.2978515625, -4.088623046875, -3.87939453125, -3.670166015625, -3.4609375, -3.251708984375, -3.04248046875, -2.833251953125, -2.6240234375, -2.414794921875, -2.20556640625, -1.996337890625, -1.787109375, -1.577880859375, -1.36865234375, -1.159423828125, -0.9501953125, -0.740966796875, -0.53173828125, -0.322509765625, -0.11328125, 0.095947265625, 0.30517578125, 0.514404296875, 0.7236328125, 0.932861328125, 1.14208984375, 1.351318359375, 1.560546875, 1.769775390625, 1.97900390625, 2.188232421875, 2.3974609375, 2.606689453125, 2.81591796875, 3.025146484375, 3.234375, 3.443603515625, 3.65283203125, 3.862060546875, 4.0712890625, 4.280517578125, 4.48974609375, 4.698974609375, 4.908203125, 5.117431640625, 5.32666015625, 5.535888671875, 5.7451171875, 5.954345703125, 6.16357421875, 6.372802734375, 6.58203125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 4.0, 7.0, 5.0, 9.0, 10.0, 7.0, 10.0, 29.0, 29.0, 43.0, 31.0, 60.0, 66.0, 79.0, 104.0, 118.0, 147.0, 145.0, 197.0, 228.0, 252.0, 329.0, 339.0, 284.0, 252.0, 226.0, 203.0, 137.0, 138.0, 107.0, 81.0, 68.0, 78.0, 52.0, 40.0, 33.0, 24.0, 34.0, 15.0, 11.0, 13.0, 5.0, 5.0, 7.0, 7.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.515625, -2.43499755859375, -2.3543701171875, -2.27374267578125, -2.193115234375, -2.11248779296875, -2.0318603515625, -1.95123291015625, -1.87060546875, -1.78997802734375, -1.7093505859375, -1.62872314453125, -1.548095703125, -1.46746826171875, -1.3868408203125, -1.30621337890625, -1.2255859375, -1.14495849609375, -1.0643310546875, -0.98370361328125, -0.903076171875, -0.82244873046875, -0.7418212890625, -0.66119384765625, -0.58056640625, -0.49993896484375, -0.4193115234375, -0.33868408203125, -0.258056640625, -0.17742919921875, -0.0968017578125, -0.01617431640625, 0.064453125, 0.14508056640625, 0.2257080078125, 0.30633544921875, 0.386962890625, 0.46759033203125, 0.5482177734375, 0.62884521484375, 0.70947265625, 0.79010009765625, 0.8707275390625, 0.95135498046875, 1.031982421875, 1.11260986328125, 1.1932373046875, 1.27386474609375, 1.3544921875, 1.43511962890625, 1.5157470703125, 1.59637451171875, 1.677001953125, 1.75762939453125, 1.8382568359375, 1.91888427734375, 1.99951171875, 2.08013916015625, 2.1607666015625, 2.24139404296875, 2.322021484375, 2.40264892578125, 2.4832763671875, 2.56390380859375, 2.64453125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 12.0, 9.0, 14.0, 18.0, 19.0, 25.0, 33.0, 51.0, 54.0, 70.0, 75.0, 74.0, 79.0, 78.0, 82.0, 56.0, 40.0, 43.0, 29.0, 28.0, 21.0, 22.0, 12.0, 5.0, 4.0, 9.0, 8.0, 11.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.108372211456299, -5.914872169494629, -5.721371650695801, -5.527871608734131, -5.334371566772461, -5.140871524810791, -4.947371006011963, -4.753870964050293, -4.560370922088623, -4.366870880126953, -4.173370361328125, -3.979870319366455, -3.786370277404785, -3.592869997024536, -3.399369716644287, -3.205869674682617, -3.012369394302368, -2.818869113922119, -2.625369071960449, -2.4318687915802, -2.2383687496185303, -2.0448684692382812, -1.8513683080673218, -1.6578681468963623, -1.4643679857254028, -1.2708678245544434, -1.0773676633834839, -0.8838674426078796, -0.6903672814369202, -0.4968671202659607, -0.30336689949035645, -0.10986673831939697, 0.0836334228515625, 0.277133584022522, 0.47063377499580383, 0.6641339659690857, 0.8576341271400452, 1.0511343479156494, 1.2446345090866089, 1.4381346702575684, 1.6316348314285278, 1.8251349925994873, 2.0186352729797363, 2.2121353149414062, 2.4056355953216553, 2.599135637283325, 2.792635917663574, 2.986135959625244, 3.179636240005493, 3.373136520385742, 3.566636562347412, 3.760136842727661, 3.953636884689331, 4.14713716506958, 4.34063720703125, 4.534137725830078, 4.727637767791748, 4.921137809753418, 5.114638328552246, 5.308138370513916, 5.501638412475586, 5.695138454437256, 5.888638973236084, 6.082139015197754, 6.275639057159424]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 5.0, 9.0, 12.0, 8.0, 12.0, 9.0, 21.0, 20.0, 16.0, 31.0, 25.0, 25.0, 35.0, 34.0, 37.0, 49.0, 40.0, 41.0, 58.0, 35.0, 45.0, 45.0, 31.0, 54.0, 38.0, 36.0, 35.0, 31.0, 21.0, 24.0, 16.0, 18.0, 18.0, 10.0, 17.0, 7.0, 9.0, 7.0, 6.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0943074226379395, -4.915544509887695, -4.736781597137451, -4.558018684387207, -4.379255771636963, -4.200492858886719, -4.021730422973633, -3.8429672718048096, -3.6642043590545654, -3.4854414463043213, -3.306678533554077, -3.127915859222412, -2.949152946472168, -2.770390033721924, -2.5916271209716797, -2.4128642082214355, -2.2341012954711914, -2.0553383827209473, -1.8765754699707031, -1.6978126764297485, -1.5190497636795044, -1.3402868509292603, -1.1615240573883057, -0.9827611446380615, -0.8039982318878174, -0.6252353191375732, -0.4464724659919739, -0.2677096128463745, -0.08894670009613037, 0.08981621265411377, 0.26857900619506836, 0.4473419189453125, 0.6261053085327148, 0.804868221282959, 0.9836310744285583, 1.1623939275741577, 1.3411568403244019, 1.519919753074646, 1.6986825466156006, 1.8774454593658447, 2.056208372116089, 2.234971284866333, 2.413734197616577, 2.592496871948242, 2.7712597846984863, 2.9500226974487305, 3.1287856101989746, 3.3075485229492188, 3.486311435699463, 3.665074348449707, 3.843837261199951, 4.022600173950195, 4.2013630867004395, 4.380125999450684, 4.5588884353637695, 4.737651824951172, 4.916414260864258, 5.095177173614502, 5.273940086364746, 5.45270299911499, 5.631465911865234, 5.8102288246154785, 5.988991737365723, 6.167754173278809, 6.346517562866211]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 8.0, 12.0, 19.0, 36.0, 52.0, 81.0, 107.0, 179.0, 300.0, 435.0, 750.0, 1157.0, 1770.0, 2740.0, 4218.0, 6829.0, 10969.0, 16944.0, 26865.0, 42632.0, 68034.0, 112047.0, 191262.0, 219169.0, 130422.0, 78471.0, 49398.0, 30780.0, 19381.0, 12263.0, 7682.0, 4772.0, 3138.0, 2014.0, 1294.0, 832.0, 541.0, 344.0, 208.0, 137.0, 98.0, 65.0, 39.0, 25.0, 14.0, 13.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.146484375, -2.0797119140625, -2.012939453125, -1.9461669921875, -1.87939453125, -1.8126220703125, -1.745849609375, -1.6790771484375, -1.6123046875, -1.5455322265625, -1.478759765625, -1.4119873046875, -1.34521484375, -1.2784423828125, -1.211669921875, -1.1448974609375, -1.078125, -1.0113525390625, -0.944580078125, -0.8778076171875, -0.81103515625, -0.7442626953125, -0.677490234375, -0.6107177734375, -0.5439453125, -0.4771728515625, -0.410400390625, -0.3436279296875, -0.27685546875, -0.2100830078125, -0.143310546875, -0.0765380859375, -0.009765625, 0.0570068359375, 0.123779296875, 0.1905517578125, 0.25732421875, 0.3240966796875, 0.390869140625, 0.4576416015625, 0.5244140625, 0.5911865234375, 0.657958984375, 0.7247314453125, 0.79150390625, 0.8582763671875, 0.925048828125, 0.9918212890625, 1.05859375, 1.1253662109375, 1.192138671875, 1.2589111328125, 1.32568359375, 1.3924560546875, 1.459228515625, 1.5260009765625, 1.5927734375, 1.6595458984375, 1.726318359375, 1.7930908203125, 1.85986328125, 1.9266357421875, 1.993408203125, 2.0601806640625, 2.126953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 8.0, 8.0, 16.0, 15.0, 21.0, 19.0, 27.0, 20.0, 30.0, 22.0, 37.0, 47.0, 44.0, 34.0, 28.0, 54.0, 39.0, 46.0, 52.0, 47.0, 50.0, 34.0, 42.0, 29.0, 34.0, 24.0, 28.0, 20.0, 24.0, 15.0, 15.0, 14.0, 7.0, 9.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9921875, -4.80810546875, -4.6240234375, -4.43994140625, -4.255859375, -4.07177734375, -3.8876953125, -3.70361328125, -3.51953125, -3.33544921875, -3.1513671875, -2.96728515625, -2.783203125, -2.59912109375, -2.4150390625, -2.23095703125, -2.046875, -1.86279296875, -1.6787109375, -1.49462890625, -1.310546875, -1.12646484375, -0.9423828125, -0.75830078125, -0.57421875, -0.39013671875, -0.2060546875, -0.02197265625, 0.162109375, 0.34619140625, 0.5302734375, 0.71435546875, 0.8984375, 1.08251953125, 1.2666015625, 1.45068359375, 1.634765625, 1.81884765625, 2.0029296875, 2.18701171875, 2.37109375, 2.55517578125, 2.7392578125, 2.92333984375, 3.107421875, 3.29150390625, 3.4755859375, 3.65966796875, 3.84375, 4.02783203125, 4.2119140625, 4.39599609375, 4.580078125, 4.76416015625, 4.9482421875, 5.13232421875, 5.31640625, 5.50048828125, 5.6845703125, 5.86865234375, 6.052734375, 6.23681640625, 6.4208984375, 6.60498046875, 6.7890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 6.0, 13.0, 16.0, 32.0, 27.0, 45.0, 86.0, 115.0, 204.0, 296.0, 501.0, 821.0, 1344.0, 2201.0, 3763.0, 6558.0, 11617.0, 20646.0, 38568.0, 73511.0, 147752.0, 307545.0, 215201.0, 102036.0, 52241.0, 27667.0, 15072.0, 8457.0, 4892.0, 2914.0, 1719.0, 1033.0, 646.0, 391.0, 218.0, 146.0, 84.0, 58.0, 41.0, 25.0, 15.0, 9.0, 11.0, 7.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.916015625, -2.82958984375, -2.7431640625, -2.65673828125, -2.5703125, -2.48388671875, -2.3974609375, -2.31103515625, -2.224609375, -2.13818359375, -2.0517578125, -1.96533203125, -1.87890625, -1.79248046875, -1.7060546875, -1.61962890625, -1.533203125, -1.44677734375, -1.3603515625, -1.27392578125, -1.1875, -1.10107421875, -1.0146484375, -0.92822265625, -0.841796875, -0.75537109375, -0.6689453125, -0.58251953125, -0.49609375, -0.40966796875, -0.3232421875, -0.23681640625, -0.150390625, -0.06396484375, 0.0224609375, 0.10888671875, 0.1953125, 0.28173828125, 0.3681640625, 0.45458984375, 0.541015625, 0.62744140625, 0.7138671875, 0.80029296875, 0.88671875, 0.97314453125, 1.0595703125, 1.14599609375, 1.232421875, 1.31884765625, 1.4052734375, 1.49169921875, 1.578125, 1.66455078125, 1.7509765625, 1.83740234375, 1.923828125, 2.01025390625, 2.0966796875, 2.18310546875, 2.26953125, 2.35595703125, 2.4423828125, 2.52880859375, 2.615234375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 7.0, 2.0, 7.0, 3.0, 6.0, 13.0, 19.0, 11.0, 13.0, 23.0, 25.0, 24.0, 29.0, 33.0, 48.0, 36.0, 37.0, 33.0, 27.0, 47.0, 60.0, 43.0, 44.0, 43.0, 44.0, 44.0, 35.0, 30.0, 33.0, 25.0, 25.0, 19.0, 24.0, 18.0, 26.0, 9.0, 6.0, 10.0, 3.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5390625, -3.424041748046875, -3.30902099609375, -3.194000244140625, -3.0789794921875, -2.963958740234375, -2.84893798828125, -2.733917236328125, -2.618896484375, -2.503875732421875, -2.38885498046875, -2.273834228515625, -2.1588134765625, -2.043792724609375, -1.92877197265625, -1.813751220703125, -1.69873046875, -1.583709716796875, -1.46868896484375, -1.353668212890625, -1.2386474609375, -1.123626708984375, -1.00860595703125, -0.893585205078125, -0.778564453125, -0.663543701171875, -0.54852294921875, -0.433502197265625, -0.3184814453125, -0.203460693359375, -0.08843994140625, 0.026580810546875, 0.1416015625, 0.256622314453125, 0.37164306640625, 0.486663818359375, 0.6016845703125, 0.716705322265625, 0.83172607421875, 0.946746826171875, 1.061767578125, 1.176788330078125, 1.29180908203125, 1.406829833984375, 1.5218505859375, 1.636871337890625, 1.75189208984375, 1.866912841796875, 1.98193359375, 2.096954345703125, 2.21197509765625, 2.326995849609375, 2.4420166015625, 2.557037353515625, 2.67205810546875, 2.787078857421875, 2.902099609375, 3.017120361328125, 3.13214111328125, 3.247161865234375, 3.3621826171875, 3.477203369140625, 3.59222412109375, 3.707244873046875, 3.822265625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 14.0, 10.0, 27.0, 28.0, 44.0, 68.0, 102.0, 152.0, 206.0, 375.0, 612.0, 963.0, 2026.0, 4108.0, 10233.0, 30316.0, 120406.0, 575553.0, 228757.0, 48144.0, 14765.0, 5680.0, 2629.0, 1332.0, 740.0, 431.0, 262.0, 183.0, 138.0, 76.0, 55.0, 37.0, 27.0, 11.0, 17.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04205322265625, -0.04090690612792969, -0.039760589599609375, -0.03861427307128906, -0.03746795654296875, -0.03632164001464844, -0.035175323486328125, -0.03402900695800781, -0.0328826904296875, -0.03173637390136719, -0.030590057373046875, -0.029443740844726562, -0.02829742431640625, -0.027151107788085938, -0.026004791259765625, -0.024858474731445312, -0.023712158203125, -0.022565841674804688, -0.021419525146484375, -0.020273208618164062, -0.01912689208984375, -0.017980575561523438, -0.016834259033203125, -0.015687942504882812, -0.0145416259765625, -0.013395309448242188, -0.012248992919921875, -0.011102676391601562, -0.00995635986328125, -0.008810043334960938, -0.007663726806640625, -0.0065174102783203125, -0.00537109375, -0.0042247772216796875, -0.003078460693359375, -0.0019321441650390625, -0.00078582763671875, 0.0003604888916015625, 0.001506805419921875, 0.0026531219482421875, 0.0037994384765625, 0.0049457550048828125, 0.006092071533203125, 0.0072383880615234375, 0.00838470458984375, 0.009531021118164062, 0.010677337646484375, 0.011823654174804688, 0.012969970703125, 0.014116287231445312, 0.015262603759765625, 0.016408920288085938, 0.01755523681640625, 0.018701553344726562, 0.019847869873046875, 0.020994186401367188, 0.0221405029296875, 0.023286819458007812, 0.024433135986328125, 0.025579452514648438, 0.02672576904296875, 0.027872085571289062, 0.029018402099609375, 0.030164718627929688, 0.03131103515625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 9.0, 11.0, 10.0, 12.0, 14.0, 22.0, 38.0, 52.0, 64.0, 80.0, 91.0, 95.0, 91.0, 72.0, 83.0, 62.0, 48.0, 45.0, 17.0, 27.0, 11.0, 10.0, 6.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1514872312545776e-05, -1.1228024959564209e-05, -1.0941177606582642e-05, -1.0654330253601074e-05, -1.0367482900619507e-05, -1.008063554763794e-05, -9.793788194656372e-06, -9.506940841674805e-06, -9.220093488693237e-06, -8.93324613571167e-06, -8.646398782730103e-06, -8.359551429748535e-06, -8.072704076766968e-06, -7.7858567237854e-06, -7.499009370803833e-06, -7.212162017822266e-06, -6.925314664840698e-06, -6.638467311859131e-06, -6.3516199588775635e-06, -6.064772605895996e-06, -5.777925252914429e-06, -5.491077899932861e-06, -5.204230546951294e-06, -4.9173831939697266e-06, -4.630535840988159e-06, -4.343688488006592e-06, -4.056841135025024e-06, -3.769993782043457e-06, -3.4831464290618896e-06, -3.1962990760803223e-06, -2.909451723098755e-06, -2.6226043701171875e-06, -2.33575701713562e-06, -2.0489096641540527e-06, -1.7620623111724854e-06, -1.475214958190918e-06, -1.1883676052093506e-06, -9.015202522277832e-07, -6.146728992462158e-07, -3.2782554626464844e-07, -4.0978193283081055e-08, 2.4586915969848633e-07, 5.327165126800537e-07, 8.195638656616211e-07, 1.1064112186431885e-06, 1.3932585716247559e-06, 1.6801059246063232e-06, 1.9669532775878906e-06, 2.253800630569458e-06, 2.5406479835510254e-06, 2.8274953365325928e-06, 3.11434268951416e-06, 3.4011900424957275e-06, 3.688037395477295e-06, 3.974884748458862e-06, 4.26173210144043e-06, 4.548579454421997e-06, 4.8354268074035645e-06, 5.122274160385132e-06, 5.409121513366699e-06, 5.695968866348267e-06, 5.982816219329834e-06, 6.269663572311401e-06, 6.556510925292969e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 12.0, 5.0, 10.0, 26.0, 31.0, 46.0, 60.0, 92.0, 121.0, 182.0, 271.0, 485.0, 687.0, 1080.0, 1691.0, 2746.0, 4622.0, 8100.0, 15148.0, 29941.0, 65131.0, 157557.0, 367026.0, 222686.0, 88092.0, 39061.0, 19150.0, 9949.0, 5654.0, 3254.0, 2085.0, 1258.0, 789.0, 489.0, 333.0, 219.0, 158.0, 101.0, 67.0, 34.0, 29.0, 25.0, 15.0, 17.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185699462890625, -0.017922401428222656, -0.017274856567382812, -0.01662731170654297, -0.015979766845703125, -0.015332221984863281, -0.014684677124023438, -0.014037132263183594, -0.01338958740234375, -0.012742042541503906, -0.012094497680664062, -0.011446952819824219, -0.010799407958984375, -0.010151863098144531, -0.009504318237304688, -0.008856773376464844, -0.008209228515625, -0.007561683654785156, -0.0069141387939453125, -0.006266593933105469, -0.005619049072265625, -0.004971504211425781, -0.0043239593505859375, -0.0036764144897460938, -0.00302886962890625, -0.0023813247680664062, -0.0017337799072265625, -0.0010862350463867188, -0.000438690185546875, 0.00020885467529296875, 0.0008563995361328125, 0.0015039443969726562, 0.0021514892578125, 0.0027990341186523438, 0.0034465789794921875, 0.004094123840332031, 0.004741668701171875, 0.005389213562011719, 0.0060367584228515625, 0.006684303283691406, 0.00733184814453125, 0.007979393005371094, 0.008626937866210938, 0.009274482727050781, 0.009922027587890625, 0.010569572448730469, 0.011217117309570312, 0.011864662170410156, 0.01251220703125, 0.013159751892089844, 0.013807296752929688, 0.014454841613769531, 0.015102386474609375, 0.01574993133544922, 0.016397476196289062, 0.017045021057128906, 0.01769256591796875, 0.018340110778808594, 0.018987655639648438, 0.01963520050048828, 0.020282745361328125, 0.02093029022216797, 0.021577835083007812, 0.022225379943847656, 0.0228729248046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 7.0, 8.0, 11.0, 15.0, 28.0, 42.0, 35.0, 63.0, 74.0, 79.0, 80.0, 84.0, 75.0, 64.0, 63.0, 51.0, 42.0, 38.0, 25.0, 26.0, 8.0, 16.0, 9.0, 7.0, 6.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00772857666015625, -0.007516026496887207, -0.007303476333618164, -0.007090926170349121, -0.006878376007080078, -0.006665825843811035, -0.006453275680541992, -0.006240725517272949, -0.006028175354003906, -0.005815625190734863, -0.00560307502746582, -0.005390524864196777, -0.005177974700927734, -0.004965424537658691, -0.0047528743743896484, -0.0045403242111206055, -0.0043277740478515625, -0.0041152238845825195, -0.0039026737213134766, -0.0036901235580444336, -0.0034775733947753906, -0.0032650232315063477, -0.0030524730682373047, -0.0028399229049682617, -0.0026273727416992188, -0.0024148225784301758, -0.002202272415161133, -0.00198972225189209, -0.0017771720886230469, -0.001564621925354004, -0.001352071762084961, -0.001139521598815918, -0.000926971435546875, -0.000714421272277832, -0.0005018711090087891, -0.0002893209457397461, -7.677078247070312e-05, 0.00013577938079833984, 0.0003483295440673828, 0.0005608797073364258, 0.0007734298706054688, 0.0009859800338745117, 0.0011985301971435547, 0.0014110803604125977, 0.0016236305236816406, 0.0018361806869506836, 0.0020487308502197266, 0.0022612810134887695, 0.0024738311767578125, 0.0026863813400268555, 0.0028989315032958984, 0.0031114816665649414, 0.0033240318298339844, 0.0035365819931030273, 0.0037491321563720703, 0.003961682319641113, 0.004174232482910156, 0.004386782646179199, 0.004599332809448242, 0.004811882972717285, 0.005024433135986328, 0.005236983299255371, 0.005449533462524414, 0.005662083625793457, 0.0058746337890625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 12.0, 13.0, 11.0, 12.0, 22.0, 20.0, 34.0, 51.0, 57.0, 71.0, 74.0, 69.0, 85.0, 73.0, 87.0, 54.0, 49.0, 43.0, 25.0, 29.0, 25.0, 17.0, 11.0, 5.0, 4.0, 9.0, 9.0, 6.0, 6.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.179548740386963, -5.984485626220703, -5.789422512054443, -5.594359397888184, -5.399295806884766, -5.204232692718506, -5.009169578552246, -4.814106464385986, -4.619043350219727, -4.423980236053467, -4.228917121887207, -4.033853530883789, -3.8387906551361084, -3.6437273025512695, -3.4486641883850098, -3.25360107421875, -3.058537721633911, -2.8634746074676514, -2.6684112548828125, -2.4733481407165527, -2.278285026550293, -2.083221912384033, -1.8881585597991943, -1.6930954456329346, -1.4980322122573853, -1.302968978881836, -1.1079058647155762, -0.9128426313400269, -0.7177794575691223, -0.5227162837982178, -0.32765305042266846, -0.1325899362564087, 0.062473297119140625, 0.25753647089004517, 0.4525996744632721, 0.647662878036499, 0.8427260518074036, 1.037789225578308, 1.2328524589538574, 1.4279155731201172, 1.6229788064956665, 1.8180420398712158, 2.0131051540374756, 2.2081685066223145, 2.403231620788574, 2.598294734954834, 2.7933578491210938, 2.9884209632873535, 3.1834843158721924, 3.378547430038452, 3.573610782623291, 3.768673896789551, 3.9637370109558105, 4.15880012512207, 4.353863716125488, 4.54892635345459, 4.743989944458008, 4.939053058624268, 5.134116172790527, 5.329179763793945, 5.524242877960205, 5.719305992126465, 5.914369106292725, 6.109432220458984, 6.304495334625244]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 6.0, 8.0, 12.0, 8.0, 12.0, 11.0, 19.0, 20.0, 17.0, 31.0, 26.0, 26.0, 33.0, 36.0, 39.0, 44.0, 43.0, 40.0, 58.0, 33.0, 47.0, 45.0, 34.0, 49.0, 37.0, 37.0, 36.0, 31.0, 21.0, 22.0, 17.0, 18.0, 17.0, 11.0, 17.0, 7.0, 10.0, 6.0, 6.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.059604167938232, -4.881618499755859, -4.703632831573486, -4.525647163391113, -4.34766149520874, -4.169675827026367, -3.991690158843994, -3.813704490661621, -3.635718822479248, -3.457733154296875, -3.279747486114502, -3.101761817932129, -2.923776149749756, -2.745790481567383, -2.5678048133850098, -2.3898191452026367, -2.2118334770202637, -2.0338478088378906, -1.8558621406555176, -1.6778764724731445, -1.4998908042907715, -1.3219051361083984, -1.1439194679260254, -0.9659337997436523, -0.7879481315612793, -0.6099624633789062, -0.4319767951965332, -0.25399112701416016, -0.07600545883178711, 0.10198020935058594, 0.279965877532959, 0.45795154571533203, 0.6359376907348633, 0.8139233589172363, 0.9919090270996094, 1.1698946952819824, 1.3478803634643555, 1.5258660316467285, 1.7038516998291016, 1.8818373680114746, 2.0598230361938477, 2.2378087043762207, 2.4157943725585938, 2.593780040740967, 2.77176570892334, 2.949751377105713, 3.127737045288086, 3.305722713470459, 3.483708381652832, 3.661694049835205, 3.839679718017578, 4.017665386199951, 4.195651054382324, 4.373636722564697, 4.55162239074707, 4.729608058929443, 4.907593727111816, 5.0855793952941895, 5.2635650634765625, 5.4415507316589355, 5.619536399841309, 5.797522068023682, 5.975507736206055, 6.153493404388428, 6.331479072570801]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 16.0, 15.0, 25.0, 43.0, 61.0, 103.0, 188.0, 308.0, 497.0, 863.0, 1336.0, 2266.0, 3801.0, 6453.0, 11247.0, 19597.0, 36475.0, 69611.0, 133855.0, 228116.0, 233917.0, 139846.0, 73167.0, 37895.0, 20475.0, 11655.0, 6788.0, 3909.0, 2425.0, 1416.0, 867.0, 502.0, 344.0, 195.0, 102.0, 63.0, 32.0, 32.0, 17.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.6015625, -10.2806396484375, -9.959716796875, -9.6387939453125, -9.31787109375, -8.9969482421875, -8.676025390625, -8.3551025390625, -8.0341796875, -7.7132568359375, -7.392333984375, -7.0714111328125, -6.75048828125, -6.4295654296875, -6.108642578125, -5.7877197265625, -5.466796875, -5.1458740234375, -4.824951171875, -4.5040283203125, -4.18310546875, -3.8621826171875, -3.541259765625, -3.2203369140625, -2.8994140625, -2.5784912109375, -2.257568359375, -1.9366455078125, -1.61572265625, -1.2947998046875, -0.973876953125, -0.6529541015625, -0.33203125, -0.0111083984375, 0.309814453125, 0.6307373046875, 0.95166015625, 1.2725830078125, 1.593505859375, 1.9144287109375, 2.2353515625, 2.5562744140625, 2.877197265625, 3.1981201171875, 3.51904296875, 3.8399658203125, 4.160888671875, 4.4818115234375, 4.802734375, 5.1236572265625, 5.444580078125, 5.7655029296875, 6.08642578125, 6.4073486328125, 6.728271484375, 7.0491943359375, 7.3701171875, 7.6910400390625, 8.011962890625, 8.3328857421875, 8.65380859375, 8.9747314453125, 9.295654296875, 9.6165771484375, 9.9375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 9.0, 6.0, 6.0, 10.0, 6.0, 12.0, 26.0, 24.0, 20.0, 20.0, 26.0, 30.0, 33.0, 33.0, 41.0, 44.0, 34.0, 49.0, 34.0, 46.0, 34.0, 45.0, 48.0, 49.0, 38.0, 33.0, 33.0, 27.0, 25.0, 22.0, 19.0, 17.0, 15.0, 18.0, 11.0, 10.0, 14.0, 3.0, 9.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.0703125, -4.9046630859375, -4.739013671875, -4.5733642578125, -4.40771484375, -4.2420654296875, -4.076416015625, -3.9107666015625, -3.7451171875, -3.5794677734375, -3.413818359375, -3.2481689453125, -3.08251953125, -2.9168701171875, -2.751220703125, -2.5855712890625, -2.419921875, -2.2542724609375, -2.088623046875, -1.9229736328125, -1.75732421875, -1.5916748046875, -1.426025390625, -1.2603759765625, -1.0947265625, -0.9290771484375, -0.763427734375, -0.5977783203125, -0.43212890625, -0.2664794921875, -0.100830078125, 0.0648193359375, 0.23046875, 0.3961181640625, 0.561767578125, 0.7274169921875, 0.89306640625, 1.0587158203125, 1.224365234375, 1.3900146484375, 1.5556640625, 1.7213134765625, 1.886962890625, 2.0526123046875, 2.21826171875, 2.3839111328125, 2.549560546875, 2.7152099609375, 2.880859375, 3.0465087890625, 3.212158203125, 3.3778076171875, 3.54345703125, 3.7091064453125, 3.874755859375, 4.0404052734375, 4.2060546875, 4.3717041015625, 4.537353515625, 4.7030029296875, 4.86865234375, 5.0343017578125, 5.199951171875, 5.3656005859375, 5.53125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 8.0, 6.0, 11.0, 11.0, 19.0, 27.0, 44.0, 60.0, 86.0, 148.0, 181.0, 265.0, 351.0, 577.0, 848.0, 1253.0, 1994.0, 2973.0, 4436.0, 7117.0, 10809.0, 17440.0, 28088.0, 47243.0, 78941.0, 132470.0, 193697.0, 191711.0, 129588.0, 76975.0, 45589.0, 27524.0, 17289.0, 10899.0, 6814.0, 4310.0, 2888.0, 1945.0, 1273.0, 841.0, 542.0, 416.0, 269.0, 181.0, 121.0, 72.0, 63.0, 40.0, 30.0, 28.0, 18.0, 13.0, 10.0, 9.0, 1.0, 2.0, 0.0, 3.0], "bins": [-8.5625, -8.3028564453125, -8.043212890625, -7.7835693359375, -7.52392578125, -7.2642822265625, -7.004638671875, -6.7449951171875, -6.4853515625, -6.2257080078125, -5.966064453125, -5.7064208984375, -5.44677734375, -5.1871337890625, -4.927490234375, -4.6678466796875, -4.408203125, -4.1485595703125, -3.888916015625, -3.6292724609375, -3.36962890625, -3.1099853515625, -2.850341796875, -2.5906982421875, -2.3310546875, -2.0714111328125, -1.811767578125, -1.5521240234375, -1.29248046875, -1.0328369140625, -0.773193359375, -0.5135498046875, -0.25390625, 0.0057373046875, 0.265380859375, 0.5250244140625, 0.78466796875, 1.0443115234375, 1.303955078125, 1.5635986328125, 1.8232421875, 2.0828857421875, 2.342529296875, 2.6021728515625, 2.86181640625, 3.1214599609375, 3.381103515625, 3.6407470703125, 3.900390625, 4.1600341796875, 4.419677734375, 4.6793212890625, 4.93896484375, 5.1986083984375, 5.458251953125, 5.7178955078125, 5.9775390625, 6.2371826171875, 6.496826171875, 6.7564697265625, 7.01611328125, 7.2757568359375, 7.535400390625, 7.7950439453125, 8.0546875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 8.0, 13.0, 6.0, 13.0, 23.0, 15.0, 23.0, 26.0, 27.0, 25.0, 28.0, 39.0, 38.0, 35.0, 46.0, 34.0, 36.0, 45.0, 39.0, 41.0, 38.0, 44.0, 29.0, 37.0, 28.0, 30.0, 31.0, 22.0, 30.0, 21.0, 17.0, 18.0, 12.0, 12.0, 11.0, 7.0, 8.0, 4.0, 13.0, 3.0, 8.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.029296875, -2.92608642578125, -2.8228759765625, -2.71966552734375, -2.616455078125, -2.51324462890625, -2.4100341796875, -2.30682373046875, -2.20361328125, -2.10040283203125, -1.9971923828125, -1.89398193359375, -1.790771484375, -1.68756103515625, -1.5843505859375, -1.48114013671875, -1.3779296875, -1.27471923828125, -1.1715087890625, -1.06829833984375, -0.965087890625, -0.86187744140625, -0.7586669921875, -0.65545654296875, -0.55224609375, -0.44903564453125, -0.3458251953125, -0.24261474609375, -0.139404296875, -0.03619384765625, 0.0670166015625, 0.17022705078125, 0.2734375, 0.37664794921875, 0.4798583984375, 0.58306884765625, 0.686279296875, 0.78948974609375, 0.8927001953125, 0.99591064453125, 1.09912109375, 1.20233154296875, 1.3055419921875, 1.40875244140625, 1.511962890625, 1.61517333984375, 1.7183837890625, 1.82159423828125, 1.9248046875, 2.02801513671875, 2.1312255859375, 2.23443603515625, 2.337646484375, 2.44085693359375, 2.5440673828125, 2.64727783203125, 2.75048828125, 2.85369873046875, 2.9569091796875, 3.06011962890625, 3.163330078125, 3.26654052734375, 3.3697509765625, 3.47296142578125, 3.576171875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 12.0, 9.0, 17.0, 23.0, 42.0, 42.0, 76.0, 98.0, 176.0, 209.0, 336.0, 455.0, 637.0, 975.0, 1423.0, 2081.0, 3014.0, 4831.0, 7480.0, 12684.0, 21741.0, 40781.0, 88386.0, 247923.0, 353197.0, 135042.0, 55925.0, 28234.0, 15945.0, 9429.0, 5897.0, 3698.0, 2467.0, 1614.0, 1153.0, 762.0, 497.0, 401.0, 251.0, 201.0, 116.0, 98.0, 62.0, 39.0, 31.0, 20.0, 16.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6201171875, -1.5682220458984375, -1.516326904296875, -1.4644317626953125, -1.41253662109375, -1.3606414794921875, -1.308746337890625, -1.2568511962890625, -1.2049560546875, -1.1530609130859375, -1.101165771484375, -1.0492706298828125, -0.99737548828125, -0.9454803466796875, -0.893585205078125, -0.8416900634765625, -0.789794921875, -0.7378997802734375, -0.686004638671875, -0.6341094970703125, -0.58221435546875, -0.5303192138671875, -0.478424072265625, -0.4265289306640625, -0.3746337890625, -0.3227386474609375, -0.270843505859375, -0.2189483642578125, -0.16705322265625, -0.1151580810546875, -0.063262939453125, -0.0113677978515625, 0.04052734375, 0.0924224853515625, 0.144317626953125, 0.1962127685546875, 0.24810791015625, 0.3000030517578125, 0.351898193359375, 0.4037933349609375, 0.4556884765625, 0.5075836181640625, 0.559478759765625, 0.6113739013671875, 0.66326904296875, 0.7151641845703125, 0.767059326171875, 0.8189544677734375, 0.870849609375, 0.9227447509765625, 0.974639892578125, 1.0265350341796875, 1.07843017578125, 1.1303253173828125, 1.182220458984375, 1.2341156005859375, 1.2860107421875, 1.3379058837890625, 1.389801025390625, 1.4416961669921875, 1.49359130859375, 1.5454864501953125, 1.597381591796875, 1.6492767333984375, 1.701171875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 7.0, 7.0, 18.0, 18.0, 30.0, 34.0, 36.0, 62.0, 78.0, 105.0, 131.0, 138.0, 85.0, 58.0, 58.0, 33.0, 32.0, 13.0, 9.0, 10.0, 12.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012421607971191406, -0.00011956319212913513, -0.0001149103045463562, -0.00011025741696357727, -0.00010560452938079834, -0.00010095164179801941, -9.629875421524048e-05, -9.164586663246155e-05, -8.699297904968262e-05, -8.234009146690369e-05, -7.768720388412476e-05, -7.303431630134583e-05, -6.83814287185669e-05, -6.372854113578796e-05, -5.907565355300903e-05, -5.44227659702301e-05, -4.976987838745117e-05, -4.511699080467224e-05, -4.046410322189331e-05, -3.581121563911438e-05, -3.115832805633545e-05, -2.650544047355652e-05, -2.1852552890777588e-05, -1.7199665307998657e-05, -1.2546777725219727e-05, -7.893890142440796e-06, -3.2410025596618652e-06, 1.4118850231170654e-06, 6.064772605895996e-06, 1.0717660188674927e-05, 1.5370547771453857e-05, 2.0023435354232788e-05, 2.467632293701172e-05, 2.932921051979065e-05, 3.398209810256958e-05, 3.863498568534851e-05, 4.328787326812744e-05, 4.794076085090637e-05, 5.25936484336853e-05, 5.7246536016464233e-05, 6.189942359924316e-05, 6.65523111820221e-05, 7.120519876480103e-05, 7.585808634757996e-05, 8.051097393035889e-05, 8.516386151313782e-05, 8.981674909591675e-05, 9.446963667869568e-05, 9.912252426147461e-05, 0.00010377541184425354, 0.00010842829942703247, 0.0001130811870098114, 0.00011773407459259033, 0.00012238696217536926, 0.0001270398497581482, 0.00013169273734092712, 0.00013634562492370605, 0.00014099851250648499, 0.00014565140008926392, 0.00015030428767204285, 0.00015495717525482178, 0.0001596100628376007, 0.00016426295042037964, 0.00016891583800315857, 0.0001735687255859375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 6.0, 13.0, 16.0, 19.0, 32.0, 44.0, 48.0, 74.0, 99.0, 147.0, 239.0, 350.0, 513.0, 853.0, 1238.0, 1997.0, 3195.0, 5330.0, 9180.0, 16858.0, 34256.0, 81591.0, 274850.0, 399322.0, 122512.0, 45832.0, 21530.0, 11495.0, 6413.0, 3777.0, 2409.0, 1495.0, 969.0, 615.0, 353.0, 290.0, 188.0, 109.0, 75.0, 68.0, 36.0, 43.0, 25.0, 15.0, 14.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0], "bins": [-2.419921875, -2.3530426025390625, -2.286163330078125, -2.2192840576171875, -2.15240478515625, -2.0855255126953125, -2.018646240234375, -1.9517669677734375, -1.8848876953125, -1.8180084228515625, -1.751129150390625, -1.6842498779296875, -1.61737060546875, -1.5504913330078125, -1.483612060546875, -1.4167327880859375, -1.349853515625, -1.2829742431640625, -1.216094970703125, -1.1492156982421875, -1.08233642578125, -1.0154571533203125, -0.948577880859375, -0.8816986083984375, -0.8148193359375, -0.7479400634765625, -0.681060791015625, -0.6141815185546875, -0.54730224609375, -0.4804229736328125, -0.413543701171875, -0.3466644287109375, -0.27978515625, -0.2129058837890625, -0.146026611328125, -0.0791473388671875, -0.01226806640625, 0.0546112060546875, 0.121490478515625, 0.1883697509765625, 0.2552490234375, 0.3221282958984375, 0.389007568359375, 0.4558868408203125, 0.52276611328125, 0.5896453857421875, 0.656524658203125, 0.7234039306640625, 0.790283203125, 0.8571624755859375, 0.924041748046875, 0.9909210205078125, 1.05780029296875, 1.1246795654296875, 1.191558837890625, 1.2584381103515625, 1.3253173828125, 1.3921966552734375, 1.459075927734375, 1.5259552001953125, 1.59283447265625, 1.6597137451171875, 1.726593017578125, 1.7934722900390625, 1.8603515625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 5.0, 7.0, 13.0, 13.0, 11.0, 17.0, 23.0, 32.0, 36.0, 48.0, 60.0, 90.0, 120.0, 117.0, 99.0, 74.0, 41.0, 32.0, 25.0, 19.0, 28.0, 20.0, 9.0, 20.0, 6.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6328125, -0.6093902587890625, -0.585968017578125, -0.5625457763671875, -0.53912353515625, -0.5157012939453125, -0.492279052734375, -0.4688568115234375, -0.4454345703125, -0.4220123291015625, -0.398590087890625, -0.3751678466796875, -0.35174560546875, -0.3283233642578125, -0.304901123046875, -0.2814788818359375, -0.258056640625, -0.2346343994140625, -0.211212158203125, -0.1877899169921875, -0.16436767578125, -0.1409454345703125, -0.117523193359375, -0.0941009521484375, -0.0706787109375, -0.0472564697265625, -0.023834228515625, -0.0004119873046875, 0.02301025390625, 0.0464324951171875, 0.069854736328125, 0.0932769775390625, 0.11669921875, 0.1401214599609375, 0.163543701171875, 0.1869659423828125, 0.21038818359375, 0.2338104248046875, 0.257232666015625, 0.2806549072265625, 0.3040771484375, 0.3274993896484375, 0.350921630859375, 0.3743438720703125, 0.39776611328125, 0.4211883544921875, 0.444610595703125, 0.4680328369140625, 0.491455078125, 0.5148773193359375, 0.538299560546875, 0.5617218017578125, 0.58514404296875, 0.6085662841796875, 0.631988525390625, 0.6554107666015625, 0.6788330078125, 0.7022552490234375, 0.725677490234375, 0.7490997314453125, 0.77252197265625, 0.7959442138671875, 0.819366455078125, 0.8427886962890625, 0.8662109375]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 11.0, 4.0, 10.0, 12.0, 12.0, 18.0, 30.0, 41.0, 42.0, 64.0, 69.0, 69.0, 80.0, 66.0, 85.0, 64.0, 55.0, 55.0, 51.0, 30.0, 25.0, 20.0, 13.0, 15.0, 7.0, 9.0, 10.0, 7.0, 5.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.893570423126221, -6.693997383117676, -6.494424819946289, -6.294851779937744, -6.095278739929199, -5.895705699920654, -5.696132659912109, -5.496560096740723, -5.296987056732178, -5.097414016723633, -4.897841453552246, -4.698268413543701, -4.498695373535156, -4.299122333526611, -4.099549293518066, -3.8999767303466797, -3.7004036903381348, -3.50083065032959, -3.301257848739624, -3.101685047149658, -2.9021120071411133, -2.7025389671325684, -2.5029661655426025, -2.3033933639526367, -2.103820323944092, -1.9042474031448364, -1.704674482345581, -1.5051015615463257, -1.3055286407470703, -1.105955719947815, -0.9063827991485596, -0.7068098783493042, -0.5072364807128906, -0.30766355991363525, -0.10809063911437988, 0.09148228168487549, 0.29105520248413086, 0.49062812328338623, 0.6902010440826416, 0.889773964881897, 1.0893468856811523, 1.2889198064804077, 1.488492727279663, 1.6880656480789185, 1.8876385688781738, 2.0872116088867188, 2.2867844104766846, 2.4863572120666504, 2.6859302520751953, 2.8855032920837402, 3.085076093673706, 3.284648895263672, 3.484221935272217, 3.6837949752807617, 3.8833677768707275, 4.082940578460693, 4.282513618469238, 4.482086658477783, 4.681659698486328, 4.881232261657715, 5.08080530166626, 5.280378341674805, 5.479950904846191, 5.679523944854736, 5.879096984863281]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 1.0, 5.0, 10.0, 9.0, 11.0, 13.0, 17.0, 9.0, 22.0, 20.0, 30.0, 18.0, 22.0, 33.0, 32.0, 43.0, 36.0, 44.0, 39.0, 38.0, 43.0, 37.0, 34.0, 61.0, 41.0, 32.0, 34.0, 28.0, 47.0, 24.0, 22.0, 19.0, 28.0, 15.0, 8.0, 15.0, 7.0, 10.0, 13.0, 6.0, 8.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.741421222686768, -5.567446231842041, -5.3934712409973145, -5.219496250152588, -5.045520782470703, -4.871545791625977, -4.69757080078125, -4.523595809936523, -4.349620819091797, -4.17564582824707, -4.001670837402344, -3.827695608139038, -3.6537206172943115, -3.479745626449585, -3.3057703971862793, -3.1317954063415527, -2.957820415496826, -2.7838454246520996, -2.609870433807373, -2.4358952045440674, -2.261920213699341, -2.0879452228546143, -1.9139701128005981, -1.739995002746582, -1.5660200119018555, -1.392045021057129, -1.2180699110031128, -1.0440948009490967, -0.8701198101043701, -0.6961447596549988, -0.5221697092056274, -0.34819459915161133, -0.17421913146972656, -0.0002440810203552246, 0.1737309694290161, 0.34770601987838745, 0.5216810703277588, 0.6956561207771301, 0.8696311712265015, 1.0436062812805176, 1.2175812721252441, 1.3915562629699707, 1.5655313730239868, 1.739506483078003, 1.9134814739227295, 2.087456464767456, 2.2614316940307617, 2.4354066848754883, 2.609381675720215, 2.7833566665649414, 2.957331657409668, 3.1313068866729736, 3.3052818775177, 3.4792568683624268, 3.6532320976257324, 3.827207088470459, 4.0011820793151855, 4.175157070159912, 4.349132061004639, 4.523107051849365, 4.69708251953125, 4.871057510375977, 5.045032501220703, 5.21900749206543, 5.392982482910156]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 17.0, 23.0, 33.0, 50.0, 81.0, 110.0, 141.0, 227.0, 318.0, 516.0, 759.0, 1116.0, 1724.0, 2543.0, 4009.0, 6156.0, 9831.0, 15586.0, 25063.0, 41766.0, 72487.0, 134588.0, 302539.0, 873319.0, 1460290.0, 721049.0, 250714.0, 114010.0, 61336.0, 35114.0, 21015.0, 13135.0, 8272.0, 5432.0, 3527.0, 2409.0, 1604.0, 1078.0, 728.0, 512.0, 333.0, 239.0, 175.0, 87.0, 74.0, 54.0, 30.0, 19.0, 13.0, 9.0, 12.0, 7.0, 1.0, 2.0, 3.0], "bins": [-7.953125, -7.7149658203125, -7.476806640625, -7.2386474609375, -7.00048828125, -6.7623291015625, -6.524169921875, -6.2860107421875, -6.0478515625, -5.8096923828125, -5.571533203125, -5.3333740234375, -5.09521484375, -4.8570556640625, -4.618896484375, -4.3807373046875, -4.142578125, -3.9044189453125, -3.666259765625, -3.4281005859375, -3.18994140625, -2.9517822265625, -2.713623046875, -2.4754638671875, -2.2373046875, -1.9991455078125, -1.760986328125, -1.5228271484375, -1.28466796875, -1.0465087890625, -0.808349609375, -0.5701904296875, -0.33203125, -0.0938720703125, 0.144287109375, 0.3824462890625, 0.62060546875, 0.8587646484375, 1.096923828125, 1.3350830078125, 1.5732421875, 1.8114013671875, 2.049560546875, 2.2877197265625, 2.52587890625, 2.7640380859375, 3.002197265625, 3.2403564453125, 3.478515625, 3.7166748046875, 3.954833984375, 4.1929931640625, 4.43115234375, 4.6693115234375, 4.907470703125, 5.1456298828125, 5.3837890625, 5.6219482421875, 5.860107421875, 6.0982666015625, 6.33642578125, 6.5745849609375, 6.812744140625, 7.0509033203125, 7.2890625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 7.0, 8.0, 12.0, 13.0, 18.0, 20.0, 19.0, 16.0, 24.0, 31.0, 31.0, 28.0, 34.0, 40.0, 32.0, 46.0, 39.0, 42.0, 41.0, 37.0, 48.0, 52.0, 44.0, 40.0, 30.0, 28.0, 42.0, 23.0, 23.0, 14.0, 8.0, 10.0, 19.0, 16.0, 12.0, 5.0, 7.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.35406494140625, -4.2003173828125, -4.04656982421875, -3.892822265625, -3.73907470703125, -3.5853271484375, -3.43157958984375, -3.27783203125, -3.12408447265625, -2.9703369140625, -2.81658935546875, -2.662841796875, -2.50909423828125, -2.3553466796875, -2.20159912109375, -2.0478515625, -1.89410400390625, -1.7403564453125, -1.58660888671875, -1.432861328125, -1.27911376953125, -1.1253662109375, -0.97161865234375, -0.81787109375, -0.66412353515625, -0.5103759765625, -0.35662841796875, -0.202880859375, -0.04913330078125, 0.1046142578125, 0.25836181640625, 0.412109375, 0.56585693359375, 0.7196044921875, 0.87335205078125, 1.027099609375, 1.18084716796875, 1.3345947265625, 1.48834228515625, 1.64208984375, 1.79583740234375, 1.9495849609375, 2.10333251953125, 2.257080078125, 2.41082763671875, 2.5645751953125, 2.71832275390625, 2.8720703125, 3.02581787109375, 3.1795654296875, 3.33331298828125, 3.487060546875, 3.64080810546875, 3.7945556640625, 3.94830322265625, 4.10205078125, 4.25579833984375, 4.4095458984375, 4.56329345703125, 4.717041015625, 4.87078857421875, 5.0245361328125, 5.17828369140625, 5.33203125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 6.0, 2.0, 16.0, 19.0, 31.0, 29.0, 70.0, 98.0, 159.0, 251.0, 321.0, 552.0, 801.0, 1233.0, 2053.0, 3265.0, 5005.0, 8179.0, 13616.0, 23201.0, 39759.0, 70413.0, 129890.0, 255235.0, 533169.0, 1145181.0, 1011490.0, 459423.0, 223644.0, 115557.0, 63079.0, 35820.0, 20806.0, 12199.0, 7455.0, 4582.0, 2787.0, 1831.0, 1111.0, 651.0, 429.0, 311.0, 188.0, 137.0, 79.0, 53.0, 43.0, 13.0, 19.0, 9.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.43359375, -6.21844482421875, -6.0032958984375, -5.78814697265625, -5.572998046875, -5.35784912109375, -5.1427001953125, -4.92755126953125, -4.71240234375, -4.49725341796875, -4.2821044921875, -4.06695556640625, -3.851806640625, -3.63665771484375, -3.4215087890625, -3.20635986328125, -2.9912109375, -2.77606201171875, -2.5609130859375, -2.34576416015625, -2.130615234375, -1.91546630859375, -1.7003173828125, -1.48516845703125, -1.27001953125, -1.05487060546875, -0.8397216796875, -0.62457275390625, -0.409423828125, -0.19427490234375, 0.0208740234375, 0.23602294921875, 0.451171875, 0.66632080078125, 0.8814697265625, 1.09661865234375, 1.311767578125, 1.52691650390625, 1.7420654296875, 1.95721435546875, 2.17236328125, 2.38751220703125, 2.6026611328125, 2.81781005859375, 3.032958984375, 3.24810791015625, 3.4632568359375, 3.67840576171875, 3.8935546875, 4.10870361328125, 4.3238525390625, 4.53900146484375, 4.754150390625, 4.96929931640625, 5.1844482421875, 5.39959716796875, 5.61474609375, 5.82989501953125, 6.0450439453125, 6.26019287109375, 6.475341796875, 6.69049072265625, 6.9056396484375, 7.12078857421875, 7.3359375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 1.0, 5.0, 9.0, 6.0, 8.0, 16.0, 15.0, 16.0, 22.0, 43.0, 46.0, 78.0, 62.0, 83.0, 91.0, 129.0, 150.0, 168.0, 218.0, 231.0, 300.0, 351.0, 312.0, 303.0, 232.0, 222.0, 178.0, 153.0, 103.0, 104.0, 76.0, 54.0, 63.0, 49.0, 32.0, 24.0, 31.0, 23.0, 16.0, 14.0, 11.0, 12.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.859375, -2.777008056640625, -2.69464111328125, -2.612274169921875, -2.5299072265625, -2.447540283203125, -2.36517333984375, -2.282806396484375, -2.200439453125, -2.118072509765625, -2.03570556640625, -1.953338623046875, -1.8709716796875, -1.788604736328125, -1.70623779296875, -1.623870849609375, -1.54150390625, -1.459136962890625, -1.37677001953125, -1.294403076171875, -1.2120361328125, -1.129669189453125, -1.04730224609375, -0.964935302734375, -0.882568359375, -0.800201416015625, -0.71783447265625, -0.635467529296875, -0.5531005859375, -0.470733642578125, -0.38836669921875, -0.305999755859375, -0.2236328125, -0.141265869140625, -0.05889892578125, 0.023468017578125, 0.1058349609375, 0.188201904296875, 0.27056884765625, 0.352935791015625, 0.435302734375, 0.517669677734375, 0.60003662109375, 0.682403564453125, 0.7647705078125, 0.847137451171875, 0.92950439453125, 1.011871337890625, 1.09423828125, 1.176605224609375, 1.25897216796875, 1.341339111328125, 1.4237060546875, 1.506072998046875, 1.58843994140625, 1.670806884765625, 1.753173828125, 1.835540771484375, 1.91790771484375, 2.000274658203125, 2.0826416015625, 2.165008544921875, 2.24737548828125, 2.329742431640625, 2.412109375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 6.0, 10.0, 5.0, 7.0, 11.0, 13.0, 23.0, 29.0, 33.0, 43.0, 59.0, 57.0, 70.0, 103.0, 84.0, 77.0, 68.0, 56.0, 48.0, 44.0, 32.0, 26.0, 23.0, 18.0, 9.0, 13.0, 6.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.524494171142578, -7.294224262237549, -7.063954830169678, -6.833684921264648, -6.603415489196777, -6.373145580291748, -6.142875671386719, -5.912606239318848, -5.682336330413818, -5.452066421508789, -5.221796989440918, -4.991527080535889, -4.761257171630859, -4.530987739562988, -4.300717830657959, -4.07044792175293, -3.8401784896850586, -3.6099088191986084, -3.379639148712158, -3.149369239807129, -2.9190995693206787, -2.6888298988342285, -2.458559989929199, -2.228290319442749, -1.9980206489562988, -1.7677509784698486, -1.5374811887741089, -1.3072113990783691, -1.076941728591919, -0.8466720581054688, -0.616402268409729, -0.38613247871398926, -0.15586280822753906, 0.07440692186355591, 0.3046766519546509, 0.5349463820457458, 0.7652161121368408, 0.995485782623291, 1.2257555723190308, 1.4560253620147705, 1.6862950325012207, 1.916564702987671, 2.146834373474121, 2.3771042823791504, 2.6073739528656006, 2.837643623352051, 3.06791353225708, 3.2981832027435303, 3.5284528732299805, 3.7587225437164307, 3.988992214202881, 4.21926212310791, 4.449531555175781, 4.6798014640808105, 4.91007137298584, 5.140340805053711, 5.37061071395874, 5.6008806228637695, 5.831150054931641, 6.06141996383667, 6.291689872741699, 6.52195930480957, 6.7522292137146, 6.982499122619629, 7.2127685546875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 6.0, 10.0, 9.0, 11.0, 19.0, 15.0, 19.0, 17.0, 30.0, 27.0, 21.0, 34.0, 33.0, 35.0, 34.0, 43.0, 39.0, 43.0, 41.0, 47.0, 39.0, 37.0, 33.0, 35.0, 39.0, 36.0, 31.0, 27.0, 25.0, 20.0, 21.0, 21.0, 13.0, 13.0, 15.0, 12.0, 12.0, 10.0, 3.0, 6.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.964505195617676, -4.787046432495117, -4.609588146209717, -4.432129383087158, -4.2546706199646, -4.077212333679199, -3.8997535705566406, -3.722295045852661, -3.5448365211486816, -3.367377996444702, -3.1899192333221436, -3.012460708618164, -2.8350021839141846, -2.657543659210205, -2.4800848960876465, -2.302626371383667, -2.1251676082611084, -1.9477089643478394, -1.7702504396438599, -1.5927917957305908, -1.4153332710266113, -1.2378746271133423, -1.0604159832000732, -0.8829574584960938, -0.7054988145828247, -0.5280402302742004, -0.3505816161632538, -0.17312300205230713, 0.004335582256317139, 0.1817941665649414, 0.35925281047821045, 0.5367113351821899, 0.714169979095459, 0.8916285634040833, 1.0690871477127075, 1.2465457916259766, 1.424004316329956, 1.601462960243225, 1.7789216041564941, 1.9563801288604736, 2.133838653564453, 2.3112971782684326, 2.488755941390991, 2.6662144660949707, 2.84367299079895, 3.0211315155029297, 3.1985902786254883, 3.3760488033294678, 3.5535075664520264, 3.730966091156006, 3.9084248542785645, 4.085883140563965, 4.263341903686523, 4.440800666809082, 4.618259429931641, 4.795717716217041, 4.9731764793396, 5.150635242462158, 5.328093528747559, 5.505552291870117, 5.683011054992676, 5.860469341278076, 6.037928104400635, 6.215386390686035, 6.392845153808594]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 11.0, 20.0, 27.0, 50.0, 56.0, 86.0, 112.0, 197.0, 269.0, 462.0, 600.0, 871.0, 1374.0, 2092.0, 3220.0, 4824.0, 7267.0, 11283.0, 16903.0, 26065.0, 39320.0, 61191.0, 94709.0, 148513.0, 206139.0, 150404.0, 95182.0, 61637.0, 40039.0, 25787.0, 17012.0, 11140.0, 7466.0, 4748.0, 3253.0, 2019.0, 1362.0, 953.0, 645.0, 411.0, 291.0, 175.0, 126.0, 90.0, 45.0, 40.0, 20.0, 20.0, 6.0, 9.0, 4.0, 1.0, 5.0, 3.0], "bins": [-2.130859375, -2.0691070556640625, -2.007354736328125, -1.9456024169921875, -1.88385009765625, -1.8220977783203125, -1.760345458984375, -1.6985931396484375, -1.6368408203125, -1.5750885009765625, -1.513336181640625, -1.4515838623046875, -1.38983154296875, -1.3280792236328125, -1.266326904296875, -1.2045745849609375, -1.142822265625, -1.0810699462890625, -1.019317626953125, -0.9575653076171875, -0.89581298828125, -0.8340606689453125, -0.772308349609375, -0.7105560302734375, -0.6488037109375, -0.5870513916015625, -0.525299072265625, -0.4635467529296875, -0.40179443359375, -0.3400421142578125, -0.278289794921875, -0.2165374755859375, -0.15478515625, -0.0930328369140625, -0.031280517578125, 0.0304718017578125, 0.09222412109375, 0.1539764404296875, 0.215728759765625, 0.2774810791015625, 0.3392333984375, 0.4009857177734375, 0.462738037109375, 0.5244903564453125, 0.58624267578125, 0.6479949951171875, 0.709747314453125, 0.7714996337890625, 0.833251953125, 0.8950042724609375, 0.956756591796875, 1.0185089111328125, 1.08026123046875, 1.1420135498046875, 1.203765869140625, 1.2655181884765625, 1.3272705078125, 1.3890228271484375, 1.450775146484375, 1.5125274658203125, 1.57427978515625, 1.6360321044921875, 1.697784423828125, 1.7595367431640625, 1.8212890625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 4.0, 7.0, 13.0, 9.0, 7.0, 16.0, 20.0, 14.0, 23.0, 27.0, 26.0, 16.0, 28.0, 34.0, 20.0, 39.0, 42.0, 34.0, 39.0, 50.0, 41.0, 35.0, 28.0, 46.0, 26.0, 42.0, 32.0, 33.0, 23.0, 40.0, 16.0, 23.0, 23.0, 23.0, 12.0, 9.0, 18.0, 9.0, 12.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.3828125, -5.21319580078125, -5.0435791015625, -4.87396240234375, -4.704345703125, -4.53472900390625, -4.3651123046875, -4.19549560546875, -4.02587890625, -3.85626220703125, -3.6866455078125, -3.51702880859375, -3.347412109375, -3.17779541015625, -3.0081787109375, -2.83856201171875, -2.6689453125, -2.49932861328125, -2.3297119140625, -2.16009521484375, -1.990478515625, -1.82086181640625, -1.6512451171875, -1.48162841796875, -1.31201171875, -1.14239501953125, -0.9727783203125, -0.80316162109375, -0.633544921875, -0.46392822265625, -0.2943115234375, -0.12469482421875, 0.044921875, 0.21453857421875, 0.3841552734375, 0.55377197265625, 0.723388671875, 0.89300537109375, 1.0626220703125, 1.23223876953125, 1.40185546875, 1.57147216796875, 1.7410888671875, 1.91070556640625, 2.080322265625, 2.24993896484375, 2.4195556640625, 2.58917236328125, 2.7587890625, 2.92840576171875, 3.0980224609375, 3.26763916015625, 3.437255859375, 3.60687255859375, 3.7764892578125, 3.94610595703125, 4.11572265625, 4.28533935546875, 4.4549560546875, 4.62457275390625, 4.794189453125, 4.96380615234375, 5.1334228515625, 5.30303955078125, 5.47265625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 10.0, 12.0, 13.0, 19.0, 24.0, 37.0, 66.0, 85.0, 149.0, 268.0, 404.0, 698.0, 1162.0, 1915.0, 3318.0, 5966.0, 10689.0, 20106.0, 38827.0, 77675.0, 167373.0, 340696.0, 195171.0, 89380.0, 44197.0, 22413.0, 12100.0, 6625.0, 3730.0, 2172.0, 1268.0, 796.0, 459.0, 285.0, 175.0, 97.0, 53.0, 47.0, 21.0, 21.0, 14.0, 6.0, 4.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21875, -3.1199951171875, -3.021240234375, -2.9224853515625, -2.82373046875, -2.7249755859375, -2.626220703125, -2.5274658203125, -2.4287109375, -2.3299560546875, -2.231201171875, -2.1324462890625, -2.03369140625, -1.9349365234375, -1.836181640625, -1.7374267578125, -1.638671875, -1.5399169921875, -1.441162109375, -1.3424072265625, -1.24365234375, -1.1448974609375, -1.046142578125, -0.9473876953125, -0.8486328125, -0.7498779296875, -0.651123046875, -0.5523681640625, -0.45361328125, -0.3548583984375, -0.256103515625, -0.1573486328125, -0.05859375, 0.0401611328125, 0.138916015625, 0.2376708984375, 0.33642578125, 0.4351806640625, 0.533935546875, 0.6326904296875, 0.7314453125, 0.8302001953125, 0.928955078125, 1.0277099609375, 1.12646484375, 1.2252197265625, 1.323974609375, 1.4227294921875, 1.521484375, 1.6202392578125, 1.718994140625, 1.8177490234375, 1.91650390625, 2.0152587890625, 2.114013671875, 2.2127685546875, 2.3115234375, 2.4102783203125, 2.509033203125, 2.6077880859375, 2.70654296875, 2.8052978515625, 2.904052734375, 3.0028076171875, 3.1015625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 3.0, 6.0, 9.0, 7.0, 18.0, 13.0, 12.0, 14.0, 24.0, 27.0, 30.0, 32.0, 35.0, 32.0, 41.0, 42.0, 42.0, 51.0, 32.0, 54.0, 44.0, 41.0, 45.0, 41.0, 42.0, 27.0, 35.0, 26.0, 28.0, 21.0, 22.0, 21.0, 14.0, 16.0, 12.0, 7.0, 5.0, 5.0, 7.0, 3.0, 0.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.89453125, -3.773590087890625, -3.65264892578125, -3.531707763671875, -3.4107666015625, -3.289825439453125, -3.16888427734375, -3.047943115234375, -2.927001953125, -2.806060791015625, -2.68511962890625, -2.564178466796875, -2.4432373046875, -2.322296142578125, -2.20135498046875, -2.080413818359375, -1.95947265625, -1.838531494140625, -1.71759033203125, -1.596649169921875, -1.4757080078125, -1.354766845703125, -1.23382568359375, -1.112884521484375, -0.991943359375, -0.871002197265625, -0.75006103515625, -0.629119873046875, -0.5081787109375, -0.387237548828125, -0.26629638671875, -0.145355224609375, -0.0244140625, 0.096527099609375, 0.21746826171875, 0.338409423828125, 0.4593505859375, 0.580291748046875, 0.70123291015625, 0.822174072265625, 0.943115234375, 1.064056396484375, 1.18499755859375, 1.305938720703125, 1.4268798828125, 1.547821044921875, 1.66876220703125, 1.789703369140625, 1.91064453125, 2.031585693359375, 2.15252685546875, 2.273468017578125, 2.3944091796875, 2.515350341796875, 2.63629150390625, 2.757232666015625, 2.878173828125, 2.999114990234375, 3.12005615234375, 3.240997314453125, 3.3619384765625, 3.482879638671875, 3.60382080078125, 3.724761962890625, 3.845703125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 5.0, 6.0, 12.0, 9.0, 18.0, 20.0, 45.0, 62.0, 108.0, 139.0, 212.0, 390.0, 626.0, 1060.0, 1822.0, 3001.0, 5563.0, 10186.0, 20513.0, 44603.0, 123700.0, 433308.0, 261058.0, 77766.0, 31312.0, 15001.0, 7757.0, 4266.0, 2385.0, 1349.0, 876.0, 490.0, 313.0, 218.0, 117.0, 63.0, 46.0, 45.0, 34.0, 19.0, 9.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0244903564453125, -0.023743391036987305, -0.02299642562866211, -0.022249460220336914, -0.02150249481201172, -0.020755529403686523, -0.020008563995361328, -0.019261598587036133, -0.018514633178710938, -0.017767667770385742, -0.017020702362060547, -0.01627373695373535, -0.015526771545410156, -0.014779806137084961, -0.014032840728759766, -0.01328587532043457, -0.012538909912109375, -0.01179194450378418, -0.011044979095458984, -0.010298013687133789, -0.009551048278808594, -0.008804082870483398, -0.008057117462158203, -0.007310152053833008, -0.0065631866455078125, -0.005816221237182617, -0.005069255828857422, -0.0043222904205322266, -0.0035753250122070312, -0.002828359603881836, -0.0020813941955566406, -0.0013344287872314453, -0.00058746337890625, 0.0001595020294189453, 0.0009064674377441406, 0.001653432846069336, 0.0024003982543945312, 0.0031473636627197266, 0.003894329071044922, 0.004641294479370117, 0.0053882598876953125, 0.006135225296020508, 0.006882190704345703, 0.0076291561126708984, 0.008376121520996094, 0.009123086929321289, 0.009870052337646484, 0.01061701774597168, 0.011363983154296875, 0.01211094856262207, 0.012857913970947266, 0.013604879379272461, 0.014351844787597656, 0.015098810195922852, 0.015845775604248047, 0.016592741012573242, 0.017339706420898438, 0.018086671829223633, 0.018833637237548828, 0.019580602645874023, 0.02032756805419922, 0.021074533462524414, 0.02182149887084961, 0.022568464279174805, 0.0233154296875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 7.0, 4.0, 7.0, 15.0, 10.0, 14.0, 26.0, 37.0, 47.0, 49.0, 50.0, 78.0, 75.0, 101.0, 87.0, 82.0, 62.0, 36.0, 48.0, 35.0, 34.0, 28.0, 10.0, 11.0, 8.0, 12.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.119510650634766e-06, -8.8568776845932e-06, -8.594244718551636e-06, -8.33161175251007e-06, -8.068978786468506e-06, -7.806345820426941e-06, -7.543712854385376e-06, -7.281079888343811e-06, -7.018446922302246e-06, -6.755813956260681e-06, -6.493180990219116e-06, -6.230548024177551e-06, -5.967915058135986e-06, -5.705282092094421e-06, -5.4426491260528564e-06, -5.1800161600112915e-06, -4.9173831939697266e-06, -4.654750227928162e-06, -4.392117261886597e-06, -4.129484295845032e-06, -3.866851329803467e-06, -3.604218363761902e-06, -3.341585397720337e-06, -3.078952431678772e-06, -2.816319465637207e-06, -2.553686499595642e-06, -2.291053533554077e-06, -2.028420567512512e-06, -1.7657876014709473e-06, -1.5031546354293823e-06, -1.2405216693878174e-06, -9.778887033462524e-07, -7.152557373046875e-07, -4.5262277126312256e-07, -1.8998980522155762e-07, 7.264316082000732e-08, 3.3527612686157227e-07, 5.979090929031372e-07, 8.605420589447021e-07, 1.123175024986267e-06, 1.385807991027832e-06, 1.648440957069397e-06, 1.911073923110962e-06, 2.173706889152527e-06, 2.436339855194092e-06, 2.6989728212356567e-06, 2.9616057872772217e-06, 3.2242387533187866e-06, 3.4868717193603516e-06, 3.7495046854019165e-06, 4.0121376514434814e-06, 4.274770617485046e-06, 4.537403583526611e-06, 4.800036549568176e-06, 5.062669515609741e-06, 5.325302481651306e-06, 5.587935447692871e-06, 5.850568413734436e-06, 6.113201379776001e-06, 6.375834345817566e-06, 6.638467311859131e-06, 6.901100277900696e-06, 7.163733243942261e-06, 7.426366209983826e-06, 7.68899917602539e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 4.0, 6.0, 4.0, 13.0, 7.0, 18.0, 21.0, 24.0, 50.0, 54.0, 81.0, 93.0, 134.0, 204.0, 235.0, 354.0, 483.0, 680.0, 995.0, 1453.0, 2217.0, 3258.0, 4942.0, 7798.0, 12500.0, 21038.0, 36211.0, 66293.0, 138389.0, 293550.0, 227505.0, 101922.0, 51929.0, 29088.0, 16916.0, 10297.0, 6751.0, 4152.0, 2800.0, 1861.0, 1252.0, 847.0, 596.0, 434.0, 309.0, 207.0, 157.0, 129.0, 76.0, 65.0, 47.0, 31.0, 28.0, 26.0, 7.0, 6.0, 7.0, 6.0, 6.0, 4.0], "bins": [-0.0171661376953125, -0.016658306121826172, -0.016150474548339844, -0.015642642974853516, -0.015134811401367188, -0.01462697982788086, -0.014119148254394531, -0.013611316680908203, -0.013103485107421875, -0.012595653533935547, -0.012087821960449219, -0.01157999038696289, -0.011072158813476562, -0.010564327239990234, -0.010056495666503906, -0.009548664093017578, -0.00904083251953125, -0.008533000946044922, -0.008025169372558594, -0.007517337799072266, -0.0070095062255859375, -0.006501674652099609, -0.005993843078613281, -0.005486011505126953, -0.004978179931640625, -0.004470348358154297, -0.003962516784667969, -0.0034546852111816406, -0.0029468536376953125, -0.0024390220642089844, -0.0019311904907226562, -0.0014233589172363281, -0.00091552734375, -0.0004076957702636719, 0.00010013580322265625, 0.0006079673767089844, 0.0011157989501953125, 0.0016236305236816406, 0.0021314620971679688, 0.002639293670654297, 0.003147125244140625, 0.003654956817626953, 0.004162788391113281, 0.004670619964599609, 0.0051784515380859375, 0.005686283111572266, 0.006194114685058594, 0.006701946258544922, 0.00720977783203125, 0.007717609405517578, 0.008225440979003906, 0.008733272552490234, 0.009241104125976562, 0.00974893569946289, 0.010256767272949219, 0.010764598846435547, 0.011272430419921875, 0.011780261993408203, 0.012288093566894531, 0.01279592514038086, 0.013303756713867188, 0.013811588287353516, 0.014319419860839844, 0.014827251434326172, 0.0153350830078125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 5.0, 9.0, 12.0, 12.0, 18.0, 21.0, 23.0, 33.0, 29.0, 48.0, 50.0, 74.0, 115.0, 102.0, 96.0, 75.0, 46.0, 37.0, 30.0, 31.0, 19.0, 15.0, 12.0, 11.0, 12.0, 10.0, 10.0, 7.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.005950927734375, -0.0057541728019714355, -0.005557417869567871, -0.005360662937164307, -0.005163908004760742, -0.004967153072357178, -0.004770398139953613, -0.004573643207550049, -0.004376888275146484, -0.00418013334274292, -0.0039833784103393555, -0.003786623477935791, -0.0035898685455322266, -0.003393113613128662, -0.0031963586807250977, -0.002999603748321533, -0.0028028488159179688, -0.0026060938835144043, -0.00240933895111084, -0.0022125840187072754, -0.002015829086303711, -0.0018190741539001465, -0.001622319221496582, -0.0014255642890930176, -0.0012288093566894531, -0.0010320544242858887, -0.0008352994918823242, -0.0006385445594787598, -0.0004417896270751953, -0.00024503469467163086, -4.8279762268066406e-05, 0.00014847517013549805, 0.0003452301025390625, 0.000541985034942627, 0.0007387399673461914, 0.0009354948997497559, 0.0011322498321533203, 0.0013290047645568848, 0.0015257596969604492, 0.0017225146293640137, 0.0019192695617675781, 0.0021160244941711426, 0.002312779426574707, 0.0025095343589782715, 0.002706289291381836, 0.0029030442237854004, 0.003099799156188965, 0.0032965540885925293, 0.0034933090209960938, 0.003690063953399658, 0.0038868188858032227, 0.004083573818206787, 0.0042803287506103516, 0.004477083683013916, 0.0046738386154174805, 0.004870593547821045, 0.005067348480224609, 0.005264103412628174, 0.005460858345031738, 0.005657613277435303, 0.005854368209838867, 0.006051123142242432, 0.006247878074645996, 0.0064446330070495605, 0.006641387939453125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 5.0, 7.0, 7.0, 8.0, 10.0, 13.0, 13.0, 28.0, 26.0, 42.0, 59.0, 55.0, 75.0, 79.0, 100.0, 86.0, 69.0, 61.0, 44.0, 52.0, 36.0, 30.0, 18.0, 14.0, 14.0, 17.0, 5.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.669878959655762, -7.4376091957092285, -7.205339431762695, -6.973069667816162, -6.740799903869629, -6.508530139923096, -6.2762603759765625, -6.043990135192871, -5.811720848083496, -5.579451084136963, -5.34718132019043, -5.1149115562438965, -4.882641792297363, -4.65037202835083, -4.418102264404297, -4.1858320236206055, -3.9535622596740723, -3.721292495727539, -3.489022731781006, -3.2567529678344727, -3.0244832038879395, -2.7922134399414062, -2.559943437576294, -2.3276736736297607, -2.0954039096832275, -1.8631341457366943, -1.6308643817901611, -1.3985944986343384, -1.1663247346878052, -0.934054970741272, -0.7017850875854492, -0.469515323638916, -0.2372455596923828, -0.004975765943527222, 0.22729402780532837, 0.45956385135650635, 0.6918336153030396, 0.9241033792495728, 1.1563732624053955, 1.3886430263519287, 1.620912790298462, 1.8531825542449951, 2.0854523181915283, 2.3177223205566406, 2.549992084503174, 2.782261848449707, 3.0145316123962402, 3.2468013763427734, 3.4790711402893066, 3.71134090423584, 3.943610668182373, 4.175880432128906, 4.4081501960754395, 4.640419960021973, 4.872690200805664, 5.104959487915039, 5.3372297286987305, 5.569499492645264, 5.801769256591797, 6.03403902053833, 6.266308784484863, 6.4985785484313965, 6.73084831237793, 6.963118553161621, 7.195387840270996]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 7.0, 9.0, 10.0, 11.0, 18.0, 15.0, 19.0, 17.0, 30.0, 29.0, 19.0, 35.0, 31.0, 38.0, 32.0, 43.0, 42.0, 40.0, 41.0, 47.0, 39.0, 36.0, 36.0, 33.0, 40.0, 36.0, 32.0, 26.0, 25.0, 19.0, 24.0, 19.0, 12.0, 13.0, 15.0, 12.0, 12.0, 10.0, 3.0, 6.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97727108001709, -4.8003034591674805, -4.623335838317871, -4.4463677406311035, -4.269400119781494, -4.092432498931885, -3.9154648780822754, -3.738497018814087, -3.5615291595458984, -3.384561538696289, -3.2075936794281006, -3.030626058578491, -2.8536581993103027, -2.6766905784606934, -2.499722957611084, -2.3227550983428955, -2.145787477493286, -1.9688197374343872, -1.7918519973754883, -1.614884376525879, -1.4379165172576904, -1.260948896408081, -1.0839811563491821, -0.9070134162902832, -0.7300456762313843, -0.5530779361724854, -0.3761102259159088, -0.19914251565933228, -0.02217477560043335, 0.15479296445846558, 0.3317606449127197, 0.5087283849716187, 0.6856961250305176, 0.8626638650894165, 1.0396316051483154, 1.2165992259979248, 1.3935670852661133, 1.5705347061157227, 1.7475024461746216, 1.9244701862335205, 2.101438045501709, 2.2784056663513184, 2.455373525619507, 2.632341146469116, 2.8093090057373047, 2.986276626586914, 3.1632442474365234, 3.340212106704712, 3.5171797275543213, 3.6941473484039307, 3.871115207672119, 4.0480828285217285, 4.225050449371338, 4.4020185470581055, 4.578986167907715, 4.755953788757324, 4.932921409606934, 5.109889030456543, 5.286856651306152, 5.46382474899292, 5.640792369842529, 5.817759990692139, 5.994727611541748, 6.171695709228516, 6.348663330078125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 3.0, 10.0, 16.0, 11.0, 20.0, 43.0, 49.0, 81.0, 114.0, 141.0, 199.0, 283.0, 398.0, 648.0, 878.0, 1258.0, 1715.0, 2556.0, 3785.0, 5650.0, 8316.0, 12525.0, 18907.0, 28681.0, 44883.0, 71844.0, 117892.0, 178869.0, 190595.0, 132210.0, 80587.0, 49884.0, 31990.0, 20887.0, 13773.0, 9155.0, 6306.0, 4228.0, 2826.0, 1974.0, 1349.0, 948.0, 649.0, 454.0, 287.0, 212.0, 144.0, 112.0, 62.0, 38.0, 39.0, 24.0, 21.0, 16.0, 10.0, 5.0, 3.0, 2.0, 4.0, 1.0], "bins": [-8.4140625, -8.152099609375, -7.89013671875, -7.628173828125, -7.3662109375, -7.104248046875, -6.84228515625, -6.580322265625, -6.318359375, -6.056396484375, -5.79443359375, -5.532470703125, -5.2705078125, -5.008544921875, -4.74658203125, -4.484619140625, -4.22265625, -3.960693359375, -3.69873046875, -3.436767578125, -3.1748046875, -2.912841796875, -2.65087890625, -2.388916015625, -2.126953125, -1.864990234375, -1.60302734375, -1.341064453125, -1.0791015625, -0.817138671875, -0.55517578125, -0.293212890625, -0.03125, 0.230712890625, 0.49267578125, 0.754638671875, 1.0166015625, 1.278564453125, 1.54052734375, 1.802490234375, 2.064453125, 2.326416015625, 2.58837890625, 2.850341796875, 3.1123046875, 3.374267578125, 3.63623046875, 3.898193359375, 4.16015625, 4.422119140625, 4.68408203125, 4.946044921875, 5.2080078125, 5.469970703125, 5.73193359375, 5.993896484375, 6.255859375, 6.517822265625, 6.77978515625, 7.041748046875, 7.3037109375, 7.565673828125, 7.82763671875, 8.089599609375, 8.3515625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 7.0, 5.0, 7.0, 9.0, 12.0, 5.0, 14.0, 21.0, 13.0, 15.0, 25.0, 28.0, 21.0, 37.0, 30.0, 34.0, 36.0, 38.0, 31.0, 42.0, 48.0, 47.0, 42.0, 43.0, 38.0, 27.0, 43.0, 34.0, 37.0, 23.0, 29.0, 22.0, 16.0, 20.0, 23.0, 13.0, 13.0, 9.0, 12.0, 14.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.31640625, -5.1435546875, -4.970703125, -4.7978515625, -4.625, -4.4521484375, -4.279296875, -4.1064453125, -3.93359375, -3.7607421875, -3.587890625, -3.4150390625, -3.2421875, -3.0693359375, -2.896484375, -2.7236328125, -2.55078125, -2.3779296875, -2.205078125, -2.0322265625, -1.859375, -1.6865234375, -1.513671875, -1.3408203125, -1.16796875, -0.9951171875, -0.822265625, -0.6494140625, -0.4765625, -0.3037109375, -0.130859375, 0.0419921875, 0.21484375, 0.3876953125, 0.560546875, 0.7333984375, 0.90625, 1.0791015625, 1.251953125, 1.4248046875, 1.59765625, 1.7705078125, 1.943359375, 2.1162109375, 2.2890625, 2.4619140625, 2.634765625, 2.8076171875, 2.98046875, 3.1533203125, 3.326171875, 3.4990234375, 3.671875, 3.8447265625, 4.017578125, 4.1904296875, 4.36328125, 4.5361328125, 4.708984375, 4.8818359375, 5.0546875, 5.2275390625, 5.400390625, 5.5732421875, 5.74609375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 10.0, 17.0, 27.0, 38.0, 45.0, 79.0, 113.0, 186.0, 295.0, 392.0, 680.0, 968.0, 1431.0, 2154.0, 3261.0, 5057.0, 7667.0, 11728.0, 18466.0, 30490.0, 50714.0, 87807.0, 152047.0, 217700.0, 183255.0, 110404.0, 62808.0, 37371.0, 22634.0, 14130.0, 9226.0, 5785.0, 3895.0, 2645.0, 1696.0, 1127.0, 774.0, 481.0, 319.0, 226.0, 140.0, 87.0, 69.0, 45.0, 21.0, 15.0, 14.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.8580322265625, -8.559814453125, -8.2615966796875, -7.96337890625, -7.6651611328125, -7.366943359375, -7.0687255859375, -6.7705078125, -6.4722900390625, -6.174072265625, -5.8758544921875, -5.57763671875, -5.2794189453125, -4.981201171875, -4.6829833984375, -4.384765625, -4.0865478515625, -3.788330078125, -3.4901123046875, -3.19189453125, -2.8936767578125, -2.595458984375, -2.2972412109375, -1.9990234375, -1.7008056640625, -1.402587890625, -1.1043701171875, -0.80615234375, -0.5079345703125, -0.209716796875, 0.0885009765625, 0.38671875, 0.6849365234375, 0.983154296875, 1.2813720703125, 1.57958984375, 1.8778076171875, 2.176025390625, 2.4742431640625, 2.7724609375, 3.0706787109375, 3.368896484375, 3.6671142578125, 3.96533203125, 4.2635498046875, 4.561767578125, 4.8599853515625, 5.158203125, 5.4564208984375, 5.754638671875, 6.0528564453125, 6.35107421875, 6.6492919921875, 6.947509765625, 7.2457275390625, 7.5439453125, 7.8421630859375, 8.140380859375, 8.4385986328125, 8.73681640625, 9.0350341796875, 9.333251953125, 9.6314697265625, 9.9296875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 9.0, 7.0, 9.0, 12.0, 15.0, 15.0, 18.0, 22.0, 29.0, 26.0, 24.0, 37.0, 34.0, 38.0, 39.0, 53.0, 33.0, 45.0, 46.0, 42.0, 49.0, 38.0, 44.0, 36.0, 36.0, 39.0, 23.0, 23.0, 23.0, 16.0, 30.0, 18.0, 15.0, 5.0, 12.0, 13.0, 7.0, 7.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.951171875, -3.83111572265625, -3.7110595703125, -3.59100341796875, -3.470947265625, -3.35089111328125, -3.2308349609375, -3.11077880859375, -2.99072265625, -2.87066650390625, -2.7506103515625, -2.63055419921875, -2.510498046875, -2.39044189453125, -2.2703857421875, -2.15032958984375, -2.0302734375, -1.91021728515625, -1.7901611328125, -1.67010498046875, -1.550048828125, -1.42999267578125, -1.3099365234375, -1.18988037109375, -1.06982421875, -0.94976806640625, -0.8297119140625, -0.70965576171875, -0.589599609375, -0.46954345703125, -0.3494873046875, -0.22943115234375, -0.109375, 0.01068115234375, 0.1307373046875, 0.25079345703125, 0.370849609375, 0.49090576171875, 0.6109619140625, 0.73101806640625, 0.85107421875, 0.97113037109375, 1.0911865234375, 1.21124267578125, 1.331298828125, 1.45135498046875, 1.5714111328125, 1.69146728515625, 1.8115234375, 1.93157958984375, 2.0516357421875, 2.17169189453125, 2.291748046875, 2.41180419921875, 2.5318603515625, 2.65191650390625, 2.77197265625, 2.89202880859375, 3.0120849609375, 3.13214111328125, 3.252197265625, 3.37225341796875, 3.4923095703125, 3.61236572265625, 3.732421875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 10.0, 10.0, 24.0, 35.0, 50.0, 100.0, 127.0, 204.0, 352.0, 547.0, 887.0, 1466.0, 2364.0, 3954.0, 6584.0, 10981.0, 20294.0, 39273.0, 89125.0, 238968.0, 354969.0, 151312.0, 60517.0, 29014.0, 15409.0, 8676.0, 5223.0, 3012.0, 1953.0, 1173.0, 736.0, 428.0, 298.0, 176.0, 120.0, 63.0, 55.0, 21.0, 22.0, 10.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.349609375, -1.3018798828125, -1.254150390625, -1.2064208984375, -1.15869140625, -1.1109619140625, -1.063232421875, -1.0155029296875, -0.9677734375, -0.9200439453125, -0.872314453125, -0.8245849609375, -0.77685546875, -0.7291259765625, -0.681396484375, -0.6336669921875, -0.5859375, -0.5382080078125, -0.490478515625, -0.4427490234375, -0.39501953125, -0.3472900390625, -0.299560546875, -0.2518310546875, -0.2041015625, -0.1563720703125, -0.108642578125, -0.0609130859375, -0.01318359375, 0.0345458984375, 0.082275390625, 0.1300048828125, 0.177734375, 0.2254638671875, 0.273193359375, 0.3209228515625, 0.36865234375, 0.4163818359375, 0.464111328125, 0.5118408203125, 0.5595703125, 0.6072998046875, 0.655029296875, 0.7027587890625, 0.75048828125, 0.7982177734375, 0.845947265625, 0.8936767578125, 0.94140625, 0.9891357421875, 1.036865234375, 1.0845947265625, 1.13232421875, 1.1800537109375, 1.227783203125, 1.2755126953125, 1.3232421875, 1.3709716796875, 1.418701171875, 1.4664306640625, 1.51416015625, 1.5618896484375, 1.609619140625, 1.6573486328125, 1.705078125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 7.0, 1.0, 5.0, 3.0, 11.0, 16.0, 20.0, 25.0, 23.0, 29.0, 37.0, 54.0, 59.0, 77.0, 65.0, 92.0, 86.0, 92.0, 59.0, 54.0, 37.0, 19.0, 38.0, 16.0, 19.0, 12.0, 12.0, 6.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.256601333618164e-05, -8.952617645263672e-05, -8.64863395690918e-05, -8.344650268554688e-05, -8.040666580200195e-05, -7.736682891845703e-05, -7.432699203491211e-05, -7.128715515136719e-05, -6.824731826782227e-05, -6.520748138427734e-05, -6.216764450073242e-05, -5.91278076171875e-05, -5.608797073364258e-05, -5.3048133850097656e-05, -5.0008296966552734e-05, -4.696846008300781e-05, -4.392862319946289e-05, -4.088878631591797e-05, -3.784894943237305e-05, -3.4809112548828125e-05, -3.17692756652832e-05, -2.872943878173828e-05, -2.568960189819336e-05, -2.2649765014648438e-05, -1.9609928131103516e-05, -1.6570091247558594e-05, -1.3530254364013672e-05, -1.049041748046875e-05, -7.450580596923828e-06, -4.410743713378906e-06, -1.3709068298339844e-06, 1.6689300537109375e-06, 4.708766937255859e-06, 7.748603820800781e-06, 1.0788440704345703e-05, 1.3828277587890625e-05, 1.6868114471435547e-05, 1.990795135498047e-05, 2.294778823852539e-05, 2.5987625122070312e-05, 2.9027462005615234e-05, 3.2067298889160156e-05, 3.510713577270508e-05, 3.814697265625e-05, 4.118680953979492e-05, 4.4226646423339844e-05, 4.7266483306884766e-05, 5.030632019042969e-05, 5.334615707397461e-05, 5.638599395751953e-05, 5.942583084106445e-05, 6.246566772460938e-05, 6.55055046081543e-05, 6.854534149169922e-05, 7.158517837524414e-05, 7.462501525878906e-05, 7.766485214233398e-05, 8.07046890258789e-05, 8.374452590942383e-05, 8.678436279296875e-05, 8.982419967651367e-05, 9.28640365600586e-05, 9.590387344360352e-05, 9.894371032714844e-05, 0.00010198354721069336]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 14.0, 9.0, 19.0, 19.0, 47.0, 72.0, 101.0, 150.0, 221.0, 380.0, 547.0, 867.0, 1360.0, 2092.0, 3463.0, 5536.0, 9301.0, 16148.0, 29832.0, 62872.0, 155715.0, 336002.0, 238182.0, 93139.0, 41068.0, 20962.0, 11900.0, 6960.0, 4238.0, 2664.0, 1665.0, 1089.0, 686.0, 434.0, 264.0, 188.0, 114.0, 74.0, 54.0, 38.0, 25.0, 13.0, 11.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3857421875, -1.3433990478515625, -1.301055908203125, -1.2587127685546875, -1.21636962890625, -1.1740264892578125, -1.131683349609375, -1.0893402099609375, -1.0469970703125, -1.0046539306640625, -0.962310791015625, -0.9199676513671875, -0.87762451171875, -0.8352813720703125, -0.792938232421875, -0.7505950927734375, -0.708251953125, -0.6659088134765625, -0.623565673828125, -0.5812225341796875, -0.53887939453125, -0.4965362548828125, -0.454193115234375, -0.4118499755859375, -0.3695068359375, -0.3271636962890625, -0.284820556640625, -0.2424774169921875, -0.20013427734375, -0.1577911376953125, -0.115447998046875, -0.0731048583984375, -0.03076171875, 0.0115814208984375, 0.053924560546875, 0.0962677001953125, 0.13861083984375, 0.1809539794921875, 0.223297119140625, 0.2656402587890625, 0.3079833984375, 0.3503265380859375, 0.392669677734375, 0.4350128173828125, 0.47735595703125, 0.5196990966796875, 0.562042236328125, 0.6043853759765625, 0.646728515625, 0.6890716552734375, 0.731414794921875, 0.7737579345703125, 0.81610107421875, 0.8584442138671875, 0.900787353515625, 0.9431304931640625, 0.9854736328125, 1.0278167724609375, 1.070159912109375, 1.1125030517578125, 1.15484619140625, 1.1971893310546875, 1.239532470703125, 1.2818756103515625, 1.32421875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 5.0, 8.0, 12.0, 7.0, 17.0, 16.0, 15.0, 22.0, 16.0, 31.0, 39.0, 47.0, 38.0, 62.0, 53.0, 76.0, 74.0, 72.0, 79.0, 48.0, 48.0, 36.0, 38.0, 23.0, 26.0, 13.0, 9.0, 16.0, 9.0, 9.0, 4.0, 7.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.458984375, -0.4451560974121094, -0.43132781982421875, -0.4174995422363281, -0.4036712646484375, -0.3898429870605469, -0.37601470947265625, -0.3621864318847656, -0.348358154296875, -0.3345298767089844, -0.32070159912109375, -0.3068733215332031, -0.2930450439453125, -0.2792167663574219, -0.26538848876953125, -0.2515602111816406, -0.23773193359375, -0.22390365600585938, -0.21007537841796875, -0.19624710083007812, -0.1824188232421875, -0.16859054565429688, -0.15476226806640625, -0.14093399047851562, -0.127105712890625, -0.11327743530273438, -0.09944915771484375, -0.08562088012695312, -0.0717926025390625, -0.057964324951171875, -0.04413604736328125, -0.030307769775390625, -0.0164794921875, -0.002651214599609375, 0.01117706298828125, 0.025005340576171875, 0.0388336181640625, 0.052661895751953125, 0.06649017333984375, 0.08031845092773438, 0.094146728515625, 0.10797500610351562, 0.12180328369140625, 0.13563156127929688, 0.1494598388671875, 0.16328811645507812, 0.17711639404296875, 0.19094467163085938, 0.20477294921875, 0.21860122680664062, 0.23242950439453125, 0.24625778198242188, 0.2600860595703125, 0.2739143371582031, 0.28774261474609375, 0.3015708923339844, 0.315399169921875, 0.3292274475097656, 0.34305572509765625, 0.3568840026855469, 0.3707122802734375, 0.3845405578613281, 0.39836883544921875, 0.4121971130371094, 0.426025390625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 13.0, 14.0, 18.0, 19.0, 27.0, 32.0, 38.0, 58.0, 62.0, 55.0, 62.0, 86.0, 69.0, 67.0, 64.0, 56.0, 47.0, 36.0, 27.0, 26.0, 21.0, 17.0, 15.0, 7.0, 6.0, 3.0, 5.0, 3.0, 7.0, 7.0, 7.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.819007396697998, -5.612675189971924, -5.40634298324585, -5.200010299682617, -4.993678092956543, -4.787345886230469, -4.5810136795043945, -4.37468147277832, -4.168349266052246, -3.962017059326172, -3.7556846141815186, -3.5493524074554443, -3.34302020072937, -3.136687755584717, -2.9303555488586426, -2.7240233421325684, -2.517690896987915, -2.311358690261841, -2.1050262451171875, -1.8986940383911133, -1.692361831665039, -1.4860295057296753, -1.2796971797943115, -1.0733649730682373, -0.8670326471328735, -0.6607003808021545, -0.45436808466911316, -0.24803578853607178, -0.04170352220535278, 0.1646287441253662, 0.37096107006073, 0.5772932767868042, 0.783625602722168, 0.989957869052887, 1.196290135383606, 1.4026224613189697, 1.608954668045044, 1.8152869939804077, 2.0216193199157715, 2.2279515266418457, 2.43428373336792, 2.640615940093994, 2.8469483852386475, 3.0532805919647217, 3.259612798690796, 3.465945243835449, 3.6722774505615234, 3.8786096572875977, 4.084941864013672, 4.291274070739746, 4.49760627746582, 4.7039384841918945, 4.910271167755127, 5.116603374481201, 5.322935581207275, 5.52926778793335, 5.735600471496582, 5.941932678222656, 6.1482648849487305, 6.354597091674805, 6.560929775238037, 6.767261981964111, 6.9735941886901855, 7.17992639541626, 7.386258602142334]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 12.0, 13.0, 18.0, 14.0, 10.0, 24.0, 21.0, 34.0, 30.0, 38.0, 25.0, 36.0, 44.0, 48.0, 35.0, 45.0, 39.0, 48.0, 41.0, 40.0, 38.0, 36.0, 34.0, 35.0, 42.0, 40.0, 25.0, 14.0, 20.0, 13.0, 6.0, 17.0, 13.0, 14.0, 5.0, 8.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.596944808959961, -5.398220062255859, -5.199495315551758, -5.000770568847656, -4.8020453453063965, -4.603320598602295, -4.404595851898193, -4.205871105194092, -4.007145881652832, -3.8084211349487305, -3.60969614982605, -3.4109714031219482, -3.2122464179992676, -3.013521671295166, -2.8147969245910645, -2.616072177886963, -2.4173474311828613, -2.2186226844787598, -2.019897699356079, -1.8211729526519775, -1.6224480867385864, -1.4237232208251953, -1.2249984741210938, -1.0262736082077026, -0.8275487422943115, -0.6288238763809204, -0.4300990700721741, -0.23137426376342773, -0.03264939785003662, 0.1660754680633545, 0.36480021476745605, 0.5635250806808472, 0.7622504234313965, 0.9609752893447876, 1.1597001552581787, 1.3584249019622803, 1.5571497678756714, 1.7558746337890625, 1.954599380493164, 2.1533241271972656, 2.3520491123199463, 2.550773859024048, 2.7494988441467285, 2.94822359085083, 3.1469483375549316, 3.3456733226776123, 3.544398069381714, 3.7431230545043945, 3.941847801208496, 4.140572547912598, 4.339297294616699, 4.538022041320801, 4.7367472648620605, 4.935472011566162, 5.134196758270264, 5.332921504974365, 5.531646728515625, 5.730371475219727, 5.929096221923828, 6.12782096862793, 6.3265461921691895, 6.525270938873291, 6.723995685577393, 6.922720432281494, 7.121445178985596]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 13.0, 16.0, 29.0, 41.0, 46.0, 91.0, 169.0, 212.0, 372.0, 547.0, 880.0, 1362.0, 2205.0, 3645.0, 5788.0, 9629.0, 16273.0, 27695.0, 49441.0, 91648.0, 196082.0, 605745.0, 1624237.0, 1006015.0, 283732.0, 118218.0, 61730.0, 34625.0, 20287.0, 12221.0, 7715.0, 4842.0, 3011.0, 1946.0, 1243.0, 858.0, 531.0, 353.0, 229.0, 180.0, 114.0, 83.0, 46.0, 51.0, 25.0, 19.0, 13.0, 13.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.421875, -8.12841796875, -7.8349609375, -7.54150390625, -7.248046875, -6.95458984375, -6.6611328125, -6.36767578125, -6.07421875, -5.78076171875, -5.4873046875, -5.19384765625, -4.900390625, -4.60693359375, -4.3134765625, -4.02001953125, -3.7265625, -3.43310546875, -3.1396484375, -2.84619140625, -2.552734375, -2.25927734375, -1.9658203125, -1.67236328125, -1.37890625, -1.08544921875, -0.7919921875, -0.49853515625, -0.205078125, 0.08837890625, 0.3818359375, 0.67529296875, 0.96875, 1.26220703125, 1.5556640625, 1.84912109375, 2.142578125, 2.43603515625, 2.7294921875, 3.02294921875, 3.31640625, 3.60986328125, 3.9033203125, 4.19677734375, 4.490234375, 4.78369140625, 5.0771484375, 5.37060546875, 5.6640625, 5.95751953125, 6.2509765625, 6.54443359375, 6.837890625, 7.13134765625, 7.4248046875, 7.71826171875, 8.01171875, 8.30517578125, 8.5986328125, 8.89208984375, 9.185546875, 9.47900390625, 9.7724609375, 10.06591796875, 10.359375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 3.0, 8.0, 0.0, 3.0, 9.0, 11.0, 10.0, 11.0, 13.0, 12.0, 14.0, 24.0, 26.0, 30.0, 20.0, 27.0, 33.0, 42.0, 52.0, 39.0, 39.0, 41.0, 39.0, 48.0, 40.0, 44.0, 33.0, 39.0, 28.0, 32.0, 29.0, 39.0, 28.0, 24.0, 16.0, 19.0, 14.0, 8.0, 8.0, 10.0, 10.0, 14.0, 3.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.2783203125, -4.107421875, -3.9365234375, -3.765625, -3.5947265625, -3.423828125, -3.2529296875, -3.08203125, -2.9111328125, -2.740234375, -2.5693359375, -2.3984375, -2.2275390625, -2.056640625, -1.8857421875, -1.71484375, -1.5439453125, -1.373046875, -1.2021484375, -1.03125, -0.8603515625, -0.689453125, -0.5185546875, -0.34765625, -0.1767578125, -0.005859375, 0.1650390625, 0.3359375, 0.5068359375, 0.677734375, 0.8486328125, 1.01953125, 1.1904296875, 1.361328125, 1.5322265625, 1.703125, 1.8740234375, 2.044921875, 2.2158203125, 2.38671875, 2.5576171875, 2.728515625, 2.8994140625, 3.0703125, 3.2412109375, 3.412109375, 3.5830078125, 3.75390625, 3.9248046875, 4.095703125, 4.2666015625, 4.4375, 4.6083984375, 4.779296875, 4.9501953125, 5.12109375, 5.2919921875, 5.462890625, 5.6337890625, 5.8046875, 5.9755859375, 6.146484375, 6.3173828125, 6.48828125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 25.0, 38.0, 48.0, 66.0, 105.0, 157.0, 206.0, 296.0, 462.0, 671.0, 1077.0, 1471.0, 2445.0, 3771.0, 5765.0, 9168.0, 14538.0, 24631.0, 41350.0, 71546.0, 130005.0, 252490.0, 544131.0, 1288489.0, 956398.0, 400023.0, 195684.0, 103420.0, 58137.0, 33637.0, 20355.0, 12223.0, 7588.0, 4824.0, 3129.0, 2009.0, 1290.0, 856.0, 536.0, 418.0, 252.0, 184.0, 120.0, 74.0, 52.0, 32.0, 29.0, 16.0, 11.0, 10.0, 5.0, 1.0, 2.0, 2.0], "bins": [-8.1328125, -7.89227294921875, -7.6517333984375, -7.41119384765625, -7.170654296875, -6.93011474609375, -6.6895751953125, -6.44903564453125, -6.20849609375, -5.96795654296875, -5.7274169921875, -5.48687744140625, -5.246337890625, -5.00579833984375, -4.7652587890625, -4.52471923828125, -4.2841796875, -4.04364013671875, -3.8031005859375, -3.56256103515625, -3.322021484375, -3.08148193359375, -2.8409423828125, -2.60040283203125, -2.35986328125, -2.11932373046875, -1.8787841796875, -1.63824462890625, -1.397705078125, -1.15716552734375, -0.9166259765625, -0.67608642578125, -0.435546875, -0.19500732421875, 0.0455322265625, 0.28607177734375, 0.526611328125, 0.76715087890625, 1.0076904296875, 1.24822998046875, 1.48876953125, 1.72930908203125, 1.9698486328125, 2.21038818359375, 2.450927734375, 2.69146728515625, 2.9320068359375, 3.17254638671875, 3.4130859375, 3.65362548828125, 3.8941650390625, 4.13470458984375, 4.375244140625, 4.61578369140625, 4.8563232421875, 5.09686279296875, 5.33740234375, 5.57794189453125, 5.8184814453125, 6.05902099609375, 6.299560546875, 6.54010009765625, 6.7806396484375, 7.02117919921875, 7.26171875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 7.0, 4.0, 19.0, 16.0, 13.0, 24.0, 25.0, 39.0, 64.0, 72.0, 66.0, 83.0, 102.0, 127.0, 140.0, 189.0, 237.0, 304.0, 376.0, 376.0, 312.0, 275.0, 200.0, 171.0, 145.0, 131.0, 100.0, 94.0, 72.0, 56.0, 52.0, 41.0, 21.0, 19.0, 21.0, 14.0, 14.0, 16.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.96484375, -2.86944580078125, -2.7740478515625, -2.67864990234375, -2.583251953125, -2.48785400390625, -2.3924560546875, -2.29705810546875, -2.20166015625, -2.10626220703125, -2.0108642578125, -1.91546630859375, -1.820068359375, -1.72467041015625, -1.6292724609375, -1.53387451171875, -1.4384765625, -1.34307861328125, -1.2476806640625, -1.15228271484375, -1.056884765625, -0.96148681640625, -0.8660888671875, -0.77069091796875, -0.67529296875, -0.57989501953125, -0.4844970703125, -0.38909912109375, -0.293701171875, -0.19830322265625, -0.1029052734375, -0.00750732421875, 0.087890625, 0.18328857421875, 0.2786865234375, 0.37408447265625, 0.469482421875, 0.56488037109375, 0.6602783203125, 0.75567626953125, 0.85107421875, 0.94647216796875, 1.0418701171875, 1.13726806640625, 1.232666015625, 1.32806396484375, 1.4234619140625, 1.51885986328125, 1.6142578125, 1.70965576171875, 1.8050537109375, 1.90045166015625, 1.995849609375, 2.09124755859375, 2.1866455078125, 2.28204345703125, 2.37744140625, 2.47283935546875, 2.5682373046875, 2.66363525390625, 2.759033203125, 2.85443115234375, 2.9498291015625, 3.04522705078125, 3.140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 12.0, 6.0, 6.0, 12.0, 17.0, 20.0, 22.0, 25.0, 33.0, 51.0, 54.0, 64.0, 69.0, 93.0, 83.0, 82.0, 54.0, 53.0, 47.0, 35.0, 33.0, 22.0, 17.0, 20.0, 8.0, 12.0, 4.0, 10.0, 9.0, 5.0, 5.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.8986358642578125, -6.67137336730957, -6.44411039352417, -6.216847896575928, -5.9895853996276855, -5.762322425842285, -5.535059928894043, -5.307797431945801, -5.080534934997559, -4.853272438049316, -4.626009464263916, -4.398746967315674, -4.171484470367432, -3.9442217350006104, -3.716958999633789, -3.489696502685547, -3.2624335289001465, -3.035170793533325, -2.807908296585083, -2.5806455612182617, -2.3533830642700195, -2.1261203289031982, -1.898857593536377, -1.6715949773788452, -1.4443323612213135, -1.2170697450637817, -0.9898070693016052, -0.7625443935394287, -0.535281777381897, -0.30801916122436523, -0.08075642585754395, 0.1465061902999878, 0.37376880645751953, 0.6010314226150513, 0.8282940983772278, 1.0555567741394043, 1.282819390296936, 1.5100820064544678, 1.737344741821289, 1.9646073579788208, 2.1918699741363525, 2.419132709503174, 2.646395206451416, 2.8736579418182373, 3.1009206771850586, 3.328183174133301, 3.555445909500122, 3.7827086448669434, 4.0099711418151855, 4.237233638763428, 4.464496612548828, 4.69175910949707, 4.9190216064453125, 5.146284103393555, 5.373547077178955, 5.600809574127197, 5.828072547912598, 6.05533504486084, 6.28259801864624, 6.509860515594482, 6.737123012542725, 6.964385986328125, 7.191648483276367, 7.418910980224609, 7.646173477172852]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 4.0, 9.0, 0.0, 1.0, 6.0, 4.0, 7.0, 7.0, 3.0, 11.0, 11.0, 13.0, 16.0, 18.0, 16.0, 20.0, 20.0, 25.0, 32.0, 32.0, 48.0, 37.0, 38.0, 38.0, 44.0, 29.0, 38.0, 29.0, 44.0, 49.0, 39.0, 42.0, 27.0, 35.0, 30.0, 27.0, 32.0, 11.0, 23.0, 14.0, 10.0, 18.0, 15.0, 10.0, 10.0, 3.0, 5.0, 7.0, 6.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.312921524047852, -5.121008396148682, -4.9290947914123535, -4.737181663513184, -4.5452680587768555, -4.3533549308776855, -4.161441802978516, -3.9695281982421875, -3.7776150703430176, -3.5857017040252686, -3.3937883377075195, -3.2018752098083496, -3.0099618434906006, -2.8180484771728516, -2.6261351108551025, -2.4342217445373535, -2.2423083782196045, -2.0503950119018555, -1.858481764793396, -1.666568398475647, -1.4746551513671875, -1.2827417850494385, -1.0908284187316895, -0.89891517162323, -0.707001805305481, -0.5150884985923767, -0.3231751620769501, -0.13126182556152344, 0.06065148115158081, 0.25256478786468506, 0.4444781541824341, 0.6363914012908936, 0.8283047676086426, 1.0202181339263916, 1.212131381034851, 1.4040447473526, 1.5959579944610596, 1.7878713607788086, 1.9797847270965576, 2.1716980934143066, 2.3636112213134766, 2.5555245876312256, 2.7474379539489746, 2.9393510818481445, 3.1312644481658936, 3.3231778144836426, 3.5150911808013916, 3.7070045471191406, 3.8989179134368896, 4.090831279754639, 4.282744407653809, 4.474658012390137, 4.666571140289307, 4.858484268188477, 5.050397872924805, 5.242311000823975, 5.434224605560303, 5.626137733459473, 5.818051338195801, 6.009964466094971, 6.201878070831299, 6.393791198730469, 6.585704803466797, 6.777617931365967, 6.969531059265137]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 14.0, 26.0, 30.0, 57.0, 69.0, 110.0, 147.0, 246.0, 311.0, 484.0, 703.0, 1019.0, 1528.0, 2130.0, 3263.0, 4844.0, 7063.0, 10738.0, 15966.0, 24368.0, 37752.0, 59441.0, 93318.0, 145160.0, 202556.0, 155739.0, 99562.0, 63687.0, 40247.0, 26253.0, 17183.0, 11329.0, 7375.0, 5052.0, 3453.0, 2362.0, 1614.0, 1039.0, 717.0, 517.0, 344.0, 229.0, 175.0, 122.0, 75.0, 45.0, 25.0, 26.0, 19.0, 11.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.099609375, -2.033111572265625, -1.96661376953125, -1.900115966796875, -1.8336181640625, -1.767120361328125, -1.70062255859375, -1.634124755859375, -1.567626953125, -1.501129150390625, -1.43463134765625, -1.368133544921875, -1.3016357421875, -1.235137939453125, -1.16864013671875, -1.102142333984375, -1.03564453125, -0.969146728515625, -0.90264892578125, -0.836151123046875, -0.7696533203125, -0.703155517578125, -0.63665771484375, -0.570159912109375, -0.503662109375, -0.437164306640625, -0.37066650390625, -0.304168701171875, -0.2376708984375, -0.171173095703125, -0.10467529296875, -0.038177490234375, 0.0283203125, 0.094818115234375, 0.16131591796875, 0.227813720703125, 0.2943115234375, 0.360809326171875, 0.42730712890625, 0.493804931640625, 0.560302734375, 0.626800537109375, 0.69329833984375, 0.759796142578125, 0.8262939453125, 0.892791748046875, 0.95928955078125, 1.025787353515625, 1.09228515625, 1.158782958984375, 1.22528076171875, 1.291778564453125, 1.3582763671875, 1.424774169921875, 1.49127197265625, 1.557769775390625, 1.624267578125, 1.690765380859375, 1.75726318359375, 1.823760986328125, 1.8902587890625, 1.956756591796875, 2.02325439453125, 2.089752197265625, 2.15625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 8.0, 1.0, 6.0, 3.0, 5.0, 9.0, 8.0, 5.0, 5.0, 13.0, 13.0, 15.0, 20.0, 12.0, 29.0, 28.0, 27.0, 33.0, 46.0, 40.0, 36.0, 33.0, 36.0, 37.0, 41.0, 38.0, 41.0, 39.0, 50.0, 37.0, 29.0, 36.0, 25.0, 29.0, 30.0, 20.0, 17.0, 15.0, 7.0, 23.0, 9.0, 13.0, 15.0, 3.0, 7.0, 6.0, 2.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.40325927734375, -5.2088623046875, -5.01446533203125, -4.820068359375, -4.62567138671875, -4.4312744140625, -4.23687744140625, -4.04248046875, -3.84808349609375, -3.6536865234375, -3.45928955078125, -3.264892578125, -3.07049560546875, -2.8760986328125, -2.68170166015625, -2.4873046875, -2.29290771484375, -2.0985107421875, -1.90411376953125, -1.709716796875, -1.51531982421875, -1.3209228515625, -1.12652587890625, -0.93212890625, -0.73773193359375, -0.5433349609375, -0.34893798828125, -0.154541015625, 0.03985595703125, 0.2342529296875, 0.42864990234375, 0.623046875, 0.81744384765625, 1.0118408203125, 1.20623779296875, 1.400634765625, 1.59503173828125, 1.7894287109375, 1.98382568359375, 2.17822265625, 2.37261962890625, 2.5670166015625, 2.76141357421875, 2.955810546875, 3.15020751953125, 3.3446044921875, 3.53900146484375, 3.7333984375, 3.92779541015625, 4.1221923828125, 4.31658935546875, 4.510986328125, 4.70538330078125, 4.8997802734375, 5.09417724609375, 5.28857421875, 5.48297119140625, 5.6773681640625, 5.87176513671875, 6.066162109375, 6.26055908203125, 6.4549560546875, 6.64935302734375, 6.84375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 0.0, 7.0, 11.0, 18.0, 25.0, 38.0, 51.0, 86.0, 135.0, 196.0, 309.0, 501.0, 833.0, 1185.0, 1990.0, 3268.0, 5286.0, 8891.0, 15135.0, 26241.0, 45656.0, 81793.0, 152213.0, 279605.0, 191731.0, 100504.0, 55872.0, 31456.0, 18253.0, 10660.0, 6381.0, 3782.0, 2440.0, 1427.0, 925.0, 626.0, 355.0, 246.0, 144.0, 89.0, 63.0, 36.0, 27.0, 19.0, 11.0, 16.0, 13.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.970703125, -2.882476806640625, -2.79425048828125, -2.706024169921875, -2.6177978515625, -2.529571533203125, -2.44134521484375, -2.353118896484375, -2.264892578125, -2.176666259765625, -2.08843994140625, -2.000213623046875, -1.9119873046875, -1.823760986328125, -1.73553466796875, -1.647308349609375, -1.55908203125, -1.470855712890625, -1.38262939453125, -1.294403076171875, -1.2061767578125, -1.117950439453125, -1.02972412109375, -0.941497802734375, -0.853271484375, -0.765045166015625, -0.67681884765625, -0.588592529296875, -0.5003662109375, -0.412139892578125, -0.32391357421875, -0.235687255859375, -0.1474609375, -0.059234619140625, 0.02899169921875, 0.117218017578125, 0.2054443359375, 0.293670654296875, 0.38189697265625, 0.470123291015625, 0.558349609375, 0.646575927734375, 0.73480224609375, 0.823028564453125, 0.9112548828125, 0.999481201171875, 1.08770751953125, 1.175933837890625, 1.26416015625, 1.352386474609375, 1.44061279296875, 1.528839111328125, 1.6170654296875, 1.705291748046875, 1.79351806640625, 1.881744384765625, 1.969970703125, 2.058197021484375, 2.14642333984375, 2.234649658203125, 2.3228759765625, 2.411102294921875, 2.49932861328125, 2.587554931640625, 2.67578125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 14.0, 18.0, 7.0, 12.0, 18.0, 25.0, 11.0, 29.0, 25.0, 27.0, 32.0, 29.0, 39.0, 42.0, 43.0, 48.0, 41.0, 41.0, 38.0, 33.0, 29.0, 35.0, 45.0, 21.0, 43.0, 27.0, 23.0, 21.0, 26.0, 26.0, 17.0, 23.0, 15.0, 8.0, 18.0, 12.0, 2.0, 7.0, 6.0, 3.0, 5.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-4.40234375, -4.278411865234375, -4.15447998046875, -4.030548095703125, -3.9066162109375, -3.782684326171875, -3.65875244140625, -3.534820556640625, -3.410888671875, -3.286956787109375, -3.16302490234375, -3.039093017578125, -2.9151611328125, -2.791229248046875, -2.66729736328125, -2.543365478515625, -2.41943359375, -2.295501708984375, -2.17156982421875, -2.047637939453125, -1.9237060546875, -1.799774169921875, -1.67584228515625, -1.551910400390625, -1.427978515625, -1.304046630859375, -1.18011474609375, -1.056182861328125, -0.9322509765625, -0.808319091796875, -0.68438720703125, -0.560455322265625, -0.4365234375, -0.312591552734375, -0.18865966796875, -0.064727783203125, 0.0592041015625, 0.183135986328125, 0.30706787109375, 0.430999755859375, 0.554931640625, 0.678863525390625, 0.80279541015625, 0.926727294921875, 1.0506591796875, 1.174591064453125, 1.29852294921875, 1.422454833984375, 1.54638671875, 1.670318603515625, 1.79425048828125, 1.918182373046875, 2.0421142578125, 2.166046142578125, 2.28997802734375, 2.413909912109375, 2.537841796875, 2.661773681640625, 2.78570556640625, 2.909637451171875, 3.0335693359375, 3.157501220703125, 3.28143310546875, 3.405364990234375, 3.529296875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 7.0, 9.0, 13.0, 16.0, 27.0, 31.0, 72.0, 99.0, 154.0, 261.0, 414.0, 635.0, 1178.0, 2101.0, 3617.0, 6673.0, 13398.0, 29451.0, 75404.0, 283729.0, 449535.0, 107686.0, 38422.0, 17057.0, 8247.0, 4375.0, 2412.0, 1476.0, 802.0, 488.0, 275.0, 178.0, 96.0, 64.0, 57.0, 30.0, 25.0, 16.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.034149169921875, -0.03308725357055664, -0.03202533721923828, -0.030963420867919922, -0.029901504516601562, -0.028839588165283203, -0.027777671813964844, -0.026715755462646484, -0.025653839111328125, -0.024591922760009766, -0.023530006408691406, -0.022468090057373047, -0.021406173706054688, -0.020344257354736328, -0.01928234100341797, -0.01822042465209961, -0.01715850830078125, -0.01609659194946289, -0.015034675598144531, -0.013972759246826172, -0.012910842895507812, -0.011848926544189453, -0.010787010192871094, -0.009725093841552734, -0.008663177490234375, -0.007601261138916016, -0.006539344787597656, -0.005477428436279297, -0.0044155120849609375, -0.003353595733642578, -0.0022916793823242188, -0.0012297630310058594, -0.0001678466796875, 0.0008940696716308594, 0.0019559860229492188, 0.003017902374267578, 0.0040798187255859375, 0.005141735076904297, 0.006203651428222656, 0.007265567779541016, 0.008327484130859375, 0.009389400482177734, 0.010451316833496094, 0.011513233184814453, 0.012575149536132812, 0.013637065887451172, 0.014698982238769531, 0.01576089859008789, 0.01682281494140625, 0.01788473129272461, 0.01894664764404297, 0.020008563995361328, 0.021070480346679688, 0.022132396697998047, 0.023194313049316406, 0.024256229400634766, 0.025318145751953125, 0.026380062103271484, 0.027441978454589844, 0.028503894805908203, 0.029565811157226562, 0.030627727508544922, 0.03168964385986328, 0.03275156021118164, 0.0338134765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 8.0, 8.0, 16.0, 18.0, 20.0, 34.0, 28.0, 46.0, 45.0, 62.0, 82.0, 87.0, 89.0, 105.0, 87.0, 47.0, 50.0, 36.0, 37.0, 23.0, 10.0, 13.0, 6.0, 8.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881092071533203e-06, -8.5439532995224e-06, -8.206814527511597e-06, -7.869675755500793e-06, -7.53253698348999e-06, -7.195398211479187e-06, -6.858259439468384e-06, -6.5211206674575806e-06, -6.183981895446777e-06, -5.846843123435974e-06, -5.509704351425171e-06, -5.172565579414368e-06, -4.8354268074035645e-06, -4.498288035392761e-06, -4.161149263381958e-06, -3.824010491371155e-06, -3.4868717193603516e-06, -3.1497329473495483e-06, -2.812594175338745e-06, -2.475455403327942e-06, -2.1383166313171387e-06, -1.8011778593063354e-06, -1.4640390872955322e-06, -1.126900315284729e-06, -7.897615432739258e-07, -4.5262277126312256e-07, -1.1548399925231934e-07, 2.2165477275848389e-07, 5.587935447692871e-07, 8.959323167800903e-07, 1.2330710887908936e-06, 1.5702098608016968e-06, 1.9073486328125e-06, 2.2444874048233032e-06, 2.5816261768341064e-06, 2.9187649488449097e-06, 3.255903720855713e-06, 3.593042492866516e-06, 3.930181264877319e-06, 4.2673200368881226e-06, 4.604458808898926e-06, 4.941597580909729e-06, 5.278736352920532e-06, 5.6158751249313354e-06, 5.953013896942139e-06, 6.290152668952942e-06, 6.627291440963745e-06, 6.964430212974548e-06, 7.3015689849853516e-06, 7.638707756996155e-06, 7.975846529006958e-06, 8.312985301017761e-06, 8.650124073028564e-06, 8.987262845039368e-06, 9.324401617050171e-06, 9.661540389060974e-06, 9.998679161071777e-06, 1.033581793308258e-05, 1.0672956705093384e-05, 1.1010095477104187e-05, 1.134723424911499e-05, 1.1684373021125793e-05, 1.2021511793136597e-05, 1.23586505651474e-05, 1.2695789337158203e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 13.0, 14.0, 19.0, 25.0, 38.0, 62.0, 89.0, 141.0, 173.0, 244.0, 420.0, 644.0, 872.0, 1342.0, 1981.0, 3111.0, 5008.0, 8302.0, 14155.0, 25080.0, 48732.0, 106494.0, 289855.0, 311575.0, 114157.0, 51934.0, 26409.0, 14586.0, 8401.0, 5196.0, 3262.0, 2060.0, 1334.0, 922.0, 580.0, 397.0, 289.0, 192.0, 134.0, 99.0, 51.0, 55.0, 30.0, 32.0, 15.0, 9.0, 3.0, 5.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0233612060546875, -0.022608518600463867, -0.021855831146240234, -0.0211031436920166, -0.02035045623779297, -0.019597768783569336, -0.018845081329345703, -0.01809239387512207, -0.017339706420898438, -0.016587018966674805, -0.015834331512451172, -0.015081644058227539, -0.014328956604003906, -0.013576269149780273, -0.01282358169555664, -0.012070894241333008, -0.011318206787109375, -0.010565519332885742, -0.00981283187866211, -0.009060144424438477, -0.008307456970214844, -0.007554769515991211, -0.006802082061767578, -0.006049394607543945, -0.0052967071533203125, -0.00454401969909668, -0.003791332244873047, -0.003038644790649414, -0.0022859573364257812, -0.0015332698822021484, -0.0007805824279785156, -2.7894973754882812e-05, 0.00072479248046875, 0.0014774799346923828, 0.0022301673889160156, 0.0029828548431396484, 0.0037355422973632812, 0.004488229751586914, 0.005240917205810547, 0.00599360466003418, 0.0067462921142578125, 0.007498979568481445, 0.008251667022705078, 0.009004354476928711, 0.009757041931152344, 0.010509729385375977, 0.01126241683959961, 0.012015104293823242, 0.012767791748046875, 0.013520479202270508, 0.01427316665649414, 0.015025854110717773, 0.015778541564941406, 0.01653122901916504, 0.017283916473388672, 0.018036603927612305, 0.018789291381835938, 0.01954197883605957, 0.020294666290283203, 0.021047353744506836, 0.02180004119873047, 0.0225527286529541, 0.023305416107177734, 0.024058103561401367, 0.024810791015625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 8.0, 6.0, 7.0, 10.0, 3.0, 10.0, 6.0, 13.0, 16.0, 24.0, 19.0, 25.0, 26.0, 39.0, 47.0, 46.0, 50.0, 74.0, 87.0, 88.0, 55.0, 49.0, 48.0, 40.0, 36.0, 23.0, 28.0, 16.0, 20.0, 12.0, 18.0, 6.0, 11.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008056640625, -0.00780332088470459, -0.00755000114440918, -0.0072966814041137695, -0.007043361663818359, -0.006790041923522949, -0.006536722183227539, -0.006283402442932129, -0.006030082702636719, -0.005776762962341309, -0.0055234432220458984, -0.005270123481750488, -0.005016803741455078, -0.004763484001159668, -0.004510164260864258, -0.004256844520568848, -0.0040035247802734375, -0.0037502050399780273, -0.003496885299682617, -0.003243565559387207, -0.002990245819091797, -0.0027369260787963867, -0.0024836063385009766, -0.0022302865982055664, -0.0019769668579101562, -0.001723647117614746, -0.001470327377319336, -0.0012170076370239258, -0.0009636878967285156, -0.0007103681564331055, -0.0004570484161376953, -0.00020372867584228516, 4.9591064453125e-05, 0.00030291080474853516, 0.0005562305450439453, 0.0008095502853393555, 0.0010628700256347656, 0.0013161897659301758, 0.001569509506225586, 0.001822829246520996, 0.0020761489868164062, 0.0023294687271118164, 0.0025827884674072266, 0.0028361082077026367, 0.003089427947998047, 0.003342747688293457, 0.003596067428588867, 0.0038493871688842773, 0.0041027069091796875, 0.004356026649475098, 0.004609346389770508, 0.004862666130065918, 0.005115985870361328, 0.005369305610656738, 0.0056226253509521484, 0.005875945091247559, 0.006129264831542969, 0.006382584571838379, 0.006635904312133789, 0.006889224052429199, 0.007142543792724609, 0.0073958635330200195, 0.00764918327331543, 0.00790250301361084, 0.00815582275390625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 10.0, 9.0, 9.0, 11.0, 17.0, 20.0, 22.0, 34.0, 34.0, 55.0, 45.0, 69.0, 87.0, 74.0, 86.0, 80.0, 59.0, 50.0, 44.0, 33.0, 28.0, 21.0, 21.0, 13.0, 11.0, 7.0, 8.0, 8.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.92464017868042, -6.695237159729004, -6.46583366394043, -6.236430644989014, -6.007027626037598, -5.777624130249023, -5.548221111297607, -5.318818092346191, -5.089414596557617, -4.860011577606201, -4.630608081817627, -4.401205062866211, -4.171802043914795, -3.9423985481262207, -3.7129955291748047, -3.4835922718048096, -3.2541892528533936, -3.0247859954833984, -2.7953829765319824, -2.5659797191619873, -2.336576461791992, -2.107173442840576, -1.877770185470581, -1.648366928100586, -1.4189637899398804, -1.1895606517791748, -0.9601573944091797, -0.7307542562484741, -0.5013510584831238, -0.27194786071777344, -0.04254472255706787, 0.18685853481292725, 0.4162616729736328, 0.6456648707389832, 0.8750680685043335, 1.104471206665039, 1.3338744640350342, 1.5632776021957397, 1.7926807403564453, 2.0220839977264404, 2.2514872550964355, 2.4808905124664307, 2.7102935314178467, 2.939696788787842, 3.169100046157837, 3.398503303527832, 3.627906322479248, 3.857309579849243, 4.086712837219238, 4.316115856170654, 4.5455193519592285, 4.7749223709106445, 5.0043253898620605, 5.233728885650635, 5.463131904602051, 5.692535400390625, 5.921937942504883, 6.151340961456299, 6.380744457244873, 6.610147476196289, 6.839550495147705, 7.068953990936279, 7.298357009887695, 7.5277605056762695, 7.7571635246276855]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 4.0, 9.0, 0.0, 1.0, 5.0, 6.0, 6.0, 8.0, 2.0, 11.0, 11.0, 14.0, 17.0, 16.0, 16.0, 22.0, 21.0, 22.0, 35.0, 35.0, 44.0, 37.0, 37.0, 41.0, 41.0, 30.0, 40.0, 26.0, 47.0, 45.0, 43.0, 39.0, 28.0, 34.0, 30.0, 29.0, 29.0, 11.0, 23.0, 14.0, 11.0, 18.0, 15.0, 9.0, 10.0, 3.0, 5.0, 8.0, 5.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2548418045043945, -5.063096046447754, -4.871350288391113, -4.679604530334473, -4.487858772277832, -4.296113014221191, -4.104367256164551, -3.912621021270752, -3.7208752632141113, -3.5291295051574707, -3.33738374710083, -3.1456379890441895, -2.9538919925689697, -2.762146234512329, -2.5704004764556885, -2.3786544799804688, -2.1869089603424072, -1.9951632022857666, -1.8034173250198364, -1.6116715669631958, -1.4199256896972656, -1.228179931640625, -1.0364341735839844, -0.8446882963180542, -0.6529425382614136, -0.4611967206001282, -0.26945093274116516, -0.07770514488220215, 0.11404067277908325, 0.30578649044036865, 0.4975322484970093, 0.6892781257629395, 0.8810238838195801, 1.0727696418762207, 1.2645155191421509, 1.4562612771987915, 1.6480071544647217, 1.8397529125213623, 2.031498670578003, 2.2232446670532227, 2.4149904251098633, 2.606736183166504, 2.7984819412231445, 2.990227699279785, 3.181973695755005, 3.3737194538116455, 3.565465211868286, 3.757211208343506, 3.9489567279815674, 4.140702724456787, 4.332448482513428, 4.524194240570068, 4.715939998626709, 4.90768575668335, 5.09943151473999, 5.291177272796631, 5.4829230308532715, 5.674668788909912, 5.866414546966553, 6.058160305023193, 6.249906063079834, 6.441652297973633, 6.633398056030273, 6.825143814086914, 7.016889572143555]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 14.0, 15.0, 19.0, 35.0, 62.0, 80.0, 132.0, 232.0, 325.0, 488.0, 753.0, 1231.0, 1871.0, 2832.0, 4588.0, 6907.0, 10947.0, 17084.0, 28219.0, 48205.0, 88162.0, 165086.0, 246738.0, 186580.0, 99617.0, 54544.0, 31284.0, 18949.0, 12023.0, 7704.0, 4853.0, 3202.0, 2092.0, 1328.0, 802.0, 528.0, 346.0, 236.0, 138.0, 106.0, 74.0, 38.0, 28.0, 18.0, 12.0, 8.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-11.546875, -11.2032470703125, -10.859619140625, -10.5159912109375, -10.17236328125, -9.8287353515625, -9.485107421875, -9.1414794921875, -8.7978515625, -8.4542236328125, -8.110595703125, -7.7669677734375, -7.42333984375, -7.0797119140625, -6.736083984375, -6.3924560546875, -6.048828125, -5.7052001953125, -5.361572265625, -5.0179443359375, -4.67431640625, -4.3306884765625, -3.987060546875, -3.6434326171875, -3.2998046875, -2.9561767578125, -2.612548828125, -2.2689208984375, -1.92529296875, -1.5816650390625, -1.238037109375, -0.8944091796875, -0.55078125, -0.2071533203125, 0.136474609375, 0.4801025390625, 0.82373046875, 1.1673583984375, 1.510986328125, 1.8546142578125, 2.1982421875, 2.5418701171875, 2.885498046875, 3.2291259765625, 3.57275390625, 3.9163818359375, 4.260009765625, 4.6036376953125, 4.947265625, 5.2908935546875, 5.634521484375, 5.9781494140625, 6.32177734375, 6.6654052734375, 7.009033203125, 7.3526611328125, 7.6962890625, 8.0399169921875, 8.383544921875, 8.7271728515625, 9.07080078125, 9.4144287109375, 9.758056640625, 10.1016845703125, 10.4453125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 0.0, 4.0, 12.0, 12.0, 9.0, 8.0, 19.0, 19.0, 22.0, 15.0, 16.0, 21.0, 28.0, 43.0, 45.0, 42.0, 38.0, 38.0, 56.0, 37.0, 40.0, 50.0, 37.0, 40.0, 41.0, 39.0, 37.0, 35.0, 27.0, 25.0, 21.0, 17.0, 22.0, 12.0, 22.0, 14.0, 8.0, 9.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -4.9832763671875, -4.794677734375, -4.6060791015625, -4.41748046875, -4.2288818359375, -4.040283203125, -3.8516845703125, -3.6630859375, -3.4744873046875, -3.285888671875, -3.0972900390625, -2.90869140625, -2.7200927734375, -2.531494140625, -2.3428955078125, -2.154296875, -1.9656982421875, -1.777099609375, -1.5885009765625, -1.39990234375, -1.2113037109375, -1.022705078125, -0.8341064453125, -0.6455078125, -0.4569091796875, -0.268310546875, -0.0797119140625, 0.10888671875, 0.2974853515625, 0.486083984375, 0.6746826171875, 0.86328125, 1.0518798828125, 1.240478515625, 1.4290771484375, 1.61767578125, 1.8062744140625, 1.994873046875, 2.1834716796875, 2.3720703125, 2.5606689453125, 2.749267578125, 2.9378662109375, 3.12646484375, 3.3150634765625, 3.503662109375, 3.6922607421875, 3.880859375, 4.0694580078125, 4.258056640625, 4.4466552734375, 4.63525390625, 4.8238525390625, 5.012451171875, 5.2010498046875, 5.3896484375, 5.5782470703125, 5.766845703125, 5.9554443359375, 6.14404296875, 6.3326416015625, 6.521240234375, 6.7098388671875, 6.8984375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 8.0, 15.0, 12.0, 17.0, 34.0, 37.0, 70.0, 99.0, 150.0, 189.0, 322.0, 523.0, 778.0, 1132.0, 1751.0, 2737.0, 4309.0, 6786.0, 10414.0, 16648.0, 27038.0, 44885.0, 78550.0, 142293.0, 238581.0, 201314.0, 110740.0, 62517.0, 36662.0, 21870.0, 13732.0, 8634.0, 5433.0, 3572.0, 2325.0, 1522.0, 970.0, 617.0, 425.0, 284.0, 194.0, 137.0, 65.0, 48.0, 39.0, 27.0, 22.0, 12.0, 8.0, 8.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.453125, -11.1038818359375, -10.754638671875, -10.4053955078125, -10.05615234375, -9.7069091796875, -9.357666015625, -9.0084228515625, -8.6591796875, -8.3099365234375, -7.960693359375, -7.6114501953125, -7.26220703125, -6.9129638671875, -6.563720703125, -6.2144775390625, -5.865234375, -5.5159912109375, -5.166748046875, -4.8175048828125, -4.46826171875, -4.1190185546875, -3.769775390625, -3.4205322265625, -3.0712890625, -2.7220458984375, -2.372802734375, -2.0235595703125, -1.67431640625, -1.3250732421875, -0.975830078125, -0.6265869140625, -0.27734375, 0.0718994140625, 0.421142578125, 0.7703857421875, 1.11962890625, 1.4688720703125, 1.818115234375, 2.1673583984375, 2.5166015625, 2.8658447265625, 3.215087890625, 3.5643310546875, 3.91357421875, 4.2628173828125, 4.612060546875, 4.9613037109375, 5.310546875, 5.6597900390625, 6.009033203125, 6.3582763671875, 6.70751953125, 7.0567626953125, 7.406005859375, 7.7552490234375, 8.1044921875, 8.4537353515625, 8.802978515625, 9.1522216796875, 9.50146484375, 9.8507080078125, 10.199951171875, 10.5491943359375, 10.8984375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 1.0, 2.0, 9.0, 6.0, 8.0, 9.0, 15.0, 17.0, 16.0, 17.0, 22.0, 14.0, 16.0, 22.0, 22.0, 29.0, 34.0, 42.0, 49.0, 40.0, 37.0, 39.0, 42.0, 31.0, 36.0, 50.0, 31.0, 33.0, 40.0, 37.0, 18.0, 24.0, 33.0, 26.0, 18.0, 21.0, 22.0, 7.0, 13.0, 14.0, 11.0, 11.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.56640625, -3.453125, -3.33984375, -3.2265625, -3.11328125, -3.0, -2.88671875, -2.7734375, -2.66015625, -2.546875, -2.43359375, -2.3203125, -2.20703125, -2.09375, -1.98046875, -1.8671875, -1.75390625, -1.640625, -1.52734375, -1.4140625, -1.30078125, -1.1875, -1.07421875, -0.9609375, -0.84765625, -0.734375, -0.62109375, -0.5078125, -0.39453125, -0.28125, -0.16796875, -0.0546875, 0.05859375, 0.171875, 0.28515625, 0.3984375, 0.51171875, 0.625, 0.73828125, 0.8515625, 0.96484375, 1.078125, 1.19140625, 1.3046875, 1.41796875, 1.53125, 1.64453125, 1.7578125, 1.87109375, 1.984375, 2.09765625, 2.2109375, 2.32421875, 2.4375, 2.55078125, 2.6640625, 2.77734375, 2.890625, 3.00390625, 3.1171875, 3.23046875, 3.34375, 3.45703125, 3.5703125, 3.68359375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 10.0, 15.0, 22.0, 27.0, 38.0, 49.0, 72.0, 94.0, 140.0, 201.0, 238.0, 360.0, 503.0, 674.0, 935.0, 1342.0, 1989.0, 2921.0, 4280.0, 6214.0, 10159.0, 16566.0, 29027.0, 54198.0, 117819.0, 304417.0, 271581.0, 104577.0, 49369.0, 26522.0, 15583.0, 9663.0, 6044.0, 3973.0, 2638.0, 1807.0, 1214.0, 887.0, 656.0, 470.0, 346.0, 236.0, 187.0, 137.0, 115.0, 68.0, 49.0, 42.0, 25.0, 14.0, 19.0, 7.0, 5.0, 8.0, 4.0, 1.0, 2.0], "bins": [-1.9521484375, -1.8928680419921875, -1.833587646484375, -1.7743072509765625, -1.71502685546875, -1.6557464599609375, -1.596466064453125, -1.5371856689453125, -1.4779052734375, -1.4186248779296875, -1.359344482421875, -1.3000640869140625, -1.24078369140625, -1.1815032958984375, -1.122222900390625, -1.0629425048828125, -1.003662109375, -0.9443817138671875, -0.885101318359375, -0.8258209228515625, -0.76654052734375, -0.7072601318359375, -0.647979736328125, -0.5886993408203125, -0.5294189453125, -0.4701385498046875, -0.410858154296875, -0.3515777587890625, -0.29229736328125, -0.2330169677734375, -0.173736572265625, -0.1144561767578125, -0.05517578125, 0.0041046142578125, 0.063385009765625, 0.1226654052734375, 0.18194580078125, 0.2412261962890625, 0.300506591796875, 0.3597869873046875, 0.4190673828125, 0.4783477783203125, 0.537628173828125, 0.5969085693359375, 0.65618896484375, 0.7154693603515625, 0.774749755859375, 0.8340301513671875, 0.893310546875, 0.9525909423828125, 1.011871337890625, 1.0711517333984375, 1.13043212890625, 1.1897125244140625, 1.248992919921875, 1.3082733154296875, 1.3675537109375, 1.4268341064453125, 1.486114501953125, 1.5453948974609375, 1.60467529296875, 1.6639556884765625, 1.723236083984375, 1.7825164794921875, 1.841796875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 3.0, 10.0, 6.0, 17.0, 18.0, 24.0, 31.0, 43.0, 62.0, 75.0, 115.0, 124.0, 137.0, 69.0, 69.0, 59.0, 37.0, 21.0, 20.0, 17.0, 7.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017702579498291016, -0.0001714322715997696, -0.00016583874821662903, -0.00016024522483348846, -0.0001546517014503479, -0.00014905817806720734, -0.00014346465468406677, -0.0001378711313009262, -0.00013227760791778564, -0.00012668408453464508, -0.00012109056115150452, -0.00011549703776836395, -0.00010990351438522339, -0.00010430999100208282, -9.871646761894226e-05, -9.31229442358017e-05, -8.752942085266113e-05, -8.193589746952057e-05, -7.634237408638e-05, -7.074885070323944e-05, -6.515532732009888e-05, -5.956180393695831e-05, -5.396828055381775e-05, -4.8374757170677185e-05, -4.278123378753662e-05, -3.718771040439606e-05, -3.159418702125549e-05, -2.600066363811493e-05, -2.0407140254974365e-05, -1.4813616871833801e-05, -9.220093488693237e-06, -3.6265701055526733e-06, 1.9669532775878906e-06, 7.560476660728455e-06, 1.3154000043869019e-05, 1.8747523427009583e-05, 2.4341046810150146e-05, 2.993457019329071e-05, 3.5528093576431274e-05, 4.112161695957184e-05, 4.67151403427124e-05, 5.2308663725852966e-05, 5.790218710899353e-05, 6.34957104921341e-05, 6.908923387527466e-05, 7.468275725841522e-05, 8.027628064155579e-05, 8.586980402469635e-05, 9.146332740783691e-05, 9.705685079097748e-05, 0.00010265037417411804, 0.0001082438975572586, 0.00011383742094039917, 0.00011943094432353973, 0.0001250244677066803, 0.00013061799108982086, 0.00013621151447296143, 0.000141805037856102, 0.00014739856123924255, 0.00015299208462238312, 0.00015858560800552368, 0.00016417913138866425, 0.0001697726547718048, 0.00017536617815494537, 0.00018095970153808594]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 5.0, 4.0, 3.0, 5.0, 17.0, 14.0, 15.0, 23.0, 39.0, 42.0, 50.0, 85.0, 119.0, 150.0, 226.0, 320.0, 461.0, 695.0, 1025.0, 1541.0, 2337.0, 3693.0, 5952.0, 10172.0, 18253.0, 35161.0, 78946.0, 240445.0, 402281.0, 134117.0, 52138.0, 25131.0, 13447.0, 7969.0, 4714.0, 3097.0, 1928.0, 1290.0, 916.0, 574.0, 351.0, 248.0, 146.0, 129.0, 83.0, 63.0, 38.0, 26.0, 23.0, 18.0, 8.0, 10.0, 11.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.220703125, -2.149658203125, -2.07861328125, -2.007568359375, -1.9365234375, -1.865478515625, -1.79443359375, -1.723388671875, -1.65234375, -1.581298828125, -1.51025390625, -1.439208984375, -1.3681640625, -1.297119140625, -1.22607421875, -1.155029296875, -1.083984375, -1.012939453125, -0.94189453125, -0.870849609375, -0.7998046875, -0.728759765625, -0.65771484375, -0.586669921875, -0.515625, -0.444580078125, -0.37353515625, -0.302490234375, -0.2314453125, -0.160400390625, -0.08935546875, -0.018310546875, 0.052734375, 0.123779296875, 0.19482421875, 0.265869140625, 0.3369140625, 0.407958984375, 0.47900390625, 0.550048828125, 0.62109375, 0.692138671875, 0.76318359375, 0.834228515625, 0.9052734375, 0.976318359375, 1.04736328125, 1.118408203125, 1.189453125, 1.260498046875, 1.33154296875, 1.402587890625, 1.4736328125, 1.544677734375, 1.61572265625, 1.686767578125, 1.7578125, 1.828857421875, 1.89990234375, 1.970947265625, 2.0419921875, 2.113037109375, 2.18408203125, 2.255126953125, 2.326171875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 8.0, 8.0, 6.0, 10.0, 14.0, 13.0, 15.0, 10.0, 17.0, 24.0, 33.0, 33.0, 53.0, 54.0, 54.0, 77.0, 89.0, 76.0, 70.0, 63.0, 36.0, 36.0, 40.0, 28.0, 16.0, 14.0, 16.0, 14.0, 13.0, 7.0, 9.0, 7.0, 7.0, 11.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54833984375, -0.5283737182617188, -0.5084075927734375, -0.48844146728515625, -0.468475341796875, -0.44850921630859375, -0.4285430908203125, -0.40857696533203125, -0.38861083984375, -0.36864471435546875, -0.3486785888671875, -0.32871246337890625, -0.308746337890625, -0.28878021240234375, -0.2688140869140625, -0.24884796142578125, -0.2288818359375, -0.20891571044921875, -0.1889495849609375, -0.16898345947265625, -0.149017333984375, -0.12905120849609375, -0.1090850830078125, -0.08911895751953125, -0.06915283203125, -0.04918670654296875, -0.0292205810546875, -0.00925445556640625, 0.010711669921875, 0.03067779541015625, 0.0506439208984375, 0.07061004638671875, 0.090576171875, 0.11054229736328125, 0.1305084228515625, 0.15047454833984375, 0.170440673828125, 0.19040679931640625, 0.2103729248046875, 0.23033905029296875, 0.25030517578125, 0.27027130126953125, 0.2902374267578125, 0.31020355224609375, 0.330169677734375, 0.35013580322265625, 0.3701019287109375, 0.39006805419921875, 0.4100341796875, 0.43000030517578125, 0.4499664306640625, 0.46993255615234375, 0.489898681640625, 0.5098648071289062, 0.5298309326171875, 0.5497970581054688, 0.56976318359375, 0.5897293090820312, 0.6096954345703125, 0.6296615600585938, 0.649627685546875, 0.6695938110351562, 0.6895599365234375, 0.7095260620117188, 0.7294921875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 9.0, 4.0, 13.0, 8.0, 18.0, 20.0, 23.0, 26.0, 29.0, 51.0, 69.0, 50.0, 70.0, 81.0, 81.0, 77.0, 56.0, 62.0, 50.0, 32.0, 29.0, 22.0, 19.0, 14.0, 10.0, 14.0, 5.0, 7.0, 8.0, 7.0, 5.0, 2.0, 3.0, 1.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.106236934661865, -5.873978137969971, -5.641719818115234, -5.40946102142334, -5.177202224731445, -4.944943904876709, -4.7126851081848145, -4.480426788330078, -4.248167991638184, -4.015909194946289, -3.7836508750915527, -3.551392078399658, -3.3191335201263428, -3.0868749618530273, -2.854616165161133, -2.6223576068878174, -2.390099048614502, -2.1578404903411865, -1.9255818128585815, -1.6933231353759766, -1.4610645771026611, -1.2288060188293457, -0.9965473413467407, -0.7642886638641357, -0.5320301055908203, -0.2997714877128601, -0.0675128698348999, 0.1647457480430603, 0.3970043659210205, 0.6292629241943359, 0.8615216016769409, 1.093780279159546, 1.3260393142700195, 1.558297872543335, 1.79055655002594, 2.022815227508545, 2.2550737857818604, 2.487332344055176, 2.7195911407470703, 2.9518496990203857, 3.184108257293701, 3.4163668155670166, 3.648625373840332, 3.8808841705322266, 4.113142967224121, 4.345401287078857, 4.577660083770752, 4.809918403625488, 5.042177200317383, 5.274435997009277, 5.506694316864014, 5.738953113555908, 5.9712114334106445, 6.203470230102539, 6.435729026794434, 6.667987823486328, 6.9002461433410645, 7.132504940032959, 7.364763259887695, 7.59702205657959, 7.829280853271484, 8.061538696289062, 8.293797492980957, 8.526056289672852, 8.758315086364746]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 14.0, 14.0, 18.0, 23.0, 31.0, 29.0, 26.0, 29.0, 41.0, 29.0, 49.0, 37.0, 56.0, 53.0, 53.0, 44.0, 38.0, 45.0, 40.0, 40.0, 33.0, 38.0, 28.0, 28.0, 22.0, 26.0, 17.0, 21.0, 12.0, 10.0, 8.0, 6.0, 9.0, 7.0, 6.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.909386157989502, -6.6782732009887695, -6.447160720825195, -6.216047763824463, -5.984935283660889, -5.753822326660156, -5.522709846496582, -5.29159688949585, -5.060483932495117, -4.829370975494385, -4.5982584953308105, -4.367145538330078, -4.136033058166504, -3.9049201011657715, -3.673807382583618, -3.442694664001465, -3.2115821838378906, -2.9804694652557373, -2.749356746673584, -2.5182437896728516, -2.2871313095092773, -2.056018352508545, -1.8249056339263916, -1.5937929153442383, -1.362680196762085, -1.1315674781799316, -0.9004546999931335, -0.6693419218063354, -0.43822920322418213, -0.2071164846420288, 0.023996353149414062, 0.2551090717315674, 0.4862217903137207, 0.717334508895874, 0.9484472870826721, 1.1795600652694702, 1.4106727838516235, 1.6417855024337769, 1.8728983402252197, 2.104011058807373, 2.3351237773895264, 2.5662364959716797, 2.797349214553833, 3.0284619331359863, 3.2595748901367188, 3.490687370300293, 3.7218003273010254, 3.9529130458831787, 4.184025764465332, 4.4151387214660645, 4.646251201629639, 4.877364158630371, 5.108476638793945, 5.339589595794678, 5.57070255279541, 5.801815032958984, 6.032927513122559, 6.264040470123291, 6.495152950286865, 6.726265907287598, 6.957378387451172, 7.188491344451904, 7.419604301452637, 7.650716781616211, 7.881829738616943]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 14.0, 13.0, 16.0, 20.0, 21.0, 27.0, 28.0, 40.0, 49.0, 55.0, 56.0, 76.0, 81.0, 96.0, 135.0, 193.0, 449.0, 3698.0, 517620.0, 588.0, 211.0, 139.0, 97.0, 86.0, 68.0, 64.0, 57.0, 41.0, 46.0, 28.0, 33.0, 20.0, 22.0, 15.0, 13.0, 15.0, 10.0, 5.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-148.86351013183594, -144.73992919921875, -140.61634826660156, -136.49276733398438, -132.3691864013672, -128.24560546875, -124.12201690673828, -119.9984359741211, -115.8748550415039, -111.75127410888672, -107.62769317626953, -103.50411224365234, -99.38052368164062, -95.25694274902344, -91.13336181640625, -87.00978088378906, -82.88619995117188, -78.76261901855469, -74.6390380859375, -70.51545715332031, -66.39187622070312, -62.26829147338867, -58.14470672607422, -54.02112579345703, -49.897544860839844, -45.773963928222656, -41.65038299560547, -37.526798248291016, -33.40321731567383, -29.27963638305664, -25.15605354309082, -21.032470703125, -16.90888214111328, -12.785300254821777, -8.661718368530273, -4.5381364822387695, -0.4145545959472656, 3.709026336669922, 7.832609176635742, 11.956192016601562, 16.07977294921875, 20.203353881835938, 24.326936721801758, 28.450519561767578, 32.574100494384766, 36.69768142700195, 40.821266174316406, 44.944847106933594, 49.06842803955078, 53.19200897216797, 57.315589904785156, 61.43917465209961, 65.56275939941406, 69.68634033203125, 73.80992126464844, 77.93350219726562, 82.05708312988281, 86.1806640625, 90.30424499511719, 94.42782592773438, 98.55140686035156, 102.67498779296875, 106.79857635498047, 110.92215728759766, 115.04573822021484]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 6.0, 7.0, 6.0, 15.0, 12.0, 21.0, 22.0, 30.0, 28.0, 30.0, 29.0, 37.0, 32.0, 46.0, 34.0, 62.0, 51.0, 1073.0, 49.0, 40.0, 44.0, 42.0, 33.0, 39.0, 35.0, 30.0, 27.0, 23.0, 26.0, 16.0, 22.0, 12.0, 9.0, 7.0, 7.0, 9.0, 7.0, 7.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-197.80368041992188, -191.18812561035156, -184.57257080078125, -177.95701599121094, -171.34146118164062, -164.7259063720703, -158.1103515625, -151.4947967529297, -144.87924194335938, -138.26368713378906, -131.64813232421875, -125.03257751464844, -118.41702270507812, -111.80146789550781, -105.1859130859375, -98.57035827636719, -91.95479583740234, -85.33924102783203, -78.72368621826172, -72.1081314086914, -65.4925765991211, -58.877017974853516, -52.2614631652832, -45.64590835571289, -39.03035354614258, -32.414798736572266, -25.799243927001953, -19.183687210083008, -12.568132400512695, -5.95257568359375, 0.6629791259765625, 7.278533935546875, 13.894088745117188, 20.5096435546875, 27.125198364257812, 33.740753173828125, 40.35630798339844, 46.971866607666016, 53.58742141723633, 60.20297622680664, 66.81852722167969, 73.43408203125, 80.04963684082031, 86.66519165039062, 93.28074645996094, 99.89630126953125, 106.51185607910156, 113.12741088867188, 119.74297332763672, 126.35852813720703, 132.97409057617188, 139.5896453857422, 146.2052001953125, 152.8207550048828, 159.43630981445312, 166.05186462402344, 172.66741943359375, 179.28297424316406, 185.89852905273438, 192.5140838623047, 199.129638671875, 205.7451934814453, 212.36074829101562, 218.97630310058594, 225.59185791015625]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 6.0, 4.0, 8.0, 3.0, 8.0, 11.0, 16.0, 22.0, 22.0, 30.0, 45.0, 73.0, 79.0, 89.0, 94.0, 161.0, 197.0, 255.0, 305.0, 364.0, 403.0, 481.0, 461.0, 574.0, 663.0, 671.0, 778.0, 807.0, 866.0, 1186.0, 1290.0, 1285.0, 1612.0, 2355.0, 5242.0, 52713.0, 31145534.0, 11244.0, 3827.0, 2433.0, 2275.0, 2518.0, 3403.0, 7270.0, 1126.0, 310.0, 716.0, 408.0, 177.0, 28.0, 24.0, 10.0, 14.0, 9.0, 9.0, 0.0, 1.0, 5.0, 3.0], "bins": [-3884.83935546875, -3790.58349609375, -3696.327392578125, -3602.071533203125, -3507.815673828125, -3413.5595703125, -3319.3037109375, -3225.0478515625, -3130.7919921875, -3036.5361328125, -2942.280029296875, -2848.024169921875, -2753.768310546875, -2659.51220703125, -2565.25634765625, -2471.00048828125, -2376.744384765625, -2282.488525390625, -2188.232421875, -2093.9765625, -1999.720703125, -1905.4647216796875, -1811.208740234375, -1716.952880859375, -1622.6968994140625, -1528.44091796875, -1434.18505859375, -1339.9290771484375, -1245.673095703125, -1151.417236328125, -1057.1612548828125, -962.9053344726562, -868.6494140625, -774.3934936523438, -680.1375732421875, -585.881591796875, -491.62567138671875, -397.3697509765625, -303.11376953125, -208.85784912109375, -114.6019287109375, -20.345993041992188, 73.90994262695312, 168.1658935546875, 262.42181396484375, 356.677734375, 450.9337158203125, 545.1896362304688, 639.445556640625, 733.7014770507812, 827.9573974609375, 922.21337890625, 1016.4692993164062, 1110.7252197265625, 1204.981201171875, 1299.237060546875, 1393.4930419921875, 1487.7490234375, 1582.0048828125, 1676.2608642578125, 1770.516845703125, 1864.772705078125, 1959.0286865234375, 2053.28466796875, 2147.54052734375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 1.0, 3.0, 8.0, 8.0, 16.0, 24.0, 23.0, 46.0, 71.0, 122.0, 188.0, 271.0, 408.0, 562.0, 942.0, 1448.0, 2359.0, 3558.0, 5683.0, 8785.0, 14223.0, 23838.0, 40214.0, 73748.0, 140398.0, 297576.0, 894699.0, 3638891.0, 625214.0, 244173.0, 119035.0, 63715.0, 36199.0, 21299.0, 12726.0, 7839.0, 4807.0, 2931.0, 1860.0, 1195.0, 791.0, 508.0, 313.0, 229.0, 155.0, 100.0, 81.0, 56.0, 31.0, 23.0, 14.0, 11.0, 6.0, 3.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-27.046875, -26.15625, -25.265625, -24.375, -23.484375, -22.59375, -21.703125, -20.8125, -19.921875, -19.03125, -18.140625, -17.25, -16.359375, -15.46875, -14.578125, -13.6875, -12.796875, -11.90625, -11.015625, -10.125, -9.234375, -8.34375, -7.453125, -6.5625, -5.671875, -4.78125, -3.890625, -3.0, -2.109375, -1.21875, -0.328125, 0.5625, 1.453125, 2.34375, 3.234375, 4.125, 5.015625, 5.90625, 6.796875, 7.6875, 8.578125, 9.46875, 10.359375, 11.25, 12.140625, 13.03125, 13.921875, 14.8125, 15.703125, 16.59375, 17.484375, 18.375, 19.265625, 20.15625, 21.046875, 21.9375, 22.828125, 23.71875, 24.609375, 25.5, 26.390625, 27.28125, 28.171875, 29.0625, 29.953125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 10.0, 5.0, 2.0, 8.0, 15.0, 7.0, 10.0, 15.0, 23.0, 16.0, 27.0, 33.0, 37.0, 42.0, 43.0, 61.0, 84.0, 94.0, 175.0, 433.0, 309.0, 149.0, 80.0, 53.0, 47.0, 32.0, 36.0, 23.0, 34.0, 16.0, 25.0, 11.0, 20.0, 7.0, 10.0, 9.0, 7.0, 5.0, 10.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.90625, -39.62158203125, -38.3369140625, -37.05224609375, -35.767578125, -34.48291015625, -33.1982421875, -31.91357421875, -30.62890625, -29.34423828125, -28.0595703125, -26.77490234375, -25.490234375, -24.20556640625, -22.9208984375, -21.63623046875, -20.3515625, -19.06689453125, -17.7822265625, -16.49755859375, -15.212890625, -13.92822265625, -12.6435546875, -11.35888671875, -10.07421875, -8.78955078125, -7.5048828125, -6.22021484375, -4.935546875, -3.65087890625, -2.3662109375, -1.08154296875, 0.203125, 1.48779296875, 2.7724609375, 4.05712890625, 5.341796875, 6.62646484375, 7.9111328125, 9.19580078125, 10.48046875, 11.76513671875, 13.0498046875, 14.33447265625, 15.619140625, 16.90380859375, 18.1884765625, 19.47314453125, 20.7578125, 22.04248046875, 23.3271484375, 24.61181640625, 25.896484375, 27.18115234375, 28.4658203125, 29.75048828125, 31.03515625, 32.31982421875, 33.6044921875, 34.88916015625, 36.173828125, 37.45849609375, 38.7431640625, 40.02783203125, 41.3125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 7.0, 0.0, 0.0, 7.0, 21.0, 33.0, 44.0, 41.0, 52.0, 90.0, 114.0, 202.0, 372.0, 545.0, 911.0, 1812.0, 3109.0, 5692.0, 11684.0, 25454.0, 62014.0, 175565.0, 662165.0, 4546080.0, 541472.0, 153326.0, 54989.0, 22893.0, 10549.0, 5156.0, 2874.0, 1641.0, 886.0, 613.0, 343.0, 206.0, 106.0, 74.0, 58.0, 69.0, 53.0, 47.0, 26.0, 16.0, 14.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0], "bins": [-32.3125, -31.09033203125, -29.8681640625, -28.64599609375, -27.423828125, -26.20166015625, -24.9794921875, -23.75732421875, -22.53515625, -21.31298828125, -20.0908203125, -18.86865234375, -17.646484375, -16.42431640625, -15.2021484375, -13.97998046875, -12.7578125, -11.53564453125, -10.3134765625, -9.09130859375, -7.869140625, -6.64697265625, -5.4248046875, -4.20263671875, -2.98046875, -1.75830078125, -0.5361328125, 0.68603515625, 1.908203125, 3.13037109375, 4.3525390625, 5.57470703125, 6.796875, 8.01904296875, 9.2412109375, 10.46337890625, 11.685546875, 12.90771484375, 14.1298828125, 15.35205078125, 16.57421875, 17.79638671875, 19.0185546875, 20.24072265625, 21.462890625, 22.68505859375, 23.9072265625, 25.12939453125, 26.3515625, 27.57373046875, 28.7958984375, 30.01806640625, 31.240234375, 32.46240234375, 33.6845703125, 34.90673828125, 36.12890625, 37.35107421875, 38.5732421875, 39.79541015625, 41.017578125, 42.23974609375, 43.4619140625, 44.68408203125, 45.90625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 4.0, 8.0, 8.0, 9.0, 9.0, 14.0, 17.0, 32.0, 33.0, 41.0, 34.0, 52.0, 49.0, 83.0, 147.0, 380.0, 506.0, 156.0, 90.0, 58.0, 39.0, 49.0, 43.0, 32.0, 24.0, 28.0, 15.0, 13.0, 13.0, 9.0, 4.0, 4.0, 3.0, 7.0, 3.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-33.53125, -32.337890625, -31.14453125, -29.951171875, -28.7578125, -27.564453125, -26.37109375, -25.177734375, -23.984375, -22.791015625, -21.59765625, -20.404296875, -19.2109375, -18.017578125, -16.82421875, -15.630859375, -14.4375, -13.244140625, -12.05078125, -10.857421875, -9.6640625, -8.470703125, -7.27734375, -6.083984375, -4.890625, -3.697265625, -2.50390625, -1.310546875, -0.1171875, 1.076171875, 2.26953125, 3.462890625, 4.65625, 5.849609375, 7.04296875, 8.236328125, 9.4296875, 10.623046875, 11.81640625, 13.009765625, 14.203125, 15.396484375, 16.58984375, 17.783203125, 18.9765625, 20.169921875, 21.36328125, 22.556640625, 23.75, 24.943359375, 26.13671875, 27.330078125, 28.5234375, 29.716796875, 30.91015625, 32.103515625, 33.296875, 34.490234375, 35.68359375, 36.876953125, 38.0703125, 39.263671875, 40.45703125, 41.650390625, 42.84375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 6.0, 0.0, 4.0, 8.0, 6.0, 24.0, 52.0, 60.0, 53.0, 136.0, 156.0, 288.0, 440.0, 704.0, 1228.0, 2354.0, 5048.0, 13448.0, 57989.0, 6052491.0, 123029.0, 20500.0, 6633.0, 2925.0, 1579.0, 840.0, 506.0, 347.0, 236.0, 99.0, 78.0, 49.0, 38.0, 23.0, 17.0, 8.0, 0.0, 15.0, 2.0, 12.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-148.875, -144.453125, -140.03125, -135.609375, -131.1875, -126.765625, -122.34375, -117.921875, -113.5, -109.078125, -104.65625, -100.234375, -95.8125, -91.390625, -86.96875, -82.546875, -78.125, -73.703125, -69.28125, -64.859375, -60.4375, -56.015625, -51.59375, -47.171875, -42.75, -38.328125, -33.90625, -29.484375, -25.0625, -20.640625, -16.21875, -11.796875, -7.375, -2.953125, 1.46875, 5.890625, 10.3125, 14.734375, 19.15625, 23.578125, 28.0, 32.421875, 36.84375, 41.265625, 45.6875, 50.109375, 54.53125, 58.953125, 63.375, 67.796875, 72.21875, 76.640625, 81.0625, 85.484375, 89.90625, 94.328125, 98.75, 103.171875, 107.59375, 112.015625, 116.4375, 120.859375, 125.28125, 129.703125, 134.125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 12.0, 15.0, 18.0, 23.0, 30.0, 28.0, 35.0, 42.0, 58.0, 76.0, 135.0, 369.0, 589.0, 145.0, 90.0, 72.0, 46.0, 50.0, 29.0, 26.0, 26.0, 17.0, 19.0, 18.0, 11.0, 3.0, 7.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-54.5, -53.210693359375, -51.92138671875, -50.632080078125, -49.3427734375, -48.053466796875, -46.76416015625, -45.474853515625, -44.185546875, -42.896240234375, -41.60693359375, -40.317626953125, -39.0283203125, -37.739013671875, -36.44970703125, -35.160400390625, -33.87109375, -32.581787109375, -31.29248046875, -30.003173828125, -28.7138671875, -27.424560546875, -26.13525390625, -24.845947265625, -23.556640625, -22.267333984375, -20.97802734375, -19.688720703125, -18.3994140625, -17.110107421875, -15.82080078125, -14.531494140625, -13.2421875, -11.952880859375, -10.66357421875, -9.374267578125, -8.0849609375, -6.795654296875, -5.50634765625, -4.217041015625, -2.927734375, -1.638427734375, -0.34912109375, 0.940185546875, 2.2294921875, 3.518798828125, 4.80810546875, 6.097412109375, 7.38671875, 8.676025390625, 9.96533203125, 11.254638671875, 12.5439453125, 13.833251953125, 15.12255859375, 16.411865234375, 17.701171875, 18.990478515625, 20.27978515625, 21.569091796875, 22.8583984375, 24.147705078125, 25.43701171875, 26.726318359375, 28.015625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 6.0, 16.0, 36.0, 57.0, 178.0, 457.0, 140.0, 54.0, 21.0, 8.0, 10.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.2786407470703, -205.92442321777344, -200.57020568847656, -195.21600341796875, -189.86178588867188, -184.507568359375, -179.15335083007812, -173.79913330078125, -168.44491577148438, -163.0906982421875, -157.73648071289062, -152.38226318359375, -147.02806091308594, -141.67384338378906, -136.3196258544922, -130.9654083251953, -125.6112060546875, -120.25698852539062, -114.90277862548828, -109.5485610961914, -104.19435119628906, -98.84013366699219, -93.48591613769531, -88.13169860839844, -82.7774887084961, -77.42327117919922, -72.06906127929688, -66.71484375, -61.36063003540039, -56.00641632080078, -50.652198791503906, -45.2979850769043, -39.94378662109375, -34.58957290649414, -29.2353572845459, -23.881141662597656, -18.526927947998047, -13.172714233398438, -7.8184967041015625, -2.464282989501953, 2.8899307250976562, 8.244145393371582, 13.598360061645508, 18.95257568359375, 24.30678939819336, 29.66100311279297, 35.015220642089844, 40.36943435668945, 45.72364807128906, 51.07786178588867, 56.43207550048828, 61.786293029785156, 67.1405029296875, 72.49472045898438, 77.84893798828125, 83.20315551757812, 88.55736541748047, 93.91158294677734, 99.26579284667969, 104.62001037597656, 109.97422790527344, 115.32843780517578, 120.68265533447266, 126.036865234375, 131.39108276367188]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 6.0, 3.0, 16.0, 22.0, 53.0, 60.0, 84.0, 101.0, 122.0, 144.0, 112.0, 90.0, 74.0, 47.0, 31.0, 16.0, 10.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-192.77662658691406, -188.59075927734375, -184.40489196777344, -180.21902465820312, -176.0331573486328, -171.8472900390625, -167.66143798828125, -163.47557067871094, -159.28970336914062, -155.1038360595703, -150.91796875, -146.7321014404297, -142.54623413085938, -138.36038208007812, -134.17449951171875, -129.9886474609375, -125.80277252197266, -121.61690521240234, -117.43103790283203, -113.24517822265625, -109.05931091308594, -104.87344360351562, -100.68757629394531, -96.501708984375, -92.31584167480469, -88.12997436523438, -83.94410705566406, -79.75823974609375, -75.57238006591797, -71.38651275634766, -67.20064544677734, -63.01477813720703, -58.82892608642578, -54.64305877685547, -50.45719528198242, -46.27132797241211, -42.08546447753906, -37.89959716796875, -33.71372985839844, -29.527864456176758, -25.341999053955078, -21.1561336517334, -16.97026824951172, -12.784400939941406, -8.598535537719727, -4.412670135498047, -0.22680282592773438, 3.9590625762939453, 8.144927978515625, 12.330793380737305, 16.516658782958984, 20.702526092529297, 24.888391494750977, 29.074256896972656, 33.26012420654297, 37.44599151611328, 41.63185501098633, 45.81772232055664, 50.00358581542969, 54.189453125, 58.37532043457031, 62.56118392944336, 66.74705505371094, 70.93291473388672, 75.11878204345703]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 16.0, 13.0, 18.0, 17.0, 29.0, 37.0, 41.0, 63.0, 95.0, 115.0, 180.0, 278.0, 405.0, 690.0, 1136.0, 1984.0, 3803.0, 7911.0, 19833.0, 81208.0, 3989408.0, 64379.0, 13830.0, 4658.0, 1895.0, 973.0, 486.0, 289.0, 181.0, 100.0, 68.0, 41.0, 32.0, 16.0, 11.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.5087890625, -0.49651336669921875, -0.4842376708984375, -0.47196197509765625, -0.459686279296875, -0.44741058349609375, -0.4351348876953125, -0.42285919189453125, -0.41058349609375, -0.39830780029296875, -0.3860321044921875, -0.37375640869140625, -0.361480712890625, -0.34920501708984375, -0.3369293212890625, -0.32465362548828125, -0.3123779296875, -0.30010223388671875, -0.2878265380859375, -0.27555084228515625, -0.263275146484375, -0.25099945068359375, -0.2387237548828125, -0.22644805908203125, -0.21417236328125, -0.20189666748046875, -0.1896209716796875, -0.17734527587890625, -0.165069580078125, -0.15279388427734375, -0.1405181884765625, -0.12824249267578125, -0.115966796875, -0.10369110107421875, -0.0914154052734375, -0.07913970947265625, -0.066864013671875, -0.05458831787109375, -0.0423126220703125, -0.03003692626953125, -0.01776123046875, -0.00548553466796875, 0.0067901611328125, 0.01906585693359375, 0.031341552734375, 0.04361724853515625, 0.0558929443359375, 0.06816864013671875, 0.0804443359375, 0.09272003173828125, 0.1049957275390625, 0.11727142333984375, 0.129547119140625, 0.14182281494140625, 0.1540985107421875, 0.16637420654296875, 0.17864990234375, 0.19092559814453125, 0.2032012939453125, 0.21547698974609375, 0.227752685546875, 0.24002838134765625, 0.2523040771484375, 0.26457977294921875, 0.27685546875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 3.0, 9.0, 16.0, 21.0, 33.0, 770.0, 54.0, 20.0, 12.0, 16.0, 16.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07501220703125, -0.07320261001586914, -0.07139301300048828, -0.06958341598510742, -0.06777381896972656, -0.0659642219543457, -0.06415462493896484, -0.062345027923583984, -0.060535430908203125, -0.058725833892822266, -0.056916236877441406, -0.05510663986206055, -0.05329704284667969, -0.05148744583129883, -0.04967784881591797, -0.04786825180053711, -0.04605865478515625, -0.04424905776977539, -0.04243946075439453, -0.04062986373901367, -0.03882026672363281, -0.03701066970825195, -0.035201072692871094, -0.033391475677490234, -0.031581878662109375, -0.029772281646728516, -0.027962684631347656, -0.026153087615966797, -0.024343490600585938, -0.022533893585205078, -0.02072429656982422, -0.01891469955444336, -0.0171051025390625, -0.01529550552368164, -0.013485908508300781, -0.011676311492919922, -0.009866714477539062, -0.008057117462158203, -0.006247520446777344, -0.004437923431396484, -0.002628326416015625, -0.0008187294006347656, 0.0009908676147460938, 0.002800464630126953, 0.0046100616455078125, 0.006419658660888672, 0.008229255676269531, 0.01003885269165039, 0.01184844970703125, 0.01365804672241211, 0.015467643737792969, 0.017277240753173828, 0.019086837768554688, 0.020896434783935547, 0.022706031799316406, 0.024515628814697266, 0.026325225830078125, 0.028134822845458984, 0.029944419860839844, 0.0317540168762207, 0.03356361389160156, 0.03537321090698242, 0.03718280792236328, 0.03899240493774414, 0.040802001953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 9.0, 9.0, 18.0, 22.0, 32.0, 50.0, 66.0, 147.0, 178.0, 306.0, 585.0, 1152.0, 2426.0, 6128.0, 16893.0, 56099.0, 278407.0, 3347558.0, 385664.0, 67267.0, 19378.0, 6628.0, 2634.0, 1235.0, 568.0, 280.0, 188.0, 129.0, 69.0, 45.0, 38.0, 21.0, 14.0, 9.0, 5.0, 4.0, 4.0, 7.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267822265625, -0.2584495544433594, -0.24907684326171875, -0.23970413208007812, -0.2303314208984375, -0.22095870971679688, -0.21158599853515625, -0.20221328735351562, -0.192840576171875, -0.18346786499023438, -0.17409515380859375, -0.16472244262695312, -0.1553497314453125, -0.14597702026367188, -0.13660430908203125, -0.12723159790039062, -0.11785888671875, -0.10848617553710938, -0.09911346435546875, -0.08974075317382812, -0.0803680419921875, -0.07099533081054688, -0.06162261962890625, -0.052249908447265625, -0.042877197265625, -0.033504486083984375, -0.02413177490234375, -0.014759063720703125, -0.0053863525390625, 0.003986358642578125, 0.01335906982421875, 0.022731781005859375, 0.0321044921875, 0.041477203369140625, 0.05084991455078125, 0.060222625732421875, 0.0695953369140625, 0.07896804809570312, 0.08834075927734375, 0.09771347045898438, 0.107086181640625, 0.11645889282226562, 0.12583160400390625, 0.13520431518554688, 0.1445770263671875, 0.15394973754882812, 0.16332244873046875, 0.17269515991210938, 0.18206787109375, 0.19144058227539062, 0.20081329345703125, 0.21018600463867188, 0.2195587158203125, 0.22893142700195312, 0.23830413818359375, 0.24767684936523438, 0.257049560546875, 0.2664222717285156, 0.27579498291015625, 0.2851676940917969, 0.2945404052734375, 0.3039131164550781, 0.31328582763671875, 0.3226585388183594, 0.33203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 1.0, 2.0, 3.0, 8.0, 7.0, 11.0, 12.0, 13.0, 12.0, 17.0, 30.0, 31.0, 35.0, 41.0, 49.0, 58.0, 81.0, 103.0, 124.0, 194.0, 221.0, 342.0, 770.0, 659.0, 312.0, 204.0, 136.0, 125.0, 92.0, 68.0, 57.0, 53.0, 34.0, 32.0, 30.0, 19.0, 17.0, 12.0, 14.0, 9.0, 9.0, 6.0, 10.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052459716796875, -0.05086803436279297, -0.04927635192871094, -0.047684669494628906, -0.046092987060546875, -0.044501304626464844, -0.04290962219238281, -0.04131793975830078, -0.03972625732421875, -0.03813457489013672, -0.03654289245605469, -0.034951210021972656, -0.033359527587890625, -0.031767845153808594, -0.030176162719726562, -0.02858448028564453, -0.0269927978515625, -0.02540111541748047, -0.023809432983398438, -0.022217750549316406, -0.020626068115234375, -0.019034385681152344, -0.017442703247070312, -0.01585102081298828, -0.01425933837890625, -0.012667655944824219, -0.011075973510742188, -0.009484291076660156, -0.007892608642578125, -0.006300926208496094, -0.0047092437744140625, -0.0031175613403320312, -0.00152587890625, 6.580352783203125e-05, 0.0016574859619140625, 0.0032491683959960938, 0.004840850830078125, 0.006432533264160156, 0.008024215698242188, 0.009615898132324219, 0.01120758056640625, 0.012799263000488281, 0.014390945434570312, 0.015982627868652344, 0.017574310302734375, 0.019165992736816406, 0.020757675170898438, 0.02234935760498047, 0.0239410400390625, 0.02553272247314453, 0.027124404907226562, 0.028716087341308594, 0.030307769775390625, 0.031899452209472656, 0.03349113464355469, 0.03508281707763672, 0.03667449951171875, 0.03826618194580078, 0.03985786437988281, 0.041449546813964844, 0.043041229248046875, 0.044632911682128906, 0.04622459411621094, 0.04781627655029297, 0.049407958984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 5.0, 7.0, 10.0, 29.0, 49.0, 160.0, 305.0, 244.0, 96.0, 52.0, 23.0, 11.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3530807495117188, -1.3235763311386108, -1.2940720319747925, -1.2645676136016846, -1.2350633144378662, -1.2055588960647583, -1.1760544776916504, -1.146550178527832, -1.1170457601547241, -1.0875413417816162, -1.0580370426177979, -1.02853262424469, -0.9990282654762268, -0.9695239067077637, -0.9400195479393005, -0.9105151891708374, -0.881010890007019, -0.8515065312385559, -0.8220021724700928, -0.7924977540969849, -0.7629933953285217, -0.7334890365600586, -0.7039846777915955, -0.6744803190231323, -0.6449759006500244, -0.6154715418815613, -0.5859671831130981, -0.5564627647399902, -0.5269584059715271, -0.49745404720306396, -0.46794968843460083, -0.4384453296661377, -0.40894097089767456, -0.3794366121292114, -0.3499322235584259, -0.32042786478996277, -0.29092350602149963, -0.2614191174507141, -0.23191475868225098, -0.20241039991378784, -0.1729060262441635, -0.14340165257453918, -0.11389729380607605, -0.08439292013645172, -0.05488855391740799, -0.025384187698364258, 0.004120185971260071, 0.033624544739723206, 0.06312891840934753, 0.09263328462839127, 0.122137650847435, 0.15164202451705933, 0.18114638328552246, 0.2106507569551468, 0.24015513062477112, 0.26965948939323425, 0.2991638779640198, 0.3286682367324829, 0.35817262530326843, 0.38767698407173157, 0.4171813428401947, 0.4466857314109802, 0.47619009017944336, 0.5056944489479065, 0.5351988077163696]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 12.0, 18.0, 17.0, 19.0, 31.0, 30.0, 36.0, 46.0, 58.0, 55.0, 75.0, 78.0, 75.0, 64.0, 75.0, 67.0, 51.0, 39.0, 36.0, 32.0, 19.0, 15.0, 20.0, 7.0, 9.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3119039535522461, -0.29974228143692017, -0.28758060932159424, -0.2754189670085907, -0.26325729489326477, -0.25109562277793884, -0.2389339655637741, -0.22677230834960938, -0.21461063623428345, -0.20244896411895752, -0.19028730690479279, -0.17812564969062805, -0.16596397757530212, -0.1538023054599762, -0.14164064824581146, -0.12947899103164673, -0.1173173189163208, -0.10515565425157547, -0.09299398958683014, -0.08083232492208481, -0.06867066025733948, -0.05650899559259415, -0.044347330927848816, -0.032185666263103485, -0.020024001598358154, -0.007862336933612823, 0.004299327731132507, 0.016460992395877838, 0.02862265706062317, 0.0407843217253685, 0.05294598639011383, 0.06510765105485916, 0.07726931571960449, 0.08943098038434982, 0.10159264504909515, 0.11375430971384048, 0.12591597437858582, 0.13807764649391174, 0.15023930370807648, 0.1624009609222412, 0.17456263303756714, 0.18672430515289307, 0.1988859623670578, 0.21104761958122253, 0.22320929169654846, 0.2353709638118744, 0.24753262102603912, 0.25969427824020386, 0.2718559503555298, 0.2840176224708557, 0.29617929458618164, 0.3083409368991852, 0.3205026090145111, 0.33266428112983704, 0.3448259234428406, 0.3569875955581665, 0.36914926767349243, 0.38131093978881836, 0.3934726119041443, 0.4056342542171478, 0.41779592633247375, 0.4299575984477997, 0.4421192407608032, 0.45428091287612915, 0.4664425849914551]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 3.0, 6.0, 9.0, 11.0, 29.0, 33.0, 33.0, 56.0, 85.0, 126.0, 200.0, 342.0, 598.0, 1117.0, 2465.0, 5838.0, 17586.0, 242036.0, 743067.0, 22215.0, 6997.0, 2812.0, 1298.0, 638.0, 369.0, 223.0, 112.0, 70.0, 42.0, 38.0, 30.0, 15.0, 14.0, 15.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.471923828125, -0.45721435546875, -0.4425048828125, -0.42779541015625, -0.4130859375, -0.39837646484375, -0.3836669921875, -0.36895751953125, -0.354248046875, -0.33953857421875, -0.3248291015625, -0.31011962890625, -0.29541015625, -0.28070068359375, -0.2659912109375, -0.25128173828125, -0.236572265625, -0.22186279296875, -0.2071533203125, -0.19244384765625, -0.177734375, -0.16302490234375, -0.1483154296875, -0.13360595703125, -0.118896484375, -0.10418701171875, -0.0894775390625, -0.07476806640625, -0.06005859375, -0.04534912109375, -0.0306396484375, -0.01593017578125, -0.001220703125, 0.01348876953125, 0.0281982421875, 0.04290771484375, 0.0576171875, 0.07232666015625, 0.0870361328125, 0.10174560546875, 0.116455078125, 0.13116455078125, 0.1458740234375, 0.16058349609375, 0.17529296875, 0.19000244140625, 0.2047119140625, 0.21942138671875, 0.234130859375, 0.24884033203125, 0.2635498046875, 0.27825927734375, 0.29296875, 0.30767822265625, 0.3223876953125, 0.33709716796875, 0.351806640625, 0.36651611328125, 0.3812255859375, 0.39593505859375, 0.41064453125, 0.42535400390625, 0.4400634765625, 0.45477294921875, 0.469482421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 6.0, 10.0, 11.0, 9.0, 24.0, 100.0, 340.0, 316.0, 90.0, 26.0, 15.0, 13.0, 11.0, 10.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055267333984375, -0.05372333526611328, -0.05217933654785156, -0.050635337829589844, -0.049091339111328125, -0.047547340393066406, -0.04600334167480469, -0.04445934295654297, -0.04291534423828125, -0.04137134552001953, -0.03982734680175781, -0.038283348083496094, -0.036739349365234375, -0.035195350646972656, -0.03365135192871094, -0.03210735321044922, -0.0305633544921875, -0.02901935577392578, -0.027475357055664062, -0.025931358337402344, -0.024387359619140625, -0.022843360900878906, -0.021299362182617188, -0.01975536346435547, -0.01821136474609375, -0.01666736602783203, -0.015123367309570312, -0.013579368591308594, -0.012035369873046875, -0.010491371154785156, -0.008947372436523438, -0.007403373718261719, -0.005859375, -0.004315376281738281, -0.0027713775634765625, -0.0012273788452148438, 0.000316619873046875, 0.0018606185913085938, 0.0034046173095703125, 0.004948616027832031, 0.00649261474609375, 0.008036613464355469, 0.009580612182617188, 0.011124610900878906, 0.012668609619140625, 0.014212608337402344, 0.015756607055664062, 0.01730060577392578, 0.0188446044921875, 0.02038860321044922, 0.021932601928710938, 0.023476600646972656, 0.025020599365234375, 0.026564598083496094, 0.028108596801757812, 0.02965259552001953, 0.03119659423828125, 0.03274059295654297, 0.03428459167480469, 0.035828590393066406, 0.037372589111328125, 0.038916587829589844, 0.04046058654785156, 0.04200458526611328, 0.043548583984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 3.0, 12.0, 14.0, 13.0, 14.0, 14.0, 22.0, 33.0, 59.0, 93.0, 116.0, 184.0, 265.0, 442.0, 664.0, 1101.0, 2125.0, 4208.0, 11376.0, 46196.0, 508823.0, 412061.0, 41555.0, 10205.0, 3976.0, 1976.0, 1133.0, 624.0, 439.0, 254.0, 170.0, 107.0, 76.0, 60.0, 35.0, 17.0, 23.0, 19.0, 13.0, 9.0, 9.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.3662109375, -0.3547554016113281, -0.34329986572265625, -0.3318443298339844, -0.3203887939453125, -0.3089332580566406, -0.29747772216796875, -0.2860221862792969, -0.274566650390625, -0.2631111145019531, -0.25165557861328125, -0.24020004272460938, -0.2287445068359375, -0.21728897094726562, -0.20583343505859375, -0.19437789916992188, -0.18292236328125, -0.17146682739257812, -0.16001129150390625, -0.14855575561523438, -0.1371002197265625, -0.12564468383789062, -0.11418914794921875, -0.10273361206054688, -0.091278076171875, -0.07982254028320312, -0.06836700439453125, -0.056911468505859375, -0.0454559326171875, -0.034000396728515625, -0.02254486083984375, -0.011089324951171875, 0.0003662109375, 0.011821746826171875, 0.02327728271484375, 0.034732818603515625, 0.0461883544921875, 0.057643890380859375, 0.06909942626953125, 0.08055496215820312, 0.092010498046875, 0.10346603393554688, 0.11492156982421875, 0.12637710571289062, 0.1378326416015625, 0.14928817749023438, 0.16074371337890625, 0.17219924926757812, 0.18365478515625, 0.19511032104492188, 0.20656585693359375, 0.21802139282226562, 0.2294769287109375, 0.24093246459960938, 0.25238800048828125, 0.2638435363769531, 0.275299072265625, 0.2867546081542969, 0.29821014404296875, 0.3096656799316406, 0.3211212158203125, 0.3325767517089844, 0.34403228759765625, 0.3554878234863281, 0.366943359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 14.0, 13.0, 14.0, 18.0, 22.0, 20.0, 25.0, 17.0, 32.0, 31.0, 40.0, 35.0, 39.0, 44.0, 48.0, 36.0, 40.0, 36.0, 40.0, 41.0, 28.0, 38.0, 43.0, 33.0, 28.0, 36.0, 32.0, 18.0, 17.0, 24.0, 17.0, 10.0, 14.0, 6.0, 10.0, 7.0, 0.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1292724609375, -0.12526512145996094, -0.12125778198242188, -0.11725044250488281, -0.11324310302734375, -0.10923576354980469, -0.10522842407226562, -0.10122108459472656, -0.0972137451171875, -0.09320640563964844, -0.08919906616210938, -0.08519172668457031, -0.08118438720703125, -0.07717704772949219, -0.07316970825195312, -0.06916236877441406, -0.065155029296875, -0.06114768981933594, -0.057140350341796875, -0.05313301086425781, -0.04912567138671875, -0.04511833190917969, -0.041110992431640625, -0.03710365295410156, -0.0330963134765625, -0.029088973999023438, -0.025081634521484375, -0.021074295043945312, -0.01706695556640625, -0.013059616088867188, -0.009052276611328125, -0.0050449371337890625, -0.00103759765625, 0.0029697418212890625, 0.006977081298828125, 0.010984420776367188, 0.01499176025390625, 0.018999099731445312, 0.023006439208984375, 0.027013778686523438, 0.0310211181640625, 0.03502845764160156, 0.039035797119140625, 0.04304313659667969, 0.04705047607421875, 0.05105781555175781, 0.055065155029296875, 0.05907249450683594, 0.063079833984375, 0.06708717346191406, 0.07109451293945312, 0.07510185241699219, 0.07910919189453125, 0.08311653137207031, 0.08712387084960938, 0.09113121032714844, 0.0951385498046875, 0.09914588928222656, 0.10315322875976562, 0.10716056823730469, 0.11116790771484375, 0.11517524719238281, 0.11918258666992188, 0.12318992614746094, 0.127197265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 12.0, 10.0, 19.0, 23.0, 44.0, 74.0, 127.0, 218.0, 418.0, 1019.0, 3239.0, 20444.0, 960961.0, 54224.0, 5085.0, 1447.0, 553.0, 242.0, 154.0, 89.0, 38.0, 38.0, 14.0, 10.0, 11.0, 10.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5322265625, -0.5122604370117188, -0.4922943115234375, -0.47232818603515625, -0.452362060546875, -0.43239593505859375, -0.4124298095703125, -0.39246368408203125, -0.37249755859375, -0.35253143310546875, -0.3325653076171875, -0.31259918212890625, -0.292633056640625, -0.27266693115234375, -0.2527008056640625, -0.23273468017578125, -0.2127685546875, -0.19280242919921875, -0.1728363037109375, -0.15287017822265625, -0.132904052734375, -0.11293792724609375, -0.0929718017578125, -0.07300567626953125, -0.05303955078125, -0.03307342529296875, -0.0131072998046875, 0.00685882568359375, 0.026824951171875, 0.04679107666015625, 0.0667572021484375, 0.08672332763671875, 0.106689453125, 0.12665557861328125, 0.1466217041015625, 0.16658782958984375, 0.186553955078125, 0.20652008056640625, 0.2264862060546875, 0.24645233154296875, 0.26641845703125, 0.28638458251953125, 0.3063507080078125, 0.32631683349609375, 0.346282958984375, 0.36624908447265625, 0.3862152099609375, 0.40618133544921875, 0.4261474609375, 0.44611358642578125, 0.4660797119140625, 0.48604583740234375, 0.506011962890625, 0.5259780883789062, 0.5459442138671875, 0.5659103393554688, 0.58587646484375, 0.6058425903320312, 0.6258087158203125, 0.6457748413085938, 0.665740966796875, 0.6857070922851562, 0.7056732177734375, 0.7256393432617188, 0.74560546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 3.0, 4.0, 9.0, 13.0, 15.0, 61.0, 125.0, 210.0, 272.0, 142.0, 61.0, 22.0, 19.0, 10.0, 6.0, 4.0, 3.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.950429916381836e-05, -2.863723784685135e-05, -2.777017652988434e-05, -2.6903115212917328e-05, -2.6036053895950317e-05, -2.5168992578983307e-05, -2.4301931262016296e-05, -2.3434869945049286e-05, -2.2567808628082275e-05, -2.1700747311115265e-05, -2.0833685994148254e-05, -1.9966624677181244e-05, -1.9099563360214233e-05, -1.8232502043247223e-05, -1.7365440726280212e-05, -1.6498379409313202e-05, -1.563131809234619e-05, -1.4764256775379181e-05, -1.389719545841217e-05, -1.303013414144516e-05, -1.216307282447815e-05, -1.1296011507511139e-05, -1.0428950190544128e-05, -9.561888873577118e-06, -8.694827556610107e-06, -7.827766239643097e-06, -6.9607049226760864e-06, -6.093643605709076e-06, -5.2265822887420654e-06, -4.359520971775055e-06, -3.4924596548080444e-06, -2.625398337841034e-06, -1.7583370208740234e-06, -8.912757039070129e-07, -2.421438694000244e-08, 8.428469300270081e-07, 1.7099082469940186e-06, 2.576969563961029e-06, 3.4440308809280396e-06, 4.31109219789505e-06, 5.1781535148620605e-06, 6.045214831829071e-06, 6.9122761487960815e-06, 7.779337465763092e-06, 8.646398782730103e-06, 9.513460099697113e-06, 1.0380521416664124e-05, 1.1247582733631134e-05, 1.2114644050598145e-05, 1.2981705367565155e-05, 1.3848766684532166e-05, 1.4715828001499176e-05, 1.5582889318466187e-05, 1.6449950635433197e-05, 1.7317011952400208e-05, 1.8184073269367218e-05, 1.905113458633423e-05, 1.991819590330124e-05, 2.078525722026825e-05, 2.165231853723526e-05, 2.251937985420227e-05, 2.338644117116928e-05, 2.425350248813629e-05, 2.5120563805103302e-05, 2.5987625122070312e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 12.0, 11.0, 24.0, 20.0, 29.0, 44.0, 62.0, 89.0, 136.0, 210.0, 325.0, 560.0, 1049.0, 2029.0, 4354.0, 11468.0, 43116.0, 586591.0, 345633.0, 34529.0, 10026.0, 3845.0, 1847.0, 998.0, 528.0, 345.0, 206.0, 152.0, 90.0, 57.0, 26.0, 31.0, 27.0, 24.0, 11.0, 10.0, 12.0, 10.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.25927734375, -0.2516365051269531, -0.24399566650390625, -0.23635482788085938, -0.2287139892578125, -0.22107315063476562, -0.21343231201171875, -0.20579147338867188, -0.198150634765625, -0.19050979614257812, -0.18286895751953125, -0.17522811889648438, -0.1675872802734375, -0.15994644165039062, -0.15230560302734375, -0.14466476440429688, -0.13702392578125, -0.12938308715820312, -0.12174224853515625, -0.11410140991210938, -0.1064605712890625, -0.09881973266601562, -0.09117889404296875, -0.08353805541992188, -0.075897216796875, -0.06825637817382812, -0.06061553955078125, -0.052974700927734375, -0.0453338623046875, -0.037693023681640625, -0.03005218505859375, -0.022411346435546875, -0.0147705078125, -0.007129669189453125, 0.00051116943359375, 0.008152008056640625, 0.0157928466796875, 0.023433685302734375, 0.03107452392578125, 0.038715362548828125, 0.046356201171875, 0.053997039794921875, 0.06163787841796875, 0.06927871704101562, 0.0769195556640625, 0.08456039428710938, 0.09220123291015625, 0.09984207153320312, 0.10748291015625, 0.11512374877929688, 0.12276458740234375, 0.13040542602539062, 0.1380462646484375, 0.14568710327148438, 0.15332794189453125, 0.16096878051757812, 0.168609619140625, 0.17625045776367188, 0.18389129638671875, 0.19153213500976562, 0.1991729736328125, 0.20681381225585938, 0.21445465087890625, 0.22209548950195312, 0.229736328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 4.0, 4.0, 10.0, 13.0, 21.0, 16.0, 20.0, 34.0, 42.0, 51.0, 85.0, 87.0, 123.0, 115.0, 79.0, 70.0, 58.0, 43.0, 22.0, 17.0, 16.0, 18.0, 8.0, 11.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12519073486328125, -0.1209869384765625, -0.11678314208984375, -0.112579345703125, -0.10837554931640625, -0.1041717529296875, -0.09996795654296875, -0.09576416015625, -0.09156036376953125, -0.0873565673828125, -0.08315277099609375, -0.078948974609375, -0.07474517822265625, -0.0705413818359375, -0.06633758544921875, -0.0621337890625, -0.05792999267578125, -0.0537261962890625, -0.04952239990234375, -0.045318603515625, -0.04111480712890625, -0.0369110107421875, -0.03270721435546875, -0.02850341796875, -0.02429962158203125, -0.0200958251953125, -0.01589202880859375, -0.011688232421875, -0.00748443603515625, -0.0032806396484375, 0.00092315673828125, 0.005126953125, 0.00933074951171875, 0.0135345458984375, 0.01773834228515625, 0.021942138671875, 0.02614593505859375, 0.0303497314453125, 0.03455352783203125, 0.03875732421875, 0.04296112060546875, 0.0471649169921875, 0.05136871337890625, 0.055572509765625, 0.05977630615234375, 0.0639801025390625, 0.06818389892578125, 0.0723876953125, 0.07659149169921875, 0.0807952880859375, 0.08499908447265625, 0.089202880859375, 0.09340667724609375, 0.0976104736328125, 0.10181427001953125, 0.10601806640625, 0.11022186279296875, 0.1144256591796875, 0.11862945556640625, 0.122833251953125, 0.12703704833984375, 0.1312408447265625, 0.13544464111328125, 0.1396484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 17.0, 39.0, 137.0, 437.0, 210.0, 65.0, 35.0, 19.0, 7.0, 11.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-5.813207626342773, -5.685390472412109, -5.557573318481445, -5.429756164550781, -5.301939010620117, -5.174122333526611, -5.046305179595947, -4.918488025665283, -4.790670871734619, -4.662853717803955, -4.535036563873291, -4.407219409942627, -4.279402732849121, -4.151585578918457, -4.023768424987793, -3.895951271057129, -3.768134117126465, -3.640316963195801, -3.5124998092651367, -3.3846828937530518, -3.2568657398223877, -3.1290485858917236, -3.0012316703796387, -2.8734145164489746, -2.7455973625183105, -2.6177802085876465, -2.4899630546569824, -2.3621461391448975, -2.2343289852142334, -2.1065118312835693, -1.9786947965621948, -1.8508777618408203, -1.7230610847473145, -1.5952439308166504, -1.4674268960952759, -1.3396098613739014, -1.2117927074432373, -1.0839755535125732, -0.9561585187911987, -0.8283414244651794, -0.7005243301391602, -0.5727072358131409, -0.4448901414871216, -0.3170730471611023, -0.189255952835083, -0.06143885850906372, 0.06637823581695557, 0.19419533014297485, 0.32201242446899414, 0.4498295187950134, 0.5776466131210327, 0.705463707447052, 0.8332808017730713, 0.9610978960990906, 1.0889149904251099, 1.2167320251464844, 1.3445491790771484, 1.4723663330078125, 1.600183367729187, 1.7280004024505615, 1.8558175563812256, 1.9836347103118896, 2.1114516258239746, 2.2392687797546387, 2.3670859336853027]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 7.0, 4.0, 15.0, 19.0, 17.0, 41.0, 70.0, 113.0, 141.0, 180.0, 128.0, 108.0, 46.0, 26.0, 24.0, 10.0, 15.0, 6.0, 2.0, 6.0, 6.0, 6.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3744959831237793, -3.2789382934570312, -3.1833808422088623, -3.0878231525421143, -2.992265462875366, -2.8967080116271973, -2.801150321960449, -2.705592632293701, -2.6100351810455322, -2.514477491378784, -2.4189200401306152, -2.323362350463867, -2.227804660797119, -2.13224720954895, -2.036689519882202, -1.9411319494247437, -1.8455742597579956, -1.750016689300537, -1.654458999633789, -1.5589014291763306, -1.463343858718872, -1.367786169052124, -1.2722285985946655, -1.176671028137207, -1.081113338470459, -0.9855557084083557, -0.8899981379508972, -0.794440507888794, -0.6988829374313354, -0.6033253073692322, -0.5077676773071289, -0.4122101068496704, -0.3166525363922119, -0.22109493613243103, -0.12553732097148895, -0.029979705810546875, 0.06557789444923401, 0.1611354947090149, 0.25669312477111816, 0.35225069522857666, 0.44780832529067993, 0.5433659553527832, 0.6389235258102417, 0.734481155872345, 0.8300387859344482, 0.9255963563919067, 1.0211539268493652, 1.1167116165161133, 1.2122691869735718, 1.3078267574310303, 1.4033844470977783, 1.4989420175552368, 1.5944995880126953, 1.6900572776794434, 1.7856148481369019, 1.8811724185943604, 1.9767301082611084, 2.0722877979278564, 2.1678452491760254, 2.2634029388427734, 2.3589606285095215, 2.4545180797576904, 2.5500757694244385, 2.6456332206726074, 2.7411909103393555]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 12.0, 24.0, 28.0, 89.0, 385.0, 12609.0, 4180615.0, 389.0, 65.0, 23.0, 18.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.40625, -57.022705078125, -55.63916015625, -54.255615234375, -52.8720703125, -51.488525390625, -50.10498046875, -48.721435546875, -47.337890625, -45.954345703125, -44.57080078125, -43.187255859375, -41.8037109375, -40.420166015625, -39.03662109375, -37.653076171875, -36.26953125, -34.885986328125, -33.50244140625, -32.118896484375, -30.7353515625, -29.351806640625, -27.96826171875, -26.584716796875, -25.201171875, -23.817626953125, -22.43408203125, -21.050537109375, -19.6669921875, -18.283447265625, -16.89990234375, -15.516357421875, -14.1328125, -12.749267578125, -11.36572265625, -9.982177734375, -8.5986328125, -7.215087890625, -5.83154296875, -4.447998046875, -3.064453125, -1.680908203125, -0.29736328125, 1.086181640625, 2.4697265625, 3.853271484375, 5.23681640625, 6.620361328125, 8.00390625, 9.387451171875, 10.77099609375, 12.154541015625, 13.5380859375, 14.921630859375, 16.30517578125, 17.688720703125, 19.072265625, 20.455810546875, 21.83935546875, 23.222900390625, 24.6064453125, 25.989990234375, 27.37353515625, 28.757080078125, 30.140625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 7.0, 12.0, 14.0, 20.0, 29.0, 80.0, 260.0, 253.0, 158.0, 73.0, 33.0, 15.0, 10.0, 12.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06103515625, -0.059685468673706055, -0.05833578109741211, -0.056986093521118164, -0.05563640594482422, -0.05428671836853027, -0.05293703079223633, -0.05158734321594238, -0.05023765563964844, -0.04888796806335449, -0.04753828048706055, -0.0461885929107666, -0.044838905334472656, -0.04348921775817871, -0.042139530181884766, -0.04078984260559082, -0.039440155029296875, -0.03809046745300293, -0.036740779876708984, -0.03539109230041504, -0.034041404724121094, -0.03269171714782715, -0.0313420295715332, -0.029992341995239258, -0.028642654418945312, -0.027292966842651367, -0.025943279266357422, -0.024593591690063477, -0.02324390411376953, -0.021894216537475586, -0.02054452896118164, -0.019194841384887695, -0.01784515380859375, -0.016495466232299805, -0.01514577865600586, -0.013796091079711914, -0.012446403503417969, -0.011096715927124023, -0.009747028350830078, -0.008397340774536133, -0.0070476531982421875, -0.005697965621948242, -0.004348278045654297, -0.0029985904693603516, -0.0016489028930664062, -0.00029921531677246094, 0.0010504722595214844, 0.0024001598358154297, 0.003749847412109375, 0.00509953498840332, 0.006449222564697266, 0.007798910140991211, 0.009148597717285156, 0.010498285293579102, 0.011847972869873047, 0.013197660446166992, 0.014547348022460938, 0.015897035598754883, 0.017246723175048828, 0.018596410751342773, 0.01994609832763672, 0.021295785903930664, 0.02264547348022461, 0.023995161056518555, 0.0253448486328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [5.0, 8.0, 21.0, 49.0, 134.0, 388.0, 4163421.0, 29086.0, 406.0, 289.0, 209.0, 112.0, 80.0, 42.0, 24.0, 9.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.17840576171875, -1.8060302734375, -1.43365478515625, -1.061279296875, -0.68890380859375, -0.3165283203125, 0.05584716796875, 0.42822265625, 0.80059814453125, 1.1729736328125, 1.54534912109375, 1.917724609375, 2.29010009765625, 2.6624755859375, 3.03485107421875, 3.4072265625, 3.77960205078125, 4.1519775390625, 4.52435302734375, 4.896728515625, 5.26910400390625, 5.6414794921875, 6.01385498046875, 6.38623046875, 6.75860595703125, 7.1309814453125, 7.50335693359375, 7.875732421875, 8.24810791015625, 8.6204833984375, 8.99285888671875, 9.365234375, 9.73760986328125, 10.1099853515625, 10.48236083984375, 10.854736328125, 11.22711181640625, 11.5994873046875, 11.97186279296875, 12.34423828125, 12.71661376953125, 13.0889892578125, 13.46136474609375, 13.833740234375, 14.20611572265625, 14.5784912109375, 14.95086669921875, 15.3232421875, 15.69561767578125, 16.0679931640625, 16.44036865234375, 16.812744140625, 17.18511962890625, 17.5574951171875, 17.92987060546875, 18.30224609375, 18.67462158203125, 19.0469970703125, 19.41937255859375, 19.791748046875, 20.16412353515625, 20.5364990234375, 20.90887451171875, 21.28125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 16.0, 14.0, 29.0, 61.0, 125.0, 234.0, 602.0, 1653.0, 456.0, 321.0, 212.0, 136.0, 75.0, 53.0, 31.0, 18.0, 10.0, 12.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.070556640625, -0.06689643859863281, -0.06323623657226562, -0.05957603454589844, -0.05591583251953125, -0.05225563049316406, -0.048595428466796875, -0.04493522644042969, -0.0412750244140625, -0.03761482238769531, -0.033954620361328125, -0.030294418334960938, -0.02663421630859375, -0.022974014282226562, -0.019313812255859375, -0.015653610229492188, -0.011993408203125, -0.008333206176757812, -0.004673004150390625, -0.0010128021240234375, 0.00264739990234375, 0.0063076019287109375, 0.009967803955078125, 0.013628005981445312, 0.0172882080078125, 0.020948410034179688, 0.024608612060546875, 0.028268814086914062, 0.03192901611328125, 0.03558921813964844, 0.039249420166015625, 0.04290962219238281, 0.04656982421875, 0.05023002624511719, 0.053890228271484375, 0.05755043029785156, 0.06121063232421875, 0.06487083435058594, 0.06853103637695312, 0.07219123840332031, 0.0758514404296875, 0.07951164245605469, 0.08317184448242188, 0.08683204650878906, 0.09049224853515625, 0.09415245056152344, 0.09781265258789062, 0.10147285461425781, 0.105133056640625, 0.10879325866699219, 0.11245346069335938, 0.11611366271972656, 0.11977386474609375, 0.12343406677246094, 0.12709426879882812, 0.1307544708251953, 0.1344146728515625, 0.1380748748779297, 0.14173507690429688, 0.14539527893066406, 0.14905548095703125, 0.15271568298339844, 0.15637588500976562, 0.1600360870361328, 0.1636962890625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [514.0, 490.0, 17.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4438745975494385, 0.05692780017852783, 1.5577301979064941, 3.058532476425171, 4.559334754943848, 6.060137748718262, 7.560939788818359, 9.061742782592773, 10.562544822692871, 12.063346862792969, 13.564149856567383, 15.06495189666748, 16.565753936767578, 18.066556930541992, 19.567359924316406, 21.068161010742188, 22.5689640045166, 24.069766998291016, 25.570568084716797, 27.07137107849121, 28.572174072265625, 30.072975158691406, 31.57377815246582, 33.074581146240234, 34.575382232666016, 36.0761833190918, 37.576988220214844, 39.077789306640625, 40.578590393066406, 42.07939529418945, 43.580196380615234, 45.08100128173828, 46.5817985534668, 48.08259963989258, 49.583404541015625, 51.084205627441406, 52.58500671386719, 54.085811614990234, 55.586612701416016, 57.08741760253906, 58.588218688964844, 60.089019775390625, 61.58982467651367, 63.09062576293945, 64.5914306640625, 66.09223175048828, 67.59303283691406, 69.09383392333984, 70.59463500976562, 72.0954360961914, 73.59623718261719, 75.0970458984375, 76.59784698486328, 78.09864807128906, 79.59944915771484, 81.10025024414062, 82.60105895996094, 84.10186004638672, 85.6026611328125, 87.10346984863281, 88.6042709350586, 90.10507202148438, 91.60587310791016, 93.10667419433594, 94.60747528076172]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 10.0, 12.0, 37.0, 60.0, 93.0, 153.0, 170.0, 183.0, 129.0, 74.0, 45.0, 21.0, 14.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4809374809265137, -1.3477340936660767, -1.2145307064056396, -1.0813273191452026, -0.9481239318847656, -0.8149205446243286, -0.6817171573638916, -0.5485137701034546, -0.4153103828430176, -0.28210699558258057, -0.14890360832214355, -0.015700221061706543, 0.11750316619873047, 0.2507065534591675, 0.3839099407196045, 0.5171133279800415, 0.6503167152404785, 0.7835201025009155, 0.9167234897613525, 1.0499268770217896, 1.1831302642822266, 1.3163336515426636, 1.4495370388031006, 1.5827404260635376, 1.7159438133239746, 1.8491472005844116, 1.9823505878448486, 2.115553855895996, 2.2487573623657227, 2.381960868835449, 2.5151641368865967, 2.648367404937744, 2.7815704345703125, 2.914773941040039, 3.0479772090911865, 3.181180477142334, 3.3143839836120605, 3.447587490081787, 3.5807907581329346, 3.713994026184082, 3.8471975326538086, 3.980401039123535, 4.113604545593262, 4.24680757522583, 4.380011081695557, 4.513214588165283, 4.646417617797852, 4.779621124267578, 4.912824630737305, 5.046028137207031, 5.179231643676758, 5.312434673309326, 5.445638179779053, 5.578841686248779, 5.712044715881348, 5.845248222351074, 5.978451728820801, 6.111655235290527, 6.244858741760254, 6.378061771392822, 6.511265277862549, 6.644468784332275, 6.777671813964844, 6.91087532043457, 7.044078826904297]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 5.0, 16.0, 5.0, 13.0, 24.0, 32.0, 29.0, 43.0, 71.0, 122.0, 1087.0, 53493.0, 988263.0, 4803.0, 239.0, 83.0, 57.0, 35.0, 32.0, 23.0, 23.0, 11.0, 10.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.956634521484375, -1.88201904296875, -1.807403564453125, -1.7327880859375, -1.658172607421875, -1.58355712890625, -1.508941650390625, -1.434326171875, -1.359710693359375, -1.28509521484375, -1.210479736328125, -1.1358642578125, -1.061248779296875, -0.98663330078125, -0.912017822265625, -0.83740234375, -0.762786865234375, -0.68817138671875, -0.613555908203125, -0.5389404296875, -0.464324951171875, -0.38970947265625, -0.315093994140625, -0.240478515625, -0.165863037109375, -0.09124755859375, -0.016632080078125, 0.0579833984375, 0.132598876953125, 0.20721435546875, 0.281829833984375, 0.3564453125, 0.431060791015625, 0.50567626953125, 0.580291748046875, 0.6549072265625, 0.729522705078125, 0.80413818359375, 0.878753662109375, 0.953369140625, 1.027984619140625, 1.10260009765625, 1.177215576171875, 1.2518310546875, 1.326446533203125, 1.40106201171875, 1.475677490234375, 1.55029296875, 1.624908447265625, 1.69952392578125, 1.774139404296875, 1.8487548828125, 1.923370361328125, 1.99798583984375, 2.072601318359375, 2.147216796875, 2.221832275390625, 2.29644775390625, 2.371063232421875, 2.4456787109375, 2.520294189453125, 2.59490966796875, 2.669525146484375, 2.744140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [9.0, 11.0, 33.0, 78.0, 306.0, 366.0, 140.0, 51.0, 16.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174102783203125, -0.014097929000854492, -0.010785579681396484, -0.0074732303619384766, -0.004160881042480469, -0.0008485317230224609, 0.002463817596435547, 0.005776166915893555, 0.009088516235351562, 0.01240086555480957, 0.015713214874267578, 0.019025564193725586, 0.022337913513183594, 0.0256502628326416, 0.02896261215209961, 0.03227496147155762, 0.035587310791015625, 0.03889966011047363, 0.04221200942993164, 0.04552435874938965, 0.048836708068847656, 0.052149057388305664, 0.05546140670776367, 0.05877375602722168, 0.06208610534667969, 0.0653984546661377, 0.0687108039855957, 0.07202315330505371, 0.07533550262451172, 0.07864785194396973, 0.08196020126342773, 0.08527255058288574, 0.08858489990234375, 0.09189724922180176, 0.09520959854125977, 0.09852194786071777, 0.10183429718017578, 0.10514664649963379, 0.1084589958190918, 0.1117713451385498, 0.11508369445800781, 0.11839604377746582, 0.12170839309692383, 0.12502074241638184, 0.12833309173583984, 0.13164544105529785, 0.13495779037475586, 0.13827013969421387, 0.14158248901367188, 0.14489483833312988, 0.1482071876525879, 0.1515195369720459, 0.1548318862915039, 0.15814423561096191, 0.16145658493041992, 0.16476893424987793, 0.16808128356933594, 0.17139363288879395, 0.17470598220825195, 0.17801833152770996, 0.18133068084716797, 0.18464303016662598, 0.18795537948608398, 0.191267728805542, 0.194580078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 11.0, 7.0, 16.0, 24.0, 18.0, 32.0, 41.0, 56.0, 85.0, 277.0, 2156.0, 165451.0, 873323.0, 6267.0, 427.0, 138.0, 53.0, 41.0, 33.0, 27.0, 13.0, 8.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.267578125, -1.2241058349609375, -1.180633544921875, -1.1371612548828125, -1.09368896484375, -1.0502166748046875, -1.006744384765625, -0.9632720947265625, -0.9197998046875, -0.8763275146484375, -0.832855224609375, -0.7893829345703125, -0.74591064453125, -0.7024383544921875, -0.658966064453125, -0.6154937744140625, -0.572021484375, -0.5285491943359375, -0.485076904296875, -0.4416046142578125, -0.39813232421875, -0.3546600341796875, -0.311187744140625, -0.2677154541015625, -0.2242431640625, -0.1807708740234375, -0.137298583984375, -0.0938262939453125, -0.05035400390625, -0.0068817138671875, 0.036590576171875, 0.0800628662109375, 0.12353515625, 0.1670074462890625, 0.210479736328125, 0.2539520263671875, 0.29742431640625, 0.3408966064453125, 0.384368896484375, 0.4278411865234375, 0.4713134765625, 0.5147857666015625, 0.558258056640625, 0.6017303466796875, 0.64520263671875, 0.6886749267578125, 0.732147216796875, 0.7756195068359375, 0.819091796875, 0.8625640869140625, 0.906036376953125, 0.9495086669921875, 0.99298095703125, 1.0364532470703125, 1.079925537109375, 1.1233978271484375, 1.1668701171875, 1.2103424072265625, 1.253814697265625, 1.2972869873046875, 1.34075927734375, 1.3842315673828125, 1.427703857421875, 1.4711761474609375, 1.5146484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 6.0, 10.0, 12.0, 13.0, 9.0, 14.0, 23.0, 23.0, 25.0, 19.0, 26.0, 38.0, 30.0, 40.0, 31.0, 37.0, 49.0, 35.0, 46.0, 38.0, 41.0, 34.0, 36.0, 29.0, 34.0, 41.0, 23.0, 22.0, 25.0, 22.0, 18.0, 21.0, 16.0, 12.0, 10.0, 18.0, 10.0, 7.0, 5.0, 11.0, 8.0, 2.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.0928955078125, -0.08997631072998047, -0.08705711364746094, -0.0841379165649414, -0.08121871948242188, -0.07829952239990234, -0.07538032531738281, -0.07246112823486328, -0.06954193115234375, -0.06662273406982422, -0.06370353698730469, -0.060784339904785156, -0.057865142822265625, -0.054945945739746094, -0.05202674865722656, -0.04910755157470703, -0.0461883544921875, -0.04326915740966797, -0.04034996032714844, -0.037430763244628906, -0.034511566162109375, -0.031592369079589844, -0.028673171997070312, -0.02575397491455078, -0.02283477783203125, -0.01991558074951172, -0.016996383666992188, -0.014077186584472656, -0.011157989501953125, -0.008238792419433594, -0.0053195953369140625, -0.0024003982543945312, 0.000518798828125, 0.0034379959106445312, 0.0063571929931640625, 0.009276390075683594, 0.012195587158203125, 0.015114784240722656, 0.018033981323242188, 0.02095317840576172, 0.02387237548828125, 0.02679157257080078, 0.029710769653320312, 0.032629966735839844, 0.035549163818359375, 0.038468360900878906, 0.04138755798339844, 0.04430675506591797, 0.0472259521484375, 0.05014514923095703, 0.05306434631347656, 0.055983543395996094, 0.058902740478515625, 0.061821937561035156, 0.06474113464355469, 0.06766033172607422, 0.07057952880859375, 0.07349872589111328, 0.07641792297363281, 0.07933712005615234, 0.08225631713867188, 0.0851755142211914, 0.08809471130371094, 0.09101390838623047, 0.09393310546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 2.0, 3.0, 5.0, 8.0, 6.0, 4.0, 3.0, 8.0, 11.0, 10.0, 28.0, 99.0, 386.0, 2859.0, 869744.0, 172523.0, 2301.0, 378.0, 58.0, 23.0, 10.0, 6.0, 5.0, 5.0, 14.0, 5.0, 4.0, 1.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5703125, -1.5226593017578125, -1.475006103515625, -1.4273529052734375, -1.37969970703125, -1.3320465087890625, -1.284393310546875, -1.2367401123046875, -1.1890869140625, -1.1414337158203125, -1.093780517578125, -1.0461273193359375, -0.99847412109375, -0.9508209228515625, -0.903167724609375, -0.8555145263671875, -0.807861328125, -0.7602081298828125, -0.712554931640625, -0.6649017333984375, -0.61724853515625, -0.5695953369140625, -0.521942138671875, -0.4742889404296875, -0.4266357421875, -0.3789825439453125, -0.331329345703125, -0.2836761474609375, -0.23602294921875, -0.1883697509765625, -0.140716552734375, -0.0930633544921875, -0.04541015625, 0.0022430419921875, 0.049896240234375, 0.0975494384765625, 0.14520263671875, 0.1928558349609375, 0.240509033203125, 0.2881622314453125, 0.3358154296875, 0.3834686279296875, 0.431121826171875, 0.4787750244140625, 0.52642822265625, 0.5740814208984375, 0.621734619140625, 0.6693878173828125, 0.717041015625, 0.7646942138671875, 0.812347412109375, 0.8600006103515625, 0.90765380859375, 0.9553070068359375, 1.002960205078125, 1.0506134033203125, 1.0982666015625, 1.1459197998046875, 1.193572998046875, 1.2412261962890625, 1.28887939453125, 1.3365325927734375, 1.384185791015625, 1.4318389892578125, 1.4794921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 6.0, 12.0, 12.0, 14.0, 19.0, 63.0, 161.0, 267.0, 200.0, 83.0, 35.0, 25.0, 20.0, 13.0, 7.0, 7.0, 4.0, 5.0, 8.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84721565246582e-05, -5.6733377277851105e-05, -5.4994598031044006e-05, -5.325581878423691e-05, -5.151703953742981e-05, -4.977826029062271e-05, -4.803948104381561e-05, -4.6300701797008514e-05, -4.4561922550201416e-05, -4.282314330339432e-05, -4.108436405658722e-05, -3.934558480978012e-05, -3.760680556297302e-05, -3.5868026316165924e-05, -3.4129247069358826e-05, -3.239046782255173e-05, -3.065168857574463e-05, -2.891290932893753e-05, -2.7174130082130432e-05, -2.5435350835323334e-05, -2.3696571588516235e-05, -2.1957792341709137e-05, -2.021901309490204e-05, -1.848023384809494e-05, -1.6741454601287842e-05, -1.5002675354480743e-05, -1.3263896107673645e-05, -1.1525116860866547e-05, -9.786337614059448e-06, -8.04755836725235e-06, -6.3087791204452515e-06, -4.569999873638153e-06, -2.8312206268310547e-06, -1.0924413800239563e-06, 6.463378667831421e-07, 2.3851171135902405e-06, 4.123896360397339e-06, 5.862675607204437e-06, 7.601454854011536e-06, 9.340234100818634e-06, 1.1079013347625732e-05, 1.281779259443283e-05, 1.455657184123993e-05, 1.6295351088047028e-05, 1.8034130334854126e-05, 1.9772909581661224e-05, 2.1511688828468323e-05, 2.325046807527542e-05, 2.498924732208252e-05, 2.6728026568889618e-05, 2.8466805815696716e-05, 3.0205585062503815e-05, 3.194436430931091e-05, 3.368314355611801e-05, 3.542192280292511e-05, 3.716070204973221e-05, 3.889948129653931e-05, 4.0638260543346405e-05, 4.2377039790153503e-05, 4.41158190369606e-05, 4.58545982837677e-05, 4.75933775305748e-05, 4.93321567773819e-05, 5.1070936024188995e-05, 5.2809715270996094e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 8.0, 10.0, 14.0, 25.0, 48.0, 91.0, 115.0, 241.0, 457.0, 940.0, 2147.0, 5905.0, 25735.0, 960741.0, 39019.0, 7804.0, 2934.0, 1173.0, 529.0, 263.0, 133.0, 85.0, 44.0, 36.0, 20.0, 14.0, 8.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.15234375, -1.120849609375, -1.08935546875, -1.057861328125, -1.0263671875, -0.994873046875, -0.96337890625, -0.931884765625, -0.900390625, -0.868896484375, -0.83740234375, -0.805908203125, -0.7744140625, -0.742919921875, -0.71142578125, -0.679931640625, -0.6484375, -0.616943359375, -0.58544921875, -0.553955078125, -0.5224609375, -0.490966796875, -0.45947265625, -0.427978515625, -0.396484375, -0.364990234375, -0.33349609375, -0.302001953125, -0.2705078125, -0.239013671875, -0.20751953125, -0.176025390625, -0.14453125, -0.113037109375, -0.08154296875, -0.050048828125, -0.0185546875, 0.012939453125, 0.04443359375, 0.075927734375, 0.107421875, 0.138916015625, 0.17041015625, 0.201904296875, 0.2333984375, 0.264892578125, 0.29638671875, 0.327880859375, 0.359375, 0.390869140625, 0.42236328125, 0.453857421875, 0.4853515625, 0.516845703125, 0.54833984375, 0.579833984375, 0.611328125, 0.642822265625, 0.67431640625, 0.705810546875, 0.7373046875, 0.768798828125, 0.80029296875, 0.831787109375, 0.86328125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 7.0, 6.0, 18.0, 27.0, 101.0, 628.0, 121.0, 25.0, 4.0, 11.0, 6.0, 4.0, 3.0, 3.0, 7.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40576171875, -0.39101409912109375, -0.3762664794921875, -0.36151885986328125, -0.346771240234375, -0.33202362060546875, -0.3172760009765625, -0.30252838134765625, -0.28778076171875, -0.27303314208984375, -0.2582855224609375, -0.24353790283203125, -0.228790283203125, -0.21404266357421875, -0.1992950439453125, -0.18454742431640625, -0.1697998046875, -0.15505218505859375, -0.1403045654296875, -0.12555694580078125, -0.110809326171875, -0.09606170654296875, -0.0813140869140625, -0.06656646728515625, -0.05181884765625, -0.03707122802734375, -0.0223236083984375, -0.00757598876953125, 0.007171630859375, 0.02191925048828125, 0.0366668701171875, 0.05141448974609375, 0.066162109375, 0.08090972900390625, 0.0956573486328125, 0.11040496826171875, 0.125152587890625, 0.13990020751953125, 0.1546478271484375, 0.16939544677734375, 0.18414306640625, 0.19889068603515625, 0.2136383056640625, 0.22838592529296875, 0.243133544921875, 0.25788116455078125, 0.2726287841796875, 0.28737640380859375, 0.3021240234375, 0.31687164306640625, 0.3316192626953125, 0.34636688232421875, 0.361114501953125, 0.37586212158203125, 0.3906097412109375, 0.40535736083984375, 0.42010498046875, 0.43485260009765625, 0.4496002197265625, 0.46434783935546875, 0.479095458984375, 0.49384307861328125, 0.5085906982421875, 0.5233383178710938, 0.5380859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 15.0, 190.0, 688.0, 102.0, 15.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.036210060119629, -12.771994590759277, -12.50777816772461, -12.243562698364258, -11.979347229003906, -11.715131759643555, -11.450915336608887, -11.186699867248535, -10.922483444213867, -10.658267974853516, -10.394051551818848, -10.129836082458496, -9.865620613098145, -9.601404190063477, -9.337188720703125, -9.072973251342773, -8.808757781982422, -8.54454231262207, -8.280325889587402, -8.01611042022705, -7.751894950866699, -7.4876790046691895, -7.22346305847168, -6.959247589111328, -6.695031642913818, -6.430815696716309, -6.166600227355957, -5.902384281158447, -5.6381683349609375, -5.373952865600586, -5.109736919403076, -4.845520973205566, -4.581305503845215, -4.317089557647705, -4.0528740882873535, -3.7886581420898438, -3.524442434310913, -3.2602267265319824, -2.9960107803344727, -2.731795072555542, -2.4675791263580322, -2.2033634185791016, -1.9391475915908813, -1.6749317646026611, -1.4107160568237305, -1.1465003490447998, -0.8822845220565796, -0.6180686950683594, -0.3538529872894287, -0.08963721990585327, 0.17457854747772217, 0.4387943148612976, 0.703010082244873, 0.9672257900238037, 1.231441617012024, 1.4956574440002441, 1.7598731517791748, 2.0240888595581055, 2.2883048057556152, 2.552520513534546, 2.8167362213134766, 3.0809519290924072, 3.345167636871338, 3.6093835830688477, 3.8735992908477783]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 13.0, 13.0, 21.0, 40.0, 64.0, 105.0, 134.0, 155.0, 120.0, 131.0, 76.0, 58.0, 33.0, 15.0, 12.0, 6.0, 6.0, 3.0, 2.0, 2.0], "bins": [-3.283161163330078, -3.2172725200653076, -3.151383876800537, -3.0854949951171875, -3.019606351852417, -2.9537177085876465, -2.887829065322876, -2.8219404220581055, -2.756051540374756, -2.6901628971099854, -2.624274253845215, -2.5583853721618652, -2.4924967288970947, -2.426608085632324, -2.3607194423675537, -2.294830799102783, -2.2289421558380127, -2.163053512573242, -2.0971648693084717, -2.031275987625122, -1.9653873443603516, -1.899498701095581, -1.8336100578308105, -1.76772141456604, -1.70183265209198, -1.6359440088272095, -1.5700552463531494, -1.504166603088379, -1.4382779598236084, -1.3723891973495483, -1.3065005540847778, -1.2406117916107178, -1.1747229099273682, -1.1088342666625977, -1.0429455041885376, -0.9770568609237671, -0.9111681580543518, -0.8452794551849365, -0.779390811920166, -0.7135021090507507, -0.6476134657859802, -0.5817247629165649, -0.5158361196517944, -0.44994741678237915, -0.38405871391296387, -0.3181700110435486, -0.2522813379764557, -0.1863926649093628, -0.12050396203994751, -0.05461527407169342, 0.011273413896560669, 0.07716210186481476, 0.14305078983306885, 0.20893949270248413, 0.274828165769577, 0.3407168388366699, 0.4066055417060852, 0.4724942445755005, 0.538382887840271, 0.6042715907096863, 0.6701602935791016, 0.7360489964485168, 0.8019376993179321, 0.8678263425827026, 0.9337150454521179]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 4.0, 2.0, 4.0, 8.0, 8.0, 16.0, 12.0, 18.0, 14.0, 18.0, 22.0, 20.0, 36.0, 270.0, 4188856.0, 4548.0, 199.0, 51.0, 30.0, 26.0, 24.0, 20.0, 10.0, 22.0, 4.0, 4.0, 8.0, 2.0, 0.0, 0.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.3359375, -13.7811279296875, -13.226318359375, -12.6715087890625, -12.11669921875, -11.5618896484375, -11.007080078125, -10.4522705078125, -9.8974609375, -9.3426513671875, -8.787841796875, -8.2330322265625, -7.67822265625, -7.1234130859375, -6.568603515625, -6.0137939453125, -5.458984375, -4.9041748046875, -4.349365234375, -3.7945556640625, -3.23974609375, -2.6849365234375, -2.130126953125, -1.5753173828125, -1.0205078125, -0.4656982421875, 0.089111328125, 0.6439208984375, 1.19873046875, 1.7535400390625, 2.308349609375, 2.8631591796875, 3.41796875, 3.9727783203125, 4.527587890625, 5.0823974609375, 5.63720703125, 6.1920166015625, 6.746826171875, 7.3016357421875, 7.8564453125, 8.4112548828125, 8.966064453125, 9.5208740234375, 10.07568359375, 10.6304931640625, 11.185302734375, 11.7401123046875, 12.294921875, 12.8497314453125, 13.404541015625, 13.9593505859375, 14.51416015625, 15.0689697265625, 15.623779296875, 16.1785888671875, 16.7333984375, 17.2882080078125, 17.843017578125, 18.3978271484375, 18.95263671875, 19.5074462890625, 20.062255859375, 20.6170654296875, 21.171875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 13.0, 9.0, 26.0, 40.0, 60.0, 76.0, 123.0, 139.0, 131.0, 115.0, 66.0, 46.0, 50.0, 35.0, 21.0, 8.0, 18.0, 4.0, 5.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0194091796875, -0.018276691436767578, -0.017144203186035156, -0.016011714935302734, -0.014879226684570312, -0.01374673843383789, -0.012614250183105469, -0.011481761932373047, -0.010349273681640625, -0.009216785430908203, -0.008084297180175781, -0.006951808929443359, -0.0058193206787109375, -0.004686832427978516, -0.0035543441772460938, -0.002421855926513672, -0.00128936767578125, -0.00015687942504882812, 0.0009756088256835938, 0.0021080970764160156, 0.0032405853271484375, 0.004373073577880859, 0.005505561828613281, 0.006638050079345703, 0.007770538330078125, 0.008903026580810547, 0.010035514831542969, 0.01116800308227539, 0.012300491333007812, 0.013432979583740234, 0.014565467834472656, 0.015697956085205078, 0.0168304443359375, 0.017962932586669922, 0.019095420837402344, 0.020227909088134766, 0.021360397338867188, 0.02249288558959961, 0.02362537384033203, 0.024757862091064453, 0.025890350341796875, 0.027022838592529297, 0.02815532684326172, 0.02928781509399414, 0.030420303344726562, 0.031552791595458984, 0.032685279846191406, 0.03381776809692383, 0.03495025634765625, 0.03608274459838867, 0.037215232849121094, 0.038347721099853516, 0.03948020935058594, 0.04061269760131836, 0.04174518585205078, 0.0428776741027832, 0.044010162353515625, 0.04514265060424805, 0.04627513885498047, 0.04740762710571289, 0.04854011535644531, 0.049672603607177734, 0.050805091857910156, 0.05193758010864258, 0.053070068359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 46.0, 331.0, 4193557.0, 326.0, 23.0, 10.0], "bins": [-54.25, -53.354339599609375, -52.45867919921875, -51.563018798828125, -50.6673583984375, -49.771697998046875, -48.87603759765625, -47.980377197265625, -47.084716796875, -46.189056396484375, -45.29339599609375, -44.397735595703125, -43.5020751953125, -42.606414794921875, -41.71075439453125, -40.815093994140625, -39.91943359375, -39.023773193359375, -38.12811279296875, -37.232452392578125, -36.3367919921875, -35.441131591796875, -34.54547119140625, -33.649810791015625, -32.754150390625, -31.858489990234375, -30.96282958984375, -30.067169189453125, -29.1715087890625, -28.275848388671875, -27.38018798828125, -26.484527587890625, -25.5888671875, -24.693206787109375, -23.79754638671875, -22.901885986328125, -22.0062255859375, -21.110565185546875, -20.21490478515625, -19.319244384765625, -18.423583984375, -17.527923583984375, -16.63226318359375, -15.736602783203125, -14.8409423828125, -13.945281982421875, -13.04962158203125, -12.153961181640625, -11.25830078125, -10.362640380859375, -9.46697998046875, -8.571319580078125, -7.6756591796875, -6.779998779296875, -5.88433837890625, -4.988677978515625, -4.093017578125, -3.197357177734375, -2.30169677734375, -1.406036376953125, -0.5103759765625, 0.385284423828125, 1.28094482421875, 2.176605224609375, 3.072265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 12.0, 9.0, 26.0, 45.0, 56.0, 141.0, 531.0, 2741.0, 276.0, 99.0, 53.0, 36.0, 14.0, 12.0, 12.0, 8.0, 3.0, 2.0, 3.0, 3.0], "bins": [-0.2396240234375, -0.23496341705322266, -0.2303028106689453, -0.22564220428466797, -0.22098159790039062, -0.21632099151611328, -0.21166038513183594, -0.2069997787475586, -0.20233917236328125, -0.1976785659790039, -0.19301795959472656, -0.18835735321044922, -0.18369674682617188, -0.17903614044189453, -0.1743755340576172, -0.16971492767333984, -0.1650543212890625, -0.16039371490478516, -0.1557331085205078, -0.15107250213623047, -0.14641189575195312, -0.14175128936767578, -0.13709068298339844, -0.1324300765991211, -0.12776947021484375, -0.1231088638305664, -0.11844825744628906, -0.11378765106201172, -0.10912704467773438, -0.10446643829345703, -0.09980583190917969, -0.09514522552490234, -0.090484619140625, -0.08582401275634766, -0.08116340637207031, -0.07650279998779297, -0.07184219360351562, -0.06718158721923828, -0.06252098083496094, -0.057860374450683594, -0.05319976806640625, -0.048539161682128906, -0.04387855529785156, -0.03921794891357422, -0.034557342529296875, -0.02989673614501953, -0.025236129760742188, -0.020575523376464844, -0.0159149169921875, -0.011254310607910156, -0.0065937042236328125, -0.0019330978393554688, 0.002727508544921875, 0.007388114929199219, 0.012048721313476562, 0.016709327697753906, 0.02136993408203125, 0.026030540466308594, 0.030691146850585938, 0.03535175323486328, 0.040012359619140625, 0.04467296600341797, 0.04933357238769531, 0.053994178771972656, 0.05865478515625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1021.0], "bins": [-132.24578857421875, -130.16552734375, -128.0852508544922, -126.0049819946289, -123.92471313476562, -121.84444427490234, -119.76417541503906, -117.68390655517578, -115.6036376953125, -113.52336883544922, -111.44309997558594, -109.36283111572266, -107.28256225585938, -105.2022933959961, -103.12202453613281, -101.04175567626953, -98.96148681640625, -96.88121795654297, -94.80094909667969, -92.7206802368164, -90.64041137695312, -88.56014251708984, -86.47987365722656, -84.39960479736328, -82.3193359375, -80.23906707763672, -78.15879821777344, -76.07852935791016, -73.99826049804688, -71.9179916381836, -69.83772277832031, -67.75745391845703, -65.67717742919922, -63.59690856933594, -61.516639709472656, -59.436370849609375, -57.356101989746094, -55.27583312988281, -53.19556427001953, -51.11529541015625, -49.035030364990234, -46.95476150512695, -44.87449264526367, -42.79422378540039, -40.71395492553711, -38.63368606567383, -36.55341720581055, -34.473148345947266, -32.392879486083984, -30.312610626220703, -28.232341766357422, -26.15207290649414, -24.07180404663086, -21.991535186767578, -19.911266326904297, -17.830997467041016, -15.750727653503418, -13.670458793640137, -11.590189933776855, -9.509921073913574, -7.429652214050293, -5.349383354187012, -3.2691144943237305, -1.1888456344604492, 0.8914236426353455]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 15.0, 46.0, 93.0, 167.0, 236.0, 199.0, 137.0, 62.0, 37.0, 8.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.031057834625244, -4.929389953613281, -4.827722072601318, -4.7260541915893555, -4.624386310577393, -4.52271842956543, -4.421050548553467, -4.319382667541504, -4.217714786529541, -4.116046905517578, -4.014379024505615, -3.9127111434936523, -3.8110432624816895, -3.7093753814697266, -3.6077075004577637, -3.506039619445801, -3.404371738433838, -3.302703857421875, -3.201035976409912, -3.099368095397949, -2.9977002143859863, -2.8960323333740234, -2.7943644523620605, -2.6926965713500977, -2.5910284519195557, -2.4893605709075928, -2.38769268989563, -2.286024808883667, -2.184356927871704, -2.082689046859741, -1.9810211658477783, -1.8793532848358154, -1.7776854038238525, -1.6760175228118896, -1.5743496417999268, -1.4726817607879639, -1.371013879776001, -1.269345998764038, -1.1676781177520752, -1.0660102367401123, -0.9643422961235046, -0.8626744151115417, -0.7610065340995789, -0.6593385934829712, -0.5576707124710083, -0.4560028314590454, -0.3543349504470825, -0.25266706943511963, -0.15099918842315674, -0.04933129996061325, 0.05233658850193024, 0.15400448441505432, 0.2556723654270172, 0.3573402762413025, 0.4590081572532654, 0.5606760382652283, 0.6623439192771912, 0.764011800289154, 0.8656796813011169, 0.9673476219177246, 1.0690155029296875, 1.1706833839416504, 1.2723512649536133, 1.3740191459655762, 1.475687026977539]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 7.0, 5.0, 3.0, 4.0, 6.0, 8.0, 11.0, 8.0, 11.0, 21.0, 21.0, 19.0, 21.0, 30.0, 24.0, 35.0, 44.0, 29.0, 48.0, 66.0, 298.0, 61881.0, 983334.0, 2141.0, 105.0, 52.0, 48.0, 32.0, 27.0, 31.0, 23.0, 25.0, 21.0, 11.0, 22.0, 18.0, 10.0, 10.0, 6.0, 11.0, 8.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.55255126953125, -4.4019775390625, -4.25140380859375, -4.100830078125, -3.95025634765625, -3.7996826171875, -3.64910888671875, -3.49853515625, -3.34796142578125, -3.1973876953125, -3.04681396484375, -2.896240234375, -2.74566650390625, -2.5950927734375, -2.44451904296875, -2.2939453125, -2.14337158203125, -1.9927978515625, -1.84222412109375, -1.691650390625, -1.54107666015625, -1.3905029296875, -1.23992919921875, -1.08935546875, -0.93878173828125, -0.7882080078125, -0.63763427734375, -0.487060546875, -0.33648681640625, -0.1859130859375, -0.03533935546875, 0.115234375, 0.26580810546875, 0.4163818359375, 0.56695556640625, 0.717529296875, 0.86810302734375, 1.0186767578125, 1.16925048828125, 1.31982421875, 1.47039794921875, 1.6209716796875, 1.77154541015625, 1.922119140625, 2.07269287109375, 2.2232666015625, 2.37384033203125, 2.5244140625, 2.67498779296875, 2.8255615234375, 2.97613525390625, 3.126708984375, 3.27728271484375, 3.4278564453125, 3.57843017578125, 3.72900390625, 3.87957763671875, 4.0301513671875, 4.18072509765625, 4.331298828125, 4.48187255859375, 4.6324462890625, 4.78302001953125, 4.93359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 28.0, 78.0, 150.0, 244.0, 252.0, 143.0, 79.0, 29.0, 10.0], "bins": [-0.6240234375, -0.6134324073791504, -0.6028413772583008, -0.5922503471374512, -0.5816593170166016, -0.571068286895752, -0.5604772567749023, -0.5498862266540527, -0.5392951965332031, -0.5287041664123535, -0.5181131362915039, -0.5075221061706543, -0.4969310760498047, -0.4863400459289551, -0.47574901580810547, -0.46515798568725586, -0.45456695556640625, -0.44397592544555664, -0.43338489532470703, -0.4227938652038574, -0.4122028350830078, -0.4016118049621582, -0.3910207748413086, -0.380429744720459, -0.3698387145996094, -0.35924768447875977, -0.34865665435791016, -0.33806562423706055, -0.32747459411621094, -0.31688356399536133, -0.3062925338745117, -0.2957015037536621, -0.2851104736328125, -0.2745194435119629, -0.2639284133911133, -0.25333738327026367, -0.24274635314941406, -0.23215532302856445, -0.22156429290771484, -0.21097326278686523, -0.20038223266601562, -0.18979120254516602, -0.1792001724243164, -0.1686091423034668, -0.1580181121826172, -0.14742708206176758, -0.13683605194091797, -0.12624502182006836, -0.11565399169921875, -0.10506296157836914, -0.09447193145751953, -0.08388090133666992, -0.07328987121582031, -0.0626988410949707, -0.052107810974121094, -0.041516780853271484, -0.030925750732421875, -0.020334720611572266, -0.009743690490722656, 0.0008473396301269531, 0.011438369750976562, 0.022029399871826172, 0.03262042999267578, 0.04321146011352539, 0.053802490234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 1.0, 7.0, 8.0, 4.0, 16.0, 17.0, 12.0, 20.0, 30.0, 30.0, 49.0, 65.0, 119.0, 181.0, 691.0, 4488.0, 126394.0, 892785.0, 21109.0, 1624.0, 380.0, 161.0, 77.0, 61.0, 46.0, 37.0, 31.0, 22.0, 21.0, 15.0, 6.0, 10.0, 11.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.466796875, -3.348358154296875, -3.22991943359375, -3.111480712890625, -2.9930419921875, -2.874603271484375, -2.75616455078125, -2.637725830078125, -2.519287109375, -2.400848388671875, -2.28240966796875, -2.163970947265625, -2.0455322265625, -1.927093505859375, -1.80865478515625, -1.690216064453125, -1.57177734375, -1.453338623046875, -1.33489990234375, -1.216461181640625, -1.0980224609375, -0.979583740234375, -0.86114501953125, -0.742706298828125, -0.624267578125, -0.505828857421875, -0.38739013671875, -0.268951416015625, -0.1505126953125, -0.032073974609375, 0.08636474609375, 0.204803466796875, 0.3232421875, 0.441680908203125, 0.56011962890625, 0.678558349609375, 0.7969970703125, 0.915435791015625, 1.03387451171875, 1.152313232421875, 1.270751953125, 1.389190673828125, 1.50762939453125, 1.626068115234375, 1.7445068359375, 1.862945556640625, 1.98138427734375, 2.099822998046875, 2.21826171875, 2.336700439453125, 2.45513916015625, 2.573577880859375, 2.6920166015625, 2.810455322265625, 2.92889404296875, 3.047332763671875, 3.165771484375, 3.284210205078125, 3.40264892578125, 3.521087646484375, 3.6395263671875, 3.757965087890625, 3.87640380859375, 3.994842529296875, 4.11328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 2.0, 6.0, 12.0, 9.0, 11.0, 18.0, 18.0, 19.0, 26.0, 37.0, 38.0, 58.0, 41.0, 63.0, 53.0, 57.0, 56.0, 60.0, 54.0, 50.0, 46.0, 39.0, 33.0, 44.0, 28.0, 28.0, 19.0, 17.0, 6.0, 10.0, 10.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.72021484375, -0.6970443725585938, -0.6738739013671875, -0.6507034301757812, -0.627532958984375, -0.6043624877929688, -0.5811920166015625, -0.5580215454101562, -0.53485107421875, -0.5116806030273438, -0.4885101318359375, -0.46533966064453125, -0.442169189453125, -0.41899871826171875, -0.3958282470703125, -0.37265777587890625, -0.3494873046875, -0.32631683349609375, -0.3031463623046875, -0.27997589111328125, -0.256805419921875, -0.23363494873046875, -0.2104644775390625, -0.18729400634765625, -0.16412353515625, -0.14095306396484375, -0.1177825927734375, -0.09461212158203125, -0.071441650390625, -0.04827117919921875, -0.0251007080078125, -0.00193023681640625, 0.021240234375, 0.04441070556640625, 0.0675811767578125, 0.09075164794921875, 0.113922119140625, 0.13709259033203125, 0.1602630615234375, 0.18343353271484375, 0.20660400390625, 0.22977447509765625, 0.2529449462890625, 0.27611541748046875, 0.299285888671875, 0.32245635986328125, 0.3456268310546875, 0.36879730224609375, 0.3919677734375, 0.41513824462890625, 0.4383087158203125, 0.46147918701171875, 0.484649658203125, 0.5078201293945312, 0.5309906005859375, 0.5541610717773438, 0.57733154296875, 0.6005020141601562, 0.6236724853515625, 0.6468429565429688, 0.670013427734375, 0.6931838989257812, 0.7163543701171875, 0.7395248413085938, 0.7626953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 7.0, 6.0, 7.0, 17.0, 25.0, 35.0, 36.0, 69.0, 114.0, 235.0, 504.0, 1320.0, 3991.0, 18069.0, 156447.0, 776663.0, 75124.0, 11199.0, 2832.0, 974.0, 406.0, 201.0, 78.0, 70.0, 32.0, 26.0, 20.0, 15.0, 4.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.056640625, -2.0015869140625, -1.946533203125, -1.8914794921875, -1.83642578125, -1.7813720703125, -1.726318359375, -1.6712646484375, -1.6162109375, -1.5611572265625, -1.506103515625, -1.4510498046875, -1.39599609375, -1.3409423828125, -1.285888671875, -1.2308349609375, -1.17578125, -1.1207275390625, -1.065673828125, -1.0106201171875, -0.95556640625, -0.9005126953125, -0.845458984375, -0.7904052734375, -0.7353515625, -0.6802978515625, -0.625244140625, -0.5701904296875, -0.51513671875, -0.4600830078125, -0.405029296875, -0.3499755859375, -0.294921875, -0.2398681640625, -0.184814453125, -0.1297607421875, -0.07470703125, -0.0196533203125, 0.035400390625, 0.0904541015625, 0.1455078125, 0.2005615234375, 0.255615234375, 0.3106689453125, 0.36572265625, 0.4207763671875, 0.475830078125, 0.5308837890625, 0.5859375, 0.6409912109375, 0.696044921875, 0.7510986328125, 0.80615234375, 0.8612060546875, 0.916259765625, 0.9713134765625, 1.0263671875, 1.0814208984375, 1.136474609375, 1.1915283203125, 1.24658203125, 1.3016357421875, 1.356689453125, 1.4117431640625, 1.466796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 10.0, 7.0, 15.0, 17.0, 21.0, 34.0, 60.0, 95.0, 141.0, 206.0, 146.0, 92.0, 62.0, 31.0, 13.0, 16.0, 7.0, 6.0, 4.0, 8.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017368793487548828, -0.0001675877720117569, -0.0001614876091480255, -0.00015538744628429413, -0.00014928728342056274, -0.00014318712055683136, -0.00013708695769309998, -0.0001309867948293686, -0.0001248866319656372, -0.00011878646910190582, -0.00011268630623817444, -0.00010658614337444305, -0.00010048598051071167, -9.438581764698029e-05, -8.82856547832489e-05, -8.218549191951752e-05, -7.608532905578613e-05, -6.998516619205475e-05, -6.388500332832336e-05, -5.778484046459198e-05, -5.1684677600860596e-05, -4.558451473712921e-05, -3.948435187339783e-05, -3.338418900966644e-05, -2.728402614593506e-05, -2.1183863282203674e-05, -1.508370041847229e-05, -8.983537554740906e-06, -2.8833746910095215e-06, 3.216788172721863e-06, 9.316951036453247e-06, 1.541711390018463e-05, 2.1517276763916016e-05, 2.76174396276474e-05, 3.3717602491378784e-05, 3.981776535511017e-05, 4.591792821884155e-05, 5.201809108257294e-05, 5.811825394630432e-05, 6.42184168100357e-05, 7.031857967376709e-05, 7.641874253749847e-05, 8.251890540122986e-05, 8.861906826496124e-05, 9.471923112869263e-05, 0.00010081939399242401, 0.0001069195568561554, 0.00011301971971988678, 0.00011911988258361816, 0.00012522004544734955, 0.00013132020831108093, 0.00013742037117481232, 0.0001435205340385437, 0.00014962069690227509, 0.00015572085976600647, 0.00016182102262973785, 0.00016792118549346924, 0.00017402134835720062, 0.000180121511220932, 0.0001862216740846634, 0.00019232183694839478, 0.00019842199981212616, 0.00020452216267585754, 0.00021062232553958893, 0.0002167224884033203]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 3.0, 6.0, 19.0, 17.0, 27.0, 31.0, 42.0, 68.0, 133.0, 418.0, 2065.0, 22534.0, 834247.0, 180401.0, 6997.0, 973.0, 253.0, 128.0, 54.0, 33.0, 17.0, 20.0, 19.0, 14.0, 2.0, 10.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.76953125, -1.700897216796875, -1.63226318359375, -1.563629150390625, -1.4949951171875, -1.426361083984375, -1.35772705078125, -1.289093017578125, -1.220458984375, -1.151824951171875, -1.08319091796875, -1.014556884765625, -0.9459228515625, -0.877288818359375, -0.80865478515625, -0.740020751953125, -0.67138671875, -0.602752685546875, -0.53411865234375, -0.465484619140625, -0.3968505859375, -0.328216552734375, -0.25958251953125, -0.190948486328125, -0.122314453125, -0.053680419921875, 0.01495361328125, 0.083587646484375, 0.1522216796875, 0.220855712890625, 0.28948974609375, 0.358123779296875, 0.4267578125, 0.495391845703125, 0.56402587890625, 0.632659912109375, 0.7012939453125, 0.769927978515625, 0.83856201171875, 0.907196044921875, 0.975830078125, 1.044464111328125, 1.11309814453125, 1.181732177734375, 1.2503662109375, 1.319000244140625, 1.38763427734375, 1.456268310546875, 1.52490234375, 1.593536376953125, 1.66217041015625, 1.730804443359375, 1.7994384765625, 1.868072509765625, 1.93670654296875, 2.005340576171875, 2.073974609375, 2.142608642578125, 2.21124267578125, 2.279876708984375, 2.3485107421875, 2.417144775390625, 2.48577880859375, 2.554412841796875, 2.623046875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 6.0, 5.0, 6.0, 7.0, 16.0, 11.0, 18.0, 25.0, 30.0, 46.0, 61.0, 68.0, 77.0, 109.0, 99.0, 97.0, 67.0, 51.0, 49.0, 31.0, 33.0, 16.0, 13.0, 17.0, 8.0, 5.0, 5.0, 2.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416259765625, -0.3995018005371094, -0.38274383544921875, -0.3659858703613281, -0.3492279052734375, -0.3324699401855469, -0.31571197509765625, -0.2989540100097656, -0.282196044921875, -0.2654380798339844, -0.24868011474609375, -0.23192214965820312, -0.2151641845703125, -0.19840621948242188, -0.18164825439453125, -0.16489028930664062, -0.14813232421875, -0.13137435913085938, -0.11461639404296875, -0.09785842895507812, -0.0811004638671875, -0.06434249877929688, -0.04758453369140625, -0.030826568603515625, -0.014068603515625, 0.002689361572265625, 0.01944732666015625, 0.036205291748046875, 0.0529632568359375, 0.06972122192382812, 0.08647918701171875, 0.10323715209960938, 0.1199951171875, 0.13675308227539062, 0.15351104736328125, 0.17026901245117188, 0.1870269775390625, 0.20378494262695312, 0.22054290771484375, 0.23730087280273438, 0.254058837890625, 0.2708168029785156, 0.28757476806640625, 0.3043327331542969, 0.3210906982421875, 0.3378486633300781, 0.35460662841796875, 0.3713645935058594, 0.38812255859375, 0.4048805236816406, 0.42163848876953125, 0.4383964538574219, 0.4551544189453125, 0.4719123840332031, 0.48867034912109375, 0.5054283142089844, 0.522186279296875, 0.5389442443847656, 0.5557022094726562, 0.5724601745605469, 0.5892181396484375, 0.6059761047363281, 0.6227340698242188, 0.6394920349121094, 0.65625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 396.0, 582.0, 27.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.49568176269531, -69.32637023925781, -67.15706634521484, -64.98775482177734, -62.818450927734375, -60.649139404296875, -58.47983169555664, -56.310523986816406, -54.14121627807617, -51.97190856933594, -49.8026008605957, -47.63329315185547, -45.46398162841797, -43.294677734375, -41.1253662109375, -38.956058502197266, -36.78675079345703, -34.6174430847168, -32.44813537597656, -30.278825759887695, -28.10951805114746, -25.940210342407227, -23.77090072631836, -21.601593017578125, -19.43228530883789, -17.262977600097656, -15.093668937683105, -12.924360275268555, -10.75505256652832, -8.585744857788086, -6.416436195373535, -4.247127532958984, -2.0778274536132812, 0.09148073196411133, 2.260788917541504, 4.4300971031188965, 6.599405288696289, 8.768712997436523, 10.938021659851074, 13.107330322265625, 15.27663803100586, 17.445945739746094, 19.615253448486328, 21.784563064575195, 23.95387077331543, 26.123178482055664, 28.29248809814453, 30.461795806884766, 32.631103515625, 34.800411224365234, 36.96971893310547, 39.1390266418457, 41.30833435058594, 43.47764587402344, 45.64695358276367, 47.816261291503906, 49.98556900024414, 52.154876708984375, 54.32418441772461, 56.493492126464844, 58.662803649902344, 60.83210754394531, 63.00141906738281, 65.17073059082031, 67.34003448486328]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 16.0, 21.0, 42.0, 41.0, 45.0, 68.0, 67.0, 95.0, 78.0, 100.0, 82.0, 65.0, 67.0, 55.0, 37.0, 32.0, 27.0, 14.0, 21.0, 12.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.127429962158203, -8.884913444519043, -8.642395973205566, -8.399879455566406, -8.15736198425293, -7.9148454666137695, -7.672328472137451, -7.429811477661133, -7.1872944831848145, -6.944777488708496, -6.702260494232178, -6.459743499755859, -6.217226982116699, -5.974709987640381, -5.7321929931640625, -5.489675998687744, -5.247159004211426, -5.004642009735107, -4.762125015258789, -4.519608497619629, -4.2770915031433105, -4.034574508666992, -3.792057514190674, -3.5495405197143555, -3.3070240020751953, -3.064507007598877, -2.8219902515411377, -2.5794732570648193, -2.336956262588501, -2.0944395065307617, -1.8519225120544434, -1.609405517578125, -1.3668885231018066, -1.1243716478347778, -0.8818546533584595, -0.6393377780914307, -0.3968208432197571, -0.1543039083480835, 0.08821296691894531, 0.33072996139526367, 0.5732468366622925, 0.8157637715339661, 1.0582807064056396, 1.3007975816726685, 1.5433144569396973, 1.7858314514160156, 2.028348445892334, 2.2708654403686523, 2.5133821964263916, 2.75589919090271, 2.998415946960449, 3.2409329414367676, 3.483449935913086, 3.7259669303894043, 3.9684836864471436, 4.211000442504883, 4.453517436981201, 4.6960344314575195, 4.938551425933838, 5.181068420410156, 5.423584938049316, 5.666101932525635, 5.908618927001953, 6.1511359214782715, 6.39365291595459]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 14.0, 21.0, 80.0, 258.0, 967.0, 4178762.0, 13358.0, 474.0, 200.0, 73.0, 39.0, 17.0, 6.0, 8.0, 10.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.90625, -34.144775390625, -33.38330078125, -32.621826171875, -31.8603515625, -31.098876953125, -30.33740234375, -29.575927734375, -28.814453125, -28.052978515625, -27.29150390625, -26.530029296875, -25.7685546875, -25.007080078125, -24.24560546875, -23.484130859375, -22.72265625, -21.961181640625, -21.19970703125, -20.438232421875, -19.6767578125, -18.915283203125, -18.15380859375, -17.392333984375, -16.630859375, -15.869384765625, -15.10791015625, -14.346435546875, -13.5849609375, -12.823486328125, -12.06201171875, -11.300537109375, -10.5390625, -9.777587890625, -9.01611328125, -8.254638671875, -7.4931640625, -6.731689453125, -5.97021484375, -5.208740234375, -4.447265625, -3.685791015625, -2.92431640625, -2.162841796875, -1.4013671875, -0.639892578125, 0.12158203125, 0.883056640625, 1.64453125, 2.406005859375, 3.16748046875, 3.928955078125, 4.6904296875, 5.451904296875, 6.21337890625, 6.974853515625, 7.736328125, 8.497802734375, 9.25927734375, 10.020751953125, 10.7822265625, 11.543701171875, 12.30517578125, 13.066650390625, 13.828125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 15.0, 40.0, 109.0, 168.0, 243.0, 197.0, 124.0, 71.0, 33.0, 8.0, 5.0, 0.0, 3.0], "bins": [-0.7265625, -0.7135190963745117, -0.7004756927490234, -0.6874322891235352, -0.6743888854980469, -0.6613454818725586, -0.6483020782470703, -0.635258674621582, -0.6222152709960938, -0.6091718673706055, -0.5961284637451172, -0.5830850601196289, -0.5700416564941406, -0.5569982528686523, -0.5439548492431641, -0.5309114456176758, -0.5178680419921875, -0.5048246383666992, -0.49178123474121094, -0.47873783111572266, -0.4656944274902344, -0.4526510238647461, -0.4396076202392578, -0.42656421661376953, -0.41352081298828125, -0.40047740936279297, -0.3874340057373047, -0.3743906021118164, -0.3613471984863281, -0.34830379486083984, -0.33526039123535156, -0.3222169876098633, -0.309173583984375, -0.2961301803588867, -0.28308677673339844, -0.27004337310791016, -0.2569999694824219, -0.2439565658569336, -0.2309131622314453, -0.21786975860595703, -0.20482635498046875, -0.19178295135498047, -0.1787395477294922, -0.1656961441040039, -0.15265274047851562, -0.13960933685302734, -0.12656593322753906, -0.11352252960205078, -0.1004791259765625, -0.08743572235107422, -0.07439231872558594, -0.061348915100097656, -0.048305511474609375, -0.035262107849121094, -0.022218704223632812, -0.009175300598144531, 0.00386810302734375, 0.01691150665283203, 0.029954910278320312, 0.042998313903808594, 0.056041717529296875, 0.06908512115478516, 0.08212852478027344, 0.09517192840576172, 0.10821533203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 33.0, 78.0, 225.0, 350.0, 2986.0, 4189830.0, 492.0, 192.0, 80.0, 18.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-89.625, -87.841552734375, -86.05810546875, -84.274658203125, -82.4912109375, -80.707763671875, -78.92431640625, -77.140869140625, -75.357421875, -73.573974609375, -71.79052734375, -70.007080078125, -68.2236328125, -66.440185546875, -64.65673828125, -62.873291015625, -61.08984375, -59.306396484375, -57.52294921875, -55.739501953125, -53.9560546875, -52.172607421875, -50.38916015625, -48.605712890625, -46.822265625, -45.038818359375, -43.25537109375, -41.471923828125, -39.6884765625, -37.905029296875, -36.12158203125, -34.338134765625, -32.5546875, -30.771240234375, -28.98779296875, -27.204345703125, -25.4208984375, -23.637451171875, -21.85400390625, -20.070556640625, -18.287109375, -16.503662109375, -14.72021484375, -12.936767578125, -11.1533203125, -9.369873046875, -7.58642578125, -5.802978515625, -4.01953125, -2.236083984375, -0.45263671875, 1.330810546875, 3.1142578125, 4.897705078125, 6.68115234375, 8.464599609375, 10.248046875, 12.031494140625, 13.81494140625, 15.598388671875, 17.3818359375, 19.165283203125, 20.94873046875, 22.732177734375, 24.515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 13.0, 202.0, 3761.0, 108.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.977996826171875, -5.86614990234375, -5.754302978515625, -5.6424560546875, -5.530609130859375, -5.41876220703125, -5.306915283203125, -5.195068359375, -5.083221435546875, -4.97137451171875, -4.859527587890625, -4.7476806640625, -4.635833740234375, -4.52398681640625, -4.412139892578125, -4.30029296875, -4.188446044921875, -4.07659912109375, -3.964752197265625, -3.8529052734375, -3.741058349609375, -3.62921142578125, -3.517364501953125, -3.405517578125, -3.293670654296875, -3.18182373046875, -3.069976806640625, -2.9581298828125, -2.846282958984375, -2.73443603515625, -2.622589111328125, -2.5107421875, -2.398895263671875, -2.28704833984375, -2.175201416015625, -2.0633544921875, -1.951507568359375, -1.83966064453125, -1.727813720703125, -1.615966796875, -1.504119873046875, -1.39227294921875, -1.280426025390625, -1.1685791015625, -1.056732177734375, -0.94488525390625, -0.833038330078125, -0.72119140625, -0.609344482421875, -0.49749755859375, -0.385650634765625, -0.2738037109375, -0.161956787109375, -0.05010986328125, 0.061737060546875, 0.173583984375, 0.285430908203125, 0.39727783203125, 0.509124755859375, 0.6209716796875, 0.732818603515625, 0.84466552734375, 0.956512451171875, 1.068359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 106.0, 842.0, 52.0, 4.0, 1.0, 2.0], "bins": [-118.08844757080078, -116.10152435302734, -114.1146011352539, -112.12767028808594, -110.1407470703125, -108.15382385253906, -106.16690063476562, -104.17996978759766, -102.19304656982422, -100.20612335205078, -98.21920013427734, -96.23226928710938, -94.24534606933594, -92.2584228515625, -90.27149963378906, -88.2845687866211, -86.29764556884766, -84.31072235107422, -82.32379913330078, -80.33686828613281, -78.34994506835938, -76.36302185058594, -74.3760986328125, -72.38916778564453, -70.4022445678711, -68.41532135009766, -66.42839813232422, -64.44146728515625, -62.45454406738281, -60.467620849609375, -58.48069381713867, -56.493770599365234, -54.5068473815918, -52.51992416381836, -50.532997131347656, -48.54607391357422, -46.559146881103516, -44.57222366333008, -42.585296630859375, -40.59837341308594, -38.611446380615234, -36.6245231628418, -34.637596130371094, -32.650672912597656, -30.663745880126953, -28.676822662353516, -26.689895629882812, -24.702972412109375, -22.716045379638672, -20.7291202545166, -18.74219512939453, -16.75527000427246, -14.76834487915039, -12.781420707702637, -10.794495582580566, -8.807570457458496, -6.820646286010742, -4.833721160888672, -2.8467962741851807, -0.8598713874816895, 1.1270537376403809, 3.113978385925293, 5.100903511047363, 7.087828636169434, 9.074753761291504]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 10.0, 22.0, 44.0, 73.0, 117.0, 177.0, 164.0, 141.0, 97.0, 75.0, 47.0, 16.0, 13.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.80453872680664, -18.16191291809082, -17.519289016723633, -16.876663208007812, -16.234039306640625, -15.591413497924805, -14.9487886428833, -14.306163787841797, -13.663538932800293, -13.020914077758789, -12.378289222717285, -11.735664367675781, -11.093038558959961, -10.450414657592773, -9.807788848876953, -9.16516399383545, -8.522539138793945, -7.879914283752441, -7.2372894287109375, -6.594664096832275, -5.9520392417907715, -5.309414386749268, -4.6667890548706055, -4.024164199829102, -3.3815393447875977, -2.7389144897460938, -2.0962893962860107, -1.4536644220352173, -0.8110394477844238, -0.16841459274291992, 0.4742105007171631, 1.116835594177246, 1.7594623565673828, 2.4020872116088867, 3.0447123050689697, 3.6873373985290527, 4.329962253570557, 4.9725871086120605, 5.615212440490723, 6.257837295532227, 6.9004621505737305, 7.543087005615234, 8.185711860656738, 8.828336715698242, 9.470962524414062, 10.11358642578125, 10.75621223449707, 11.398837089538574, 12.041461944580078, 12.684086799621582, 13.326711654663086, 13.96933650970459, 14.611961364746094, 15.254587173461914, 15.897212028503418, 16.539836883544922, 17.18246078491211, 17.82508659362793, 18.467710494995117, 19.110336303710938, 19.752960205078125, 20.395586013793945, 21.038209915161133, 21.680835723876953, 22.323461532592773]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 7.0, 9.0, 7.0, 16.0, 19.0, 26.0, 39.0, 72.0, 97.0, 176.0, 301.0, 621.0, 1652.0, 6922.0, 70781.0, 872305.0, 84107.0, 8046.0, 1866.0, 692.0, 288.0, 173.0, 86.0, 71.0, 35.0, 36.0, 18.0, 13.0, 19.0, 12.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.78515625, -7.5596923828125, -7.334228515625, -7.1087646484375, -6.88330078125, -6.6578369140625, -6.432373046875, -6.2069091796875, -5.9814453125, -5.7559814453125, -5.530517578125, -5.3050537109375, -5.07958984375, -4.8541259765625, -4.628662109375, -4.4031982421875, -4.177734375, -3.9522705078125, -3.726806640625, -3.5013427734375, -3.27587890625, -3.0504150390625, -2.824951171875, -2.5994873046875, -2.3740234375, -2.1485595703125, -1.923095703125, -1.6976318359375, -1.47216796875, -1.2467041015625, -1.021240234375, -0.7957763671875, -0.5703125, -0.3448486328125, -0.119384765625, 0.1060791015625, 0.33154296875, 0.5570068359375, 0.782470703125, 1.0079345703125, 1.2333984375, 1.4588623046875, 1.684326171875, 1.9097900390625, 2.13525390625, 2.3607177734375, 2.586181640625, 2.8116455078125, 3.037109375, 3.2625732421875, 3.488037109375, 3.7135009765625, 3.93896484375, 4.1644287109375, 4.389892578125, 4.6153564453125, 4.8408203125, 5.0662841796875, 5.291748046875, 5.5172119140625, 5.74267578125, 5.9681396484375, 6.193603515625, 6.4190673828125, 6.64453125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 11.0, 18.0, 32.0, 49.0, 83.0, 120.0, 129.0, 153.0, 118.0, 96.0, 67.0, 59.0, 31.0, 17.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1796875, -1.150390625, -1.12109375, -1.091796875, -1.0625, -1.033203125, -1.00390625, -0.974609375, -0.9453125, -0.916015625, -0.88671875, -0.857421875, -0.828125, -0.798828125, -0.76953125, -0.740234375, -0.7109375, -0.681640625, -0.65234375, -0.623046875, -0.59375, -0.564453125, -0.53515625, -0.505859375, -0.4765625, -0.447265625, -0.41796875, -0.388671875, -0.359375, -0.330078125, -0.30078125, -0.271484375, -0.2421875, -0.212890625, -0.18359375, -0.154296875, -0.125, -0.095703125, -0.06640625, -0.037109375, -0.0078125, 0.021484375, 0.05078125, 0.080078125, 0.109375, 0.138671875, 0.16796875, 0.197265625, 0.2265625, 0.255859375, 0.28515625, 0.314453125, 0.34375, 0.373046875, 0.40234375, 0.431640625, 0.4609375, 0.490234375, 0.51953125, 0.548828125, 0.578125, 0.607421875, 0.63671875, 0.666015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 8.0, 2.0, 10.0, 12.0, 16.0, 19.0, 19.0, 25.0, 33.0, 34.0, 50.0, 81.0, 190.0, 513.0, 4258.0, 170445.0, 857591.0, 13563.0, 1065.0, 243.0, 109.0, 70.0, 47.0, 32.0, 18.0, 19.0, 20.0, 10.0, 7.0, 7.0, 9.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40234375, -7.17938232421875, -6.9564208984375, -6.73345947265625, -6.510498046875, -6.28753662109375, -6.0645751953125, -5.84161376953125, -5.61865234375, -5.39569091796875, -5.1727294921875, -4.94976806640625, -4.726806640625, -4.50384521484375, -4.2808837890625, -4.05792236328125, -3.8349609375, -3.61199951171875, -3.3890380859375, -3.16607666015625, -2.943115234375, -2.72015380859375, -2.4971923828125, -2.27423095703125, -2.05126953125, -1.82830810546875, -1.6053466796875, -1.38238525390625, -1.159423828125, -0.93646240234375, -0.7135009765625, -0.49053955078125, -0.267578125, -0.04461669921875, 0.1783447265625, 0.40130615234375, 0.624267578125, 0.84722900390625, 1.0701904296875, 1.29315185546875, 1.51611328125, 1.73907470703125, 1.9620361328125, 2.18499755859375, 2.407958984375, 2.63092041015625, 2.8538818359375, 3.07684326171875, 3.2998046875, 3.52276611328125, 3.7457275390625, 3.96868896484375, 4.191650390625, 4.41461181640625, 4.6375732421875, 4.86053466796875, 5.08349609375, 5.30645751953125, 5.5294189453125, 5.75238037109375, 5.975341796875, 6.19830322265625, 6.4212646484375, 6.64422607421875, 6.8671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 6.0, 10.0, 11.0, 13.0, 12.0, 16.0, 31.0, 22.0, 27.0, 28.0, 46.0, 53.0, 51.0, 60.0, 60.0, 60.0, 58.0, 48.0, 52.0, 63.0, 51.0, 47.0, 33.0, 33.0, 14.0, 14.0, 20.0, 8.0, 13.0, 8.0, 9.0, 4.0, 3.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.9828338623046875, -1.920745849609375, -1.8586578369140625, -1.79656982421875, -1.7344818115234375, -1.672393798828125, -1.6103057861328125, -1.5482177734375, -1.4861297607421875, -1.424041748046875, -1.3619537353515625, -1.29986572265625, -1.2377777099609375, -1.175689697265625, -1.1136016845703125, -1.051513671875, -0.9894256591796875, -0.927337646484375, -0.8652496337890625, -0.80316162109375, -0.7410736083984375, -0.678985595703125, -0.6168975830078125, -0.5548095703125, -0.4927215576171875, -0.430633544921875, -0.3685455322265625, -0.30645751953125, -0.2443695068359375, -0.182281494140625, -0.1201934814453125, -0.05810546875, 0.0039825439453125, 0.066070556640625, 0.1281585693359375, 0.19024658203125, 0.2523345947265625, 0.314422607421875, 0.3765106201171875, 0.4385986328125, 0.5006866455078125, 0.562774658203125, 0.6248626708984375, 0.68695068359375, 0.7490386962890625, 0.811126708984375, 0.8732147216796875, 0.935302734375, 0.9973907470703125, 1.059478759765625, 1.1215667724609375, 1.18365478515625, 1.2457427978515625, 1.307830810546875, 1.3699188232421875, 1.4320068359375, 1.4940948486328125, 1.556182861328125, 1.6182708740234375, 1.68035888671875, 1.7424468994140625, 1.804534912109375, 1.8666229248046875, 1.9287109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 8.0, 16.0, 27.0, 59.0, 106.0, 238.0, 765.0, 3533.0, 96673.0, 934536.0, 10631.0, 1241.0, 386.0, 167.0, 69.0, 38.0, 19.0, 12.0, 9.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84765625, -6.66851806640625, -6.4893798828125, -6.31024169921875, -6.131103515625, -5.95196533203125, -5.7728271484375, -5.59368896484375, -5.41455078125, -5.23541259765625, -5.0562744140625, -4.87713623046875, -4.697998046875, -4.51885986328125, -4.3397216796875, -4.16058349609375, -3.9814453125, -3.80230712890625, -3.6231689453125, -3.44403076171875, -3.264892578125, -3.08575439453125, -2.9066162109375, -2.72747802734375, -2.54833984375, -2.36920166015625, -2.1900634765625, -2.01092529296875, -1.831787109375, -1.65264892578125, -1.4735107421875, -1.29437255859375, -1.115234375, -0.93609619140625, -0.7569580078125, -0.57781982421875, -0.398681640625, -0.21954345703125, -0.0404052734375, 0.13873291015625, 0.31787109375, 0.49700927734375, 0.6761474609375, 0.85528564453125, 1.034423828125, 1.21356201171875, 1.3927001953125, 1.57183837890625, 1.7509765625, 1.93011474609375, 2.1092529296875, 2.28839111328125, 2.467529296875, 2.64666748046875, 2.8258056640625, 3.00494384765625, 3.18408203125, 3.36322021484375, 3.5423583984375, 3.72149658203125, 3.900634765625, 4.07977294921875, 4.2589111328125, 4.43804931640625, 4.6171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 5.0, 6.0, 9.0, 12.0, 24.0, 33.0, 46.0, 64.0, 82.0, 118.0, 156.0, 124.0, 89.0, 69.0, 53.0, 36.0, 21.0, 6.0, 12.0, 8.0, 9.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00020074844360351562, -0.00019478052854537964, -0.00018881261348724365, -0.00018284469842910767, -0.00017687678337097168, -0.0001709088683128357, -0.0001649409532546997, -0.00015897303819656372, -0.00015300512313842773, -0.00014703720808029175, -0.00014106929302215576, -0.00013510137796401978, -0.0001291334629058838, -0.0001231655478477478, -0.00011719763278961182, -0.00011122971773147583, -0.00010526180267333984, -9.929388761520386e-05, -9.332597255706787e-05, -8.735805749893188e-05, -8.13901424407959e-05, -7.542222738265991e-05, -6.945431232452393e-05, -6.348639726638794e-05, -5.751848220825195e-05, -5.155056715011597e-05, -4.558265209197998e-05, -3.9614737033843994e-05, -3.364682197570801e-05, -2.767890691757202e-05, -2.1710991859436035e-05, -1.574307680130005e-05, -9.775161743164062e-06, -3.807246685028076e-06, 2.16066837310791e-06, 8.128583431243896e-06, 1.4096498489379883e-05, 2.006441354751587e-05, 2.6032328605651855e-05, 3.200024366378784e-05, 3.796815872192383e-05, 4.3936073780059814e-05, 4.99039888381958e-05, 5.587190389633179e-05, 6.183981895446777e-05, 6.780773401260376e-05, 7.377564907073975e-05, 7.974356412887573e-05, 8.571147918701172e-05, 9.16793942451477e-05, 9.764730930328369e-05, 0.00010361522436141968, 0.00010958313941955566, 0.00011555105447769165, 0.00012151896953582764, 0.00012748688459396362, 0.0001334547996520996, 0.0001394227147102356, 0.00014539062976837158, 0.00015135854482650757, 0.00015732645988464355, 0.00016329437494277954, 0.00016926229000091553, 0.00017523020505905151, 0.0001811981201171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 9.0, 11.0, 20.0, 40.0, 110.0, 391.0, 2961.0, 295577.0, 744578.0, 4131.0, 437.0, 123.0, 54.0, 29.0, 15.0, 13.0, 9.0, 6.0, 2.0, 4.0, 3.0, 7.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.31640625, -7.1337890625, -6.951171875, -6.7685546875, -6.5859375, -6.4033203125, -6.220703125, -6.0380859375, -5.85546875, -5.6728515625, -5.490234375, -5.3076171875, -5.125, -4.9423828125, -4.759765625, -4.5771484375, -4.39453125, -4.2119140625, -4.029296875, -3.8466796875, -3.6640625, -3.4814453125, -3.298828125, -3.1162109375, -2.93359375, -2.7509765625, -2.568359375, -2.3857421875, -2.203125, -2.0205078125, -1.837890625, -1.6552734375, -1.47265625, -1.2900390625, -1.107421875, -0.9248046875, -0.7421875, -0.5595703125, -0.376953125, -0.1943359375, -0.01171875, 0.1708984375, 0.353515625, 0.5361328125, 0.71875, 0.9013671875, 1.083984375, 1.2666015625, 1.44921875, 1.6318359375, 1.814453125, 1.9970703125, 2.1796875, 2.3623046875, 2.544921875, 2.7275390625, 2.91015625, 3.0927734375, 3.275390625, 3.4580078125, 3.640625, 3.8232421875, 4.005859375, 4.1884765625, 4.37109375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 5.0, 7.0, 14.0, 33.0, 48.0, 121.0, 163.0, 198.0, 145.0, 95.0, 63.0, 24.0, 15.0, 11.0, 9.0, 9.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.080078125, -2.02874755859375, -1.9774169921875, -1.92608642578125, -1.874755859375, -1.82342529296875, -1.7720947265625, -1.72076416015625, -1.66943359375, -1.61810302734375, -1.5667724609375, -1.51544189453125, -1.464111328125, -1.41278076171875, -1.3614501953125, -1.31011962890625, -1.2587890625, -1.20745849609375, -1.1561279296875, -1.10479736328125, -1.053466796875, -1.00213623046875, -0.9508056640625, -0.89947509765625, -0.84814453125, -0.79681396484375, -0.7454833984375, -0.69415283203125, -0.642822265625, -0.59149169921875, -0.5401611328125, -0.48883056640625, -0.4375, -0.38616943359375, -0.3348388671875, -0.28350830078125, -0.232177734375, -0.18084716796875, -0.1295166015625, -0.07818603515625, -0.02685546875, 0.02447509765625, 0.0758056640625, 0.12713623046875, 0.178466796875, 0.22979736328125, 0.2811279296875, 0.33245849609375, 0.3837890625, 0.43511962890625, 0.4864501953125, 0.53778076171875, 0.589111328125, 0.64044189453125, 0.6917724609375, 0.74310302734375, 0.79443359375, 0.84576416015625, 0.8970947265625, 0.94842529296875, 0.999755859375, 1.05108642578125, 1.1024169921875, 1.15374755859375, 1.205078125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 143.0, 796.0, 58.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-108.2940902709961, -105.38226318359375, -102.47042846679688, -99.55860137939453, -96.64677429199219, -93.73494720458984, -90.82311248779297, -87.91128540039062, -84.99945831298828, -82.08763122558594, -79.17579650878906, -76.26396942138672, -73.35214233398438, -70.44031524658203, -67.52848052978516, -64.61665344238281, -61.7048225402832, -58.792991638183594, -55.88116455078125, -52.96933364868164, -50.0575065612793, -47.14567565917969, -44.233848571777344, -41.322017669677734, -38.410186767578125, -35.498355865478516, -32.58652877807617, -29.674697875976562, -26.76287078857422, -23.85103988647461, -20.939210891723633, -18.027381896972656, -15.115554809570312, -12.203725814819336, -9.29189682006836, -6.380066871643066, -3.46823787689209, -0.5564088821411133, 2.3554210662841797, 5.267250061035156, 8.179079055786133, 11.09090805053711, 14.002737045288086, 16.914566040039062, 19.826396942138672, 22.738224029541016, 25.650054931640625, 28.5618839263916, 31.473712921142578, 34.38554382324219, 37.29737091064453, 40.20920181274414, 43.121028900146484, 46.032859802246094, 48.94468688964844, 51.85651779174805, 54.768348693847656, 57.680179595947266, 60.59200668334961, 63.50383758544922, 66.41566467285156, 69.3274917602539, 72.23932647705078, 75.15115356445312, 78.06298065185547]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 9.0, 13.0, 9.0, 8.0, 18.0, 20.0, 36.0, 36.0, 55.0, 49.0, 63.0, 67.0, 73.0, 75.0, 77.0, 79.0, 51.0, 61.0, 50.0, 32.0, 36.0, 30.0, 15.0, 16.0, 10.0, 6.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.02103042602539, -15.478071212768555, -14.935111045837402, -14.392151832580566, -13.84919261932373, -13.306232452392578, -12.763273239135742, -12.220314025878906, -11.67735481262207, -11.134395599365234, -10.591435432434082, -10.048476219177246, -9.50551700592041, -8.962556838989258, -8.419597625732422, -7.876638412475586, -7.333678245544434, -6.7907185554504395, -6.2477593421936035, -5.704799652099609, -5.161840438842773, -4.618880748748779, -4.075921058654785, -3.53296160697937, -2.990002155303955, -2.44704270362854, -1.9040831327438354, -1.3611235618591309, -0.8181641101837158, -0.2752046585083008, 0.26775503158569336, 0.8107144832611084, 1.3536739349365234, 1.8966333866119385, 2.4395928382873535, 2.9825525283813477, 3.5255119800567627, 4.068471431732178, 4.611431121826172, 5.154390335083008, 5.697350025177002, 6.240309715270996, 6.783268928527832, 7.326228618621826, 7.86918830871582, 8.412147521972656, 8.955106735229492, 9.498066902160645, 10.04102611541748, 10.583985328674316, 11.126945495605469, 11.669904708862305, 12.21286392211914, 12.755823135375977, 13.298783302307129, 13.841742515563965, 14.384702682495117, 14.927661895751953, 15.470622062683105, 16.013580322265625, 16.556541442871094, 17.09950065612793, 17.642459869384766, 18.1854190826416, 18.728378295898438]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 2.0, 10.0, 10.0, 25.0, 43.0, 62.0, 114.0, 253.0, 560.0, 2451.0, 56136.0, 4118984.0, 14102.0, 1024.0, 244.0, 101.0, 52.0, 49.0, 28.0, 11.0, 8.0, 5.0, 7.0, 2.0, 0.0, 2.0], "bins": [-24.46875, -23.972900390625, -23.47705078125, -22.981201171875, -22.4853515625, -21.989501953125, -21.49365234375, -20.997802734375, -20.501953125, -20.006103515625, -19.51025390625, -19.014404296875, -18.5185546875, -18.022705078125, -17.52685546875, -17.031005859375, -16.53515625, -16.039306640625, -15.54345703125, -15.047607421875, -14.5517578125, -14.055908203125, -13.56005859375, -13.064208984375, -12.568359375, -12.072509765625, -11.57666015625, -11.080810546875, -10.5849609375, -10.089111328125, -9.59326171875, -9.097412109375, -8.6015625, -8.105712890625, -7.60986328125, -7.114013671875, -6.6181640625, -6.122314453125, -5.62646484375, -5.130615234375, -4.634765625, -4.138916015625, -3.64306640625, -3.147216796875, -2.6513671875, -2.155517578125, -1.65966796875, -1.163818359375, -0.66796875, -0.172119140625, 0.32373046875, 0.819580078125, 1.3154296875, 1.811279296875, 2.30712890625, 2.802978515625, 3.298828125, 3.794677734375, 4.29052734375, 4.786376953125, 5.2822265625, 5.778076171875, 6.27392578125, 6.769775390625, 7.265625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 8.0, 18.0, 34.0, 46.0, 80.0, 80.0, 104.0, 118.0, 143.0, 100.0, 84.0, 65.0, 37.0, 28.0, 23.0, 12.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3134765625, -1.2859992980957031, -1.2585220336914062, -1.2310447692871094, -1.2035675048828125, -1.1760902404785156, -1.1486129760742188, -1.1211357116699219, -1.093658447265625, -1.0661811828613281, -1.0387039184570312, -1.0112266540527344, -0.9837493896484375, -0.9562721252441406, -0.9287948608398438, -0.9013175964355469, -0.87384033203125, -0.8463630676269531, -0.8188858032226562, -0.7914085388183594, -0.7639312744140625, -0.7364540100097656, -0.7089767456054688, -0.6814994812011719, -0.654022216796875, -0.6265449523925781, -0.5990676879882812, -0.5715904235839844, -0.5441131591796875, -0.5166358947753906, -0.48915863037109375, -0.4616813659667969, -0.4342041015625, -0.4067268371582031, -0.37924957275390625, -0.3517723083496094, -0.3242950439453125, -0.2968177795410156, -0.26934051513671875, -0.24186325073242188, -0.214385986328125, -0.18690872192382812, -0.15943145751953125, -0.13195419311523438, -0.1044769287109375, -0.07699966430664062, -0.04952239990234375, -0.022045135498046875, 0.00543212890625, 0.032909393310546875, 0.06038665771484375, 0.08786392211914062, 0.1153411865234375, 0.14281845092773438, 0.17029571533203125, 0.19777297973632812, 0.225250244140625, 0.2527275085449219, 0.28020477294921875, 0.3076820373535156, 0.3351593017578125, 0.3626365661621094, 0.39011383056640625, 0.4175910949707031, 0.445068359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 12.0, 40.0, 171.0, 754.0, 138914.0, 4053792.0, 477.0, 81.0, 25.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-87.625, -85.94140625, -84.2578125, -82.57421875, -80.890625, -79.20703125, -77.5234375, -75.83984375, -74.15625, -72.47265625, -70.7890625, -69.10546875, -67.421875, -65.73828125, -64.0546875, -62.37109375, -60.6875, -59.00390625, -57.3203125, -55.63671875, -53.953125, -52.26953125, -50.5859375, -48.90234375, -47.21875, -45.53515625, -43.8515625, -42.16796875, -40.484375, -38.80078125, -37.1171875, -35.43359375, -33.75, -32.06640625, -30.3828125, -28.69921875, -27.015625, -25.33203125, -23.6484375, -21.96484375, -20.28125, -18.59765625, -16.9140625, -15.23046875, -13.546875, -11.86328125, -10.1796875, -8.49609375, -6.8125, -5.12890625, -3.4453125, -1.76171875, -0.078125, 1.60546875, 3.2890625, 4.97265625, 6.65625, 8.33984375, 10.0234375, 11.70703125, 13.390625, 15.07421875, 16.7578125, 18.44140625, 20.125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 33.0, 81.0, 601.0, 3170.0, 141.0, 32.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-6.58984375, -6.47052001953125, -6.3511962890625, -6.23187255859375, -6.112548828125, -5.99322509765625, -5.8739013671875, -5.75457763671875, -5.63525390625, -5.51593017578125, -5.3966064453125, -5.27728271484375, -5.157958984375, -5.03863525390625, -4.9193115234375, -4.79998779296875, -4.6806640625, -4.56134033203125, -4.4420166015625, -4.32269287109375, -4.203369140625, -4.08404541015625, -3.9647216796875, -3.84539794921875, -3.72607421875, -3.60675048828125, -3.4874267578125, -3.36810302734375, -3.248779296875, -3.12945556640625, -3.0101318359375, -2.89080810546875, -2.771484375, -2.65216064453125, -2.5328369140625, -2.41351318359375, -2.294189453125, -2.17486572265625, -2.0555419921875, -1.93621826171875, -1.81689453125, -1.69757080078125, -1.5782470703125, -1.45892333984375, -1.339599609375, -1.22027587890625, -1.1009521484375, -0.98162841796875, -0.8623046875, -0.74298095703125, -0.6236572265625, -0.50433349609375, -0.385009765625, -0.26568603515625, -0.1463623046875, -0.02703857421875, 0.09228515625, 0.21160888671875, 0.3309326171875, 0.45025634765625, 0.569580078125, 0.68890380859375, 0.8082275390625, 0.92755126953125, 1.046875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 11.0, 36.0, 641.0, 321.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.562095642089844, -34.89507293701172, -33.22805404663086, -31.561031341552734, -29.894010543823242, -28.22698974609375, -26.559967041015625, -24.892946243286133, -23.22592544555664, -21.55890464782715, -19.891883850097656, -18.22486114501953, -16.55784034729004, -14.890819549560547, -13.223797798156738, -11.55677604675293, -9.889755249023438, -8.222734451293945, -6.555712699890137, -4.888691425323486, -3.221670150756836, -1.5546493530273438, 0.11237239837646484, 1.7793941497802734, 3.4464149475097656, 5.113436222076416, 6.780457496643066, 8.447479248046875, 10.114500045776367, 11.78152084350586, 13.448542594909668, 15.115564346313477, 16.78258514404297, 18.44960594177246, 20.116626739501953, 21.783649444580078, 23.45067024230957, 25.117691040039062, 26.784713745117188, 28.45173454284668, 30.118755340576172, 31.785776138305664, 33.452796936035156, 35.11981964111328, 36.786842346191406, 38.453861236572266, 40.12088394165039, 41.78790283203125, 43.454925537109375, 45.1219482421875, 46.78896713256836, 48.455989837646484, 50.123008728027344, 51.79003143310547, 53.457054138183594, 55.12407684326172, 56.79109573364258, 58.4581184387207, 60.12513732910156, 61.79216003417969, 63.45918273925781, 65.12620544433594, 66.79322052001953, 68.46024322509766, 70.12726593017578]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 19.0, 18.0, 30.0, 56.0, 69.0, 100.0, 102.0, 124.0, 119.0, 98.0, 78.0, 72.0, 44.0, 31.0, 18.0, 11.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.979488372802734, -16.497888565063477, -16.01628875732422, -15.534687995910645, -15.05308723449707, -14.571487426757812, -14.089886665344238, -13.60828685760498, -13.126686096191406, -12.645086288452148, -12.163485527038574, -11.681885719299316, -11.200284957885742, -10.718685150146484, -10.23708438873291, -9.755484580993652, -9.273883819580078, -8.79228401184082, -8.310683250427246, -7.82908296585083, -7.347482681274414, -6.865882873535156, -6.384282112121582, -5.902682304382324, -5.421082496643066, -4.93948221206665, -4.457881927490234, -3.9762816429138184, -3.4946813583374023, -3.0130813121795654, -2.5314810276031494, -2.0498807430267334, -1.5682802200317383, -1.0866799354553223, -0.605079710483551, -0.12347948551177979, 0.35812079906463623, 0.8397209644317627, 1.3213212490081787, 1.8029215335845947, 2.2845218181610107, 2.7661221027374268, 3.2477223873138428, 3.7293224334716797, 4.210922718048096, 4.692523002624512, 5.174123287200928, 5.655723571777344, 6.13732385635376, 6.618924140930176, 7.100524425506592, 7.582124710083008, 8.063724517822266, 8.54532527923584, 9.026925086975098, 9.508525848388672, 9.99012565612793, 10.471725463867188, 10.953326225280762, 11.43492603302002, 11.916526794433594, 12.398126602172852, 12.879727363586426, 13.361327171325684, 13.842927932739258]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 10.0, 8.0, 21.0, 24.0, 25.0, 30.0, 52.0, 58.0, 90.0, 115.0, 179.0, 284.0, 460.0, 999.0, 2696.0, 10019.0, 50842.0, 437749.0, 474425.0, 54585.0, 10603.0, 2819.0, 1060.0, 456.0, 284.0, 192.0, 138.0, 82.0, 75.0, 46.0, 34.0, 30.0, 15.0, 17.0, 11.0, 10.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.52734375, -5.3648681640625, -5.202392578125, -5.0399169921875, -4.87744140625, -4.7149658203125, -4.552490234375, -4.3900146484375, -4.2275390625, -4.0650634765625, -3.902587890625, -3.7401123046875, -3.57763671875, -3.4151611328125, -3.252685546875, -3.0902099609375, -2.927734375, -2.7652587890625, -2.602783203125, -2.4403076171875, -2.27783203125, -2.1153564453125, -1.952880859375, -1.7904052734375, -1.6279296875, -1.4654541015625, -1.302978515625, -1.1405029296875, -0.97802734375, -0.8155517578125, -0.653076171875, -0.4906005859375, -0.328125, -0.1656494140625, -0.003173828125, 0.1593017578125, 0.32177734375, 0.4842529296875, 0.646728515625, 0.8092041015625, 0.9716796875, 1.1341552734375, 1.296630859375, 1.4591064453125, 1.62158203125, 1.7840576171875, 1.946533203125, 2.1090087890625, 2.271484375, 2.4339599609375, 2.596435546875, 2.7589111328125, 2.92138671875, 3.0838623046875, 3.246337890625, 3.4088134765625, 3.5712890625, 3.7337646484375, 3.896240234375, 4.0587158203125, 4.22119140625, 4.3836669921875, 4.546142578125, 4.7086181640625, 4.87109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 12.0, 7.0, 25.0, 40.0, 49.0, 62.0, 67.0, 91.0, 92.0, 131.0, 102.0, 86.0, 72.0, 66.0, 41.0, 19.0, 19.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4912109375, -1.4521636962890625, -1.413116455078125, -1.3740692138671875, -1.33502197265625, -1.2959747314453125, -1.256927490234375, -1.2178802490234375, -1.1788330078125, -1.1397857666015625, -1.100738525390625, -1.0616912841796875, -1.02264404296875, -0.9835968017578125, -0.944549560546875, -0.9055023193359375, -0.866455078125, -0.8274078369140625, -0.788360595703125, -0.7493133544921875, -0.71026611328125, -0.6712188720703125, -0.632171630859375, -0.5931243896484375, -0.5540771484375, -0.5150299072265625, -0.475982666015625, -0.4369354248046875, -0.39788818359375, -0.3588409423828125, -0.319793701171875, -0.2807464599609375, -0.24169921875, -0.2026519775390625, -0.163604736328125, -0.1245574951171875, -0.08551025390625, -0.0464630126953125, -0.007415771484375, 0.0316314697265625, 0.0706787109375, 0.1097259521484375, 0.148773193359375, 0.1878204345703125, 0.22686767578125, 0.2659149169921875, 0.304962158203125, 0.3440093994140625, 0.383056640625, 0.4221038818359375, 0.461151123046875, 0.5001983642578125, 0.53924560546875, 0.5782928466796875, 0.617340087890625, 0.6563873291015625, 0.6954345703125, 0.7344818115234375, 0.773529052734375, 0.8125762939453125, 0.85162353515625, 0.8906707763671875, 0.929718017578125, 0.9687652587890625, 1.0078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 12.0, 10.0, 9.0, 23.0, 25.0, 28.0, 41.0, 69.0, 132.0, 283.0, 1041.0, 4640.0, 36222.0, 677538.0, 305337.0, 18902.0, 2920.0, 738.0, 211.0, 121.0, 64.0, 38.0, 20.0, 28.0, 24.0, 12.0, 10.0, 10.0, 8.0, 1.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.546875, -5.36712646484375, -5.1873779296875, -5.00762939453125, -4.827880859375, -4.64813232421875, -4.4683837890625, -4.28863525390625, -4.10888671875, -3.92913818359375, -3.7493896484375, -3.56964111328125, -3.389892578125, -3.21014404296875, -3.0303955078125, -2.85064697265625, -2.6708984375, -2.49114990234375, -2.3114013671875, -2.13165283203125, -1.951904296875, -1.77215576171875, -1.5924072265625, -1.41265869140625, -1.23291015625, -1.05316162109375, -0.8734130859375, -0.69366455078125, -0.513916015625, -0.33416748046875, -0.1544189453125, 0.02532958984375, 0.205078125, 0.38482666015625, 0.5645751953125, 0.74432373046875, 0.924072265625, 1.10382080078125, 1.2835693359375, 1.46331787109375, 1.64306640625, 1.82281494140625, 2.0025634765625, 2.18231201171875, 2.362060546875, 2.54180908203125, 2.7215576171875, 2.90130615234375, 3.0810546875, 3.26080322265625, 3.4405517578125, 3.62030029296875, 3.800048828125, 3.97979736328125, 4.1595458984375, 4.33929443359375, 4.51904296875, 4.69879150390625, 4.8785400390625, 5.05828857421875, 5.238037109375, 5.41778564453125, 5.5975341796875, 5.77728271484375, 5.95703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 4.0, 7.0, 6.0, 8.0, 14.0, 10.0, 16.0, 23.0, 30.0, 17.0, 46.0, 40.0, 37.0, 46.0, 60.0, 45.0, 63.0, 59.0, 53.0, 49.0, 48.0, 56.0, 56.0, 35.0, 36.0, 28.0, 20.0, 23.0, 20.0, 5.0, 8.0, 10.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.958984375, -2.8642578125, -2.76953125, -2.6748046875, -2.580078125, -2.4853515625, -2.390625, -2.2958984375, -2.201171875, -2.1064453125, -2.01171875, -1.9169921875, -1.822265625, -1.7275390625, -1.6328125, -1.5380859375, -1.443359375, -1.3486328125, -1.25390625, -1.1591796875, -1.064453125, -0.9697265625, -0.875, -0.7802734375, -0.685546875, -0.5908203125, -0.49609375, -0.4013671875, -0.306640625, -0.2119140625, -0.1171875, -0.0224609375, 0.072265625, 0.1669921875, 0.26171875, 0.3564453125, 0.451171875, 0.5458984375, 0.640625, 0.7353515625, 0.830078125, 0.9248046875, 1.01953125, 1.1142578125, 1.208984375, 1.3037109375, 1.3984375, 1.4931640625, 1.587890625, 1.6826171875, 1.77734375, 1.8720703125, 1.966796875, 2.0615234375, 2.15625, 2.2509765625, 2.345703125, 2.4404296875, 2.53515625, 2.6298828125, 2.724609375, 2.8193359375, 2.9140625, 3.0087890625, 3.103515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 6.0, 12.0, 13.0, 10.0, 14.0, 42.0, 78.0, 151.0, 412.0, 1423.0, 9485.0, 421546.0, 601523.0, 11347.0, 1660.0, 436.0, 159.0, 77.0, 50.0, 33.0, 30.0, 4.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.95452880859375, -3.8348388671875, -3.71514892578125, -3.595458984375, -3.47576904296875, -3.3560791015625, -3.23638916015625, -3.11669921875, -2.99700927734375, -2.8773193359375, -2.75762939453125, -2.637939453125, -2.51824951171875, -2.3985595703125, -2.27886962890625, -2.1591796875, -2.03948974609375, -1.9197998046875, -1.80010986328125, -1.680419921875, -1.56072998046875, -1.4410400390625, -1.32135009765625, -1.20166015625, -1.08197021484375, -0.9622802734375, -0.84259033203125, -0.722900390625, -0.60321044921875, -0.4835205078125, -0.36383056640625, -0.244140625, -0.12445068359375, -0.0047607421875, 0.11492919921875, 0.234619140625, 0.35430908203125, 0.4739990234375, 0.59368896484375, 0.71337890625, 0.83306884765625, 0.9527587890625, 1.07244873046875, 1.192138671875, 1.31182861328125, 1.4315185546875, 1.55120849609375, 1.6708984375, 1.79058837890625, 1.9102783203125, 2.02996826171875, 2.149658203125, 2.26934814453125, 2.3890380859375, 2.50872802734375, 2.62841796875, 2.74810791015625, 2.8677978515625, 2.98748779296875, 3.107177734375, 3.22686767578125, 3.3465576171875, 3.46624755859375, 3.5859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 13.0, 15.0, 17.0, 25.0, 24.0, 44.0, 39.0, 70.0, 68.0, 113.0, 107.0, 101.0, 85.0, 65.0, 50.0, 31.0, 29.0, 21.0, 20.0, 11.0, 11.0, 15.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015687942504882812, -0.0001515764743089676, -0.00014627352356910706, -0.00014097057282924652, -0.00013566762208938599, -0.00013036467134952545, -0.00012506172060966492, -0.00011975876986980438, -0.00011445581912994385, -0.00010915286839008331, -0.00010384991765022278, -9.854696691036224e-05, -9.324401617050171e-05, -8.794106543064117e-05, -8.263811469078064e-05, -7.73351639509201e-05, -7.203221321105957e-05, -6.672926247119904e-05, -6.14263117313385e-05, -5.6123360991477966e-05, -5.082041025161743e-05, -4.55174595117569e-05, -4.021450877189636e-05, -3.491155803203583e-05, -2.9608607292175293e-05, -2.4305656552314758e-05, -1.9002705812454224e-05, -1.3699755072593689e-05, -8.396804332733154e-06, -3.0938535928726196e-06, 2.209097146987915e-06, 7.51204788684845e-06, 1.2814998626708984e-05, 1.811794936656952e-05, 2.3420900106430054e-05, 2.872385084629059e-05, 3.402680158615112e-05, 3.932975232601166e-05, 4.463270306587219e-05, 4.993565380573273e-05, 5.523860454559326e-05, 6.0541555285453796e-05, 6.584450602531433e-05, 7.114745676517487e-05, 7.64504075050354e-05, 8.175335824489594e-05, 8.705630898475647e-05, 9.2359259724617e-05, 9.766221046447754e-05, 0.00010296516120433807, 0.00010826811194419861, 0.00011357106268405914, 0.00011887401342391968, 0.0001241769641637802, 0.00012947991490364075, 0.00013478286564350128, 0.00014008581638336182, 0.00014538876712322235, 0.00015069171786308289, 0.00015599466860294342, 0.00016129761934280396, 0.0001666005700826645, 0.00017190352082252502, 0.00017720647156238556, 0.0001825094223022461]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 22.0, 38.0, 78.0, 193.0, 601.0, 2767.0, 21869.0, 729563.0, 279849.0, 11169.0, 1646.0, 436.0, 150.0, 61.0, 32.0, 24.0, 7.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.7957763671875, -2.710693359375, -2.6256103515625, -2.54052734375, -2.4554443359375, -2.370361328125, -2.2852783203125, -2.2001953125, -2.1151123046875, -2.030029296875, -1.9449462890625, -1.85986328125, -1.7747802734375, -1.689697265625, -1.6046142578125, -1.51953125, -1.4344482421875, -1.349365234375, -1.2642822265625, -1.17919921875, -1.0941162109375, -1.009033203125, -0.9239501953125, -0.8388671875, -0.7537841796875, -0.668701171875, -0.5836181640625, -0.49853515625, -0.4134521484375, -0.328369140625, -0.2432861328125, -0.158203125, -0.0731201171875, 0.011962890625, 0.0970458984375, 0.18212890625, 0.2672119140625, 0.352294921875, 0.4373779296875, 0.5224609375, 0.6075439453125, 0.692626953125, 0.7777099609375, 0.86279296875, 0.9478759765625, 1.032958984375, 1.1180419921875, 1.203125, 1.2882080078125, 1.373291015625, 1.4583740234375, 1.54345703125, 1.6285400390625, 1.713623046875, 1.7987060546875, 1.8837890625, 1.9688720703125, 2.053955078125, 2.1390380859375, 2.22412109375, 2.3092041015625, 2.394287109375, 2.4793701171875, 2.564453125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 13.0, 17.0, 34.0, 33.0, 51.0, 94.0, 114.0, 139.0, 155.0, 117.0, 73.0, 50.0, 35.0, 19.0, 10.0, 10.0, 6.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5693359375, -1.5228118896484375, -1.476287841796875, -1.4297637939453125, -1.38323974609375, -1.3367156982421875, -1.290191650390625, -1.2436676025390625, -1.1971435546875, -1.1506195068359375, -1.104095458984375, -1.0575714111328125, -1.01104736328125, -0.9645233154296875, -0.917999267578125, -0.8714752197265625, -0.824951171875, -0.7784271240234375, -0.731903076171875, -0.6853790283203125, -0.63885498046875, -0.5923309326171875, -0.545806884765625, -0.4992828369140625, -0.4527587890625, -0.4062347412109375, -0.359710693359375, -0.3131866455078125, -0.26666259765625, -0.2201385498046875, -0.173614501953125, -0.1270904541015625, -0.08056640625, -0.0340423583984375, 0.012481689453125, 0.0590057373046875, 0.10552978515625, 0.1520538330078125, 0.198577880859375, 0.2451019287109375, 0.2916259765625, 0.3381500244140625, 0.384674072265625, 0.4311981201171875, 0.47772216796875, 0.5242462158203125, 0.570770263671875, 0.6172943115234375, 0.663818359375, 0.7103424072265625, 0.756866455078125, 0.8033905029296875, 0.84991455078125, 0.8964385986328125, 0.942962646484375, 0.9894866943359375, 1.0360107421875, 1.0825347900390625, 1.129058837890625, 1.1755828857421875, 1.22210693359375, 1.2686309814453125, 1.315155029296875, 1.3616790771484375, 1.408203125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 18.0, 43.0, 162.0, 380.0, 242.0, 100.0, 29.0, 13.0, 8.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.79099655151367, -35.659759521484375, -34.52851867675781, -33.397281646728516, -32.26604461669922, -31.13480567932129, -30.00356674194336, -28.872329711914062, -27.741090774536133, -26.609851837158203, -25.478614807128906, -24.347375869750977, -23.216136932373047, -22.08489990234375, -20.95366096496582, -19.82242202758789, -18.691184997558594, -17.559946060180664, -16.428709030151367, -15.297470092773438, -14.166232109069824, -13.034994125366211, -11.903755187988281, -10.772517204284668, -9.641279220581055, -8.510041236877441, -7.37880277633667, -6.247564315795898, -5.116326332092285, -3.985088348388672, -2.8538498878479004, -1.722611427307129, -0.59136962890625, 0.5398685932159424, 1.6711068153381348, 2.802345037460327, 3.9335832595825195, 5.064821243286133, 6.196059703826904, 7.327298164367676, 8.458536148071289, 9.589774131774902, 10.721012115478516, 11.852251052856445, 12.983489036560059, 14.114727020263672, 15.245965957641602, 16.37720489501953, 17.508441925048828, 18.639680862426758, 19.770917892456055, 20.902156829833984, 22.03339385986328, 23.16463279724121, 24.29587173461914, 25.427108764648438, 26.558347702026367, 27.689586639404297, 28.820823669433594, 29.952062606811523, 31.083301544189453, 32.21453857421875, 33.34577560424805, 34.47701644897461, 35.608253479003906]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 8.0, 13.0, 17.0, 16.0, 30.0, 30.0, 28.0, 38.0, 61.0, 52.0, 47.0, 59.0, 69.0, 66.0, 65.0, 59.0, 44.0, 43.0, 37.0, 34.0, 33.0, 26.0, 13.0, 24.0, 13.0, 17.0, 7.0, 8.0, 8.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.055347442626953, -18.48572540283203, -17.916105270385742, -17.34648323059082, -16.77686309814453, -16.20724105834961, -15.637619972229004, -15.067998886108398, -14.498377799987793, -13.928756713867188, -13.359135627746582, -12.789514541625977, -12.219892501831055, -11.650272369384766, -11.080650329589844, -10.511029243469238, -9.941408157348633, -9.371787071228027, -8.802165985107422, -8.232544898986816, -7.662923336029053, -7.093302249908447, -6.523680686950684, -5.954059600830078, -5.384438514709473, -4.814817428588867, -4.245196342468262, -3.675574779510498, -3.1059536933898926, -2.536332607269287, -1.9667112827301025, -1.397089958190918, -0.8274669647216797, -0.25784575939178467, 0.31177544593811035, 0.8813966512680054, 1.4510178565979004, 2.020638942718506, 2.5902602672576904, 3.159881591796875, 3.7295026779174805, 4.299123764038086, 4.868744850158691, 5.438366413116455, 6.0079874992370605, 6.577608585357666, 7.14723014831543, 7.716851234436035, 8.28647232055664, 8.856093406677246, 9.425714492797852, 9.995335578918457, 10.564956665039062, 11.134578704833984, 11.70419979095459, 12.273820877075195, 12.8434419631958, 13.413063049316406, 13.982684135437012, 14.552305221557617, 15.121927261352539, 15.691547393798828, 16.26116943359375, 16.830791473388672, 17.40041160583496]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 9.0, 6.0, 7.0, 12.0, 19.0, 23.0, 20.0, 43.0, 64.0, 102.0, 138.0, 296.0, 589.0, 1303.0, 3839.0, 18570.0, 621481.0, 3514835.0, 26255.0, 4403.0, 1282.0, 475.0, 202.0, 116.0, 65.0, 38.0, 26.0, 18.0, 8.0, 8.0, 10.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.8046875, -9.55377197265625, -9.3028564453125, -9.05194091796875, -8.801025390625, -8.55010986328125, -8.2991943359375, -8.04827880859375, -7.79736328125, -7.54644775390625, -7.2955322265625, -7.04461669921875, -6.793701171875, -6.54278564453125, -6.2918701171875, -6.04095458984375, -5.7900390625, -5.53912353515625, -5.2882080078125, -5.03729248046875, -4.786376953125, -4.53546142578125, -4.2845458984375, -4.03363037109375, -3.78271484375, -3.53179931640625, -3.2808837890625, -3.02996826171875, -2.779052734375, -2.52813720703125, -2.2772216796875, -2.02630615234375, -1.775390625, -1.52447509765625, -1.2735595703125, -1.02264404296875, -0.771728515625, -0.52081298828125, -0.2698974609375, -0.01898193359375, 0.23193359375, 0.48284912109375, 0.7337646484375, 0.98468017578125, 1.235595703125, 1.48651123046875, 1.7374267578125, 1.98834228515625, 2.2392578125, 2.49017333984375, 2.7410888671875, 2.99200439453125, 3.242919921875, 3.49383544921875, 3.7447509765625, 3.99566650390625, 4.24658203125, 4.49749755859375, 4.7484130859375, 4.99932861328125, 5.250244140625, 5.50115966796875, 5.7520751953125, 6.00299072265625, 6.25390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 11.0, 14.0, 10.0, 22.0, 28.0, 44.0, 70.0, 54.0, 78.0, 89.0, 78.0, 81.0, 86.0, 80.0, 69.0, 49.0, 29.0, 33.0, 22.0, 22.0, 9.0, 8.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-1.4814453125, -1.447601318359375, -1.41375732421875, -1.379913330078125, -1.3460693359375, -1.312225341796875, -1.27838134765625, -1.244537353515625, -1.210693359375, -1.176849365234375, -1.14300537109375, -1.109161376953125, -1.0753173828125, -1.041473388671875, -1.00762939453125, -0.973785400390625, -0.93994140625, -0.906097412109375, -0.87225341796875, -0.838409423828125, -0.8045654296875, -0.770721435546875, -0.73687744140625, -0.703033447265625, -0.669189453125, -0.635345458984375, -0.60150146484375, -0.567657470703125, -0.5338134765625, -0.499969482421875, -0.46612548828125, -0.432281494140625, -0.3984375, -0.364593505859375, -0.33074951171875, -0.296905517578125, -0.2630615234375, -0.229217529296875, -0.19537353515625, -0.161529541015625, -0.127685546875, -0.093841552734375, -0.05999755859375, -0.026153564453125, 0.0076904296875, 0.041534423828125, 0.07537841796875, 0.109222412109375, 0.14306640625, 0.176910400390625, 0.21075439453125, 0.244598388671875, 0.2784423828125, 0.312286376953125, 0.34613037109375, 0.379974365234375, 0.413818359375, 0.447662353515625, 0.48150634765625, 0.515350341796875, 0.5491943359375, 0.583038330078125, 0.61688232421875, 0.650726318359375, 0.6845703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 20.0, 38.0, 59.0, 158.0, 612.0, 4189870.0, 3003.0, 243.0, 118.0, 81.0, 48.0, 21.0, 9.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.46875, -27.70361328125, -25.9384765625, -24.17333984375, -22.408203125, -20.64306640625, -18.8779296875, -17.11279296875, -15.34765625, -13.58251953125, -11.8173828125, -10.05224609375, -8.287109375, -6.52197265625, -4.7568359375, -2.99169921875, -1.2265625, 0.53857421875, 2.3037109375, 4.06884765625, 5.833984375, 7.59912109375, 9.3642578125, 11.12939453125, 12.89453125, 14.65966796875, 16.4248046875, 18.18994140625, 19.955078125, 21.72021484375, 23.4853515625, 25.25048828125, 27.015625, 28.78076171875, 30.5458984375, 32.31103515625, 34.076171875, 35.84130859375, 37.6064453125, 39.37158203125, 41.13671875, 42.90185546875, 44.6669921875, 46.43212890625, 48.197265625, 49.96240234375, 51.7275390625, 53.49267578125, 55.2578125, 57.02294921875, 58.7880859375, 60.55322265625, 62.318359375, 64.08349609375, 65.8486328125, 67.61376953125, 69.37890625, 71.14404296875, 72.9091796875, 74.67431640625, 76.439453125, 78.20458984375, 79.9697265625, 81.73486328125, 83.5]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 17.0, 268.0, 3688.0, 99.0, 14.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51171875, -4.25213623046875, -3.9925537109375, -3.73297119140625, -3.473388671875, -3.21380615234375, -2.9542236328125, -2.69464111328125, -2.43505859375, -2.17547607421875, -1.9158935546875, -1.65631103515625, -1.396728515625, -1.13714599609375, -0.8775634765625, -0.61798095703125, -0.3583984375, -0.09881591796875, 0.1607666015625, 0.42034912109375, 0.679931640625, 0.93951416015625, 1.1990966796875, 1.45867919921875, 1.71826171875, 1.97784423828125, 2.2374267578125, 2.49700927734375, 2.756591796875, 3.01617431640625, 3.2757568359375, 3.53533935546875, 3.794921875, 4.05450439453125, 4.3140869140625, 4.57366943359375, 4.833251953125, 5.09283447265625, 5.3524169921875, 5.61199951171875, 5.87158203125, 6.13116455078125, 6.3907470703125, 6.65032958984375, 6.909912109375, 7.16949462890625, 7.4290771484375, 7.68865966796875, 7.9482421875, 8.20782470703125, 8.4674072265625, 8.72698974609375, 8.986572265625, 9.24615478515625, 9.5057373046875, 9.76531982421875, 10.02490234375, 10.28448486328125, 10.5440673828125, 10.80364990234375, 11.063232421875, 11.32281494140625, 11.5823974609375, 11.84197998046875, 12.1015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 12.0, 944.0, 60.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.3465118408203, -144.70880126953125, -141.07107543945312, -137.433349609375, -133.79563903808594, -130.15792846679688, -126.52020263671875, -122.88248443603516, -119.24476623535156, -115.60704803466797, -111.96932983398438, -108.33161163330078, -104.69389343261719, -101.0561752319336, -97.41845703125, -93.7807388305664, -90.14302062988281, -86.50530242919922, -82.86758422851562, -79.22986602783203, -75.59214782714844, -71.95442962646484, -68.31671142578125, -64.67899322509766, -61.04127502441406, -57.40355682373047, -53.765838623046875, -50.12812042236328, -46.49040222167969, -42.852684020996094, -39.2149658203125, -35.577247619628906, -31.939529418945312, -28.30181121826172, -24.664093017578125, -21.02637481689453, -17.388656616210938, -13.750938415527344, -10.11322021484375, -6.475502014160156, -2.8377838134765625, 0.7999343872070312, 4.437652587890625, 8.075370788574219, 11.713088989257812, 15.350807189941406, 18.988525390625, 22.626243591308594, 26.263961791992188, 29.90167999267578, 33.539398193359375, 37.17711639404297, 40.81483459472656, 44.452552795410156, 48.09027099609375, 51.727989196777344, 55.36570739746094, 59.00342559814453, 62.641143798828125, 66.27886199951172, 69.91658020019531, 73.5542984008789, 77.1920166015625, 80.8297348022461, 84.46745300292969]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 20.0, 27.0, 61.0, 71.0, 119.0, 137.0, 160.0, 134.0, 113.0, 74.0, 47.0, 18.0, 11.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.4368896484375, -16.95392417907715, -16.470958709716797, -15.987994194030762, -15.50502872467041, -15.022063255310059, -14.539098739624023, -14.056133270263672, -13.57316780090332, -13.090202331542969, -12.607236862182617, -12.124272346496582, -11.64130687713623, -11.158341407775879, -10.675376892089844, -10.192411422729492, -9.70944595336914, -9.226480484008789, -8.743515014648438, -8.260550498962402, -7.777585029602051, -7.294619560241699, -6.811654567718506, -6.3286895751953125, -5.845724105834961, -5.362758636474609, -4.879793643951416, -4.396828651428223, -3.913863182067871, -3.4308979511260986, -2.947932720184326, -2.4649674892425537, -1.9820013046264648, -1.4990360736846924, -1.01607084274292, -0.5331056118011475, -0.050140380859375, 0.43282485008239746, 0.9157900810241699, 1.3987553119659424, 1.8817205429077148, 2.3646857738494873, 2.8476510047912598, 3.3306162357330322, 3.8135814666748047, 4.296546936035156, 4.77951192855835, 5.262476921081543, 5.7454423904418945, 6.228407859802246, 6.7113728523254395, 7.194337844848633, 7.677303314208984, 8.160268783569336, 8.643234252929688, 9.126198768615723, 9.609164237976074, 10.092129707336426, 10.575094223022461, 11.058059692382812, 11.541025161743164, 12.023990631103516, 12.506956100463867, 12.989920616149902, 13.472886085510254]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 10.0, 15.0, 21.0, 29.0, 44.0, 67.0, 72.0, 112.0, 158.0, 237.0, 430.0, 786.0, 1860.0, 5189.0, 17617.0, 68158.0, 344694.0, 475137.0, 98577.0, 23878.0, 6905.0, 2356.0, 941.0, 456.0, 264.0, 161.0, 116.0, 75.0, 45.0, 32.0, 27.0, 27.0, 15.0, 11.0, 11.0, 4.0, 3.0, 5.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.559112548828125, -3.44830322265625, -3.337493896484375, -3.2266845703125, -3.115875244140625, -3.00506591796875, -2.894256591796875, -2.783447265625, -2.672637939453125, -2.56182861328125, -2.451019287109375, -2.3402099609375, -2.229400634765625, -2.11859130859375, -2.007781982421875, -1.89697265625, -1.786163330078125, -1.67535400390625, -1.564544677734375, -1.4537353515625, -1.342926025390625, -1.23211669921875, -1.121307373046875, -1.010498046875, -0.899688720703125, -0.78887939453125, -0.678070068359375, -0.5672607421875, -0.456451416015625, -0.34564208984375, -0.234832763671875, -0.1240234375, -0.013214111328125, 0.09759521484375, 0.208404541015625, 0.3192138671875, 0.430023193359375, 0.54083251953125, 0.651641845703125, 0.762451171875, 0.873260498046875, 0.98406982421875, 1.094879150390625, 1.2056884765625, 1.316497802734375, 1.42730712890625, 1.538116455078125, 1.64892578125, 1.759735107421875, 1.87054443359375, 1.981353759765625, 2.0921630859375, 2.202972412109375, 2.31378173828125, 2.424591064453125, 2.535400390625, 2.646209716796875, 2.75701904296875, 2.867828369140625, 2.9786376953125, 3.089447021484375, 3.20025634765625, 3.311065673828125, 3.421875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 11.0, 8.0, 12.0, 23.0, 29.0, 45.0, 42.0, 56.0, 70.0, 82.0, 94.0, 80.0, 105.0, 84.0, 70.0, 52.0, 31.0, 41.0, 22.0, 21.0, 8.0, 12.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2864761352539062, -1.2536163330078125, -1.2207565307617188, -1.187896728515625, -1.1550369262695312, -1.1221771240234375, -1.0893173217773438, -1.05645751953125, -1.0235977172851562, -0.9907379150390625, -0.9578781127929688, -0.925018310546875, -0.8921585083007812, -0.8592987060546875, -0.8264389038085938, -0.7935791015625, -0.7607192993164062, -0.7278594970703125, -0.6949996948242188, -0.662139892578125, -0.6292800903320312, -0.5964202880859375, -0.5635604858398438, -0.53070068359375, -0.49784088134765625, -0.4649810791015625, -0.43212127685546875, -0.399261474609375, -0.36640167236328125, -0.3335418701171875, -0.30068206787109375, -0.267822265625, -0.23496246337890625, -0.2021026611328125, -0.16924285888671875, -0.136383056640625, -0.10352325439453125, -0.0706634521484375, -0.03780364990234375, -0.00494384765625, 0.02791595458984375, 0.0607757568359375, 0.09363555908203125, 0.126495361328125, 0.15935516357421875, 0.1922149658203125, 0.22507476806640625, 0.2579345703125, 0.29079437255859375, 0.3236541748046875, 0.35651397705078125, 0.389373779296875, 0.42223358154296875, 0.4550933837890625, 0.48795318603515625, 0.52081298828125, 0.5536727905273438, 0.5865325927734375, 0.6193923950195312, 0.652252197265625, 0.6851119995117188, 0.7179718017578125, 0.7508316040039062, 0.78369140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 5.0, 2.0, 2.0, 11.0, 13.0, 18.0, 17.0, 21.0, 38.0, 42.0, 84.0, 178.0, 416.0, 1310.0, 5040.0, 28594.0, 357703.0, 598704.0, 46570.0, 7055.0, 1680.0, 550.0, 188.0, 109.0, 57.0, 44.0, 30.0, 16.0, 18.0, 9.0, 4.0, 7.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.6363525390625, -5.475830078125, -5.3153076171875, -5.15478515625, -4.9942626953125, -4.833740234375, -4.6732177734375, -4.5126953125, -4.3521728515625, -4.191650390625, -4.0311279296875, -3.87060546875, -3.7100830078125, -3.549560546875, -3.3890380859375, -3.228515625, -3.0679931640625, -2.907470703125, -2.7469482421875, -2.58642578125, -2.4259033203125, -2.265380859375, -2.1048583984375, -1.9443359375, -1.7838134765625, -1.623291015625, -1.4627685546875, -1.30224609375, -1.1417236328125, -0.981201171875, -0.8206787109375, -0.66015625, -0.4996337890625, -0.339111328125, -0.1785888671875, -0.01806640625, 0.1424560546875, 0.302978515625, 0.4635009765625, 0.6240234375, 0.7845458984375, 0.945068359375, 1.1055908203125, 1.26611328125, 1.4266357421875, 1.587158203125, 1.7476806640625, 1.908203125, 2.0687255859375, 2.229248046875, 2.3897705078125, 2.55029296875, 2.7108154296875, 2.871337890625, 3.0318603515625, 3.1923828125, 3.3529052734375, 3.513427734375, 3.6739501953125, 3.83447265625, 3.9949951171875, 4.155517578125, 4.3160400390625, 4.4765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 2.0, 6.0, 7.0, 20.0, 12.0, 20.0, 20.0, 25.0, 26.0, 41.0, 35.0, 64.0, 62.0, 58.0, 59.0, 82.0, 52.0, 64.0, 50.0, 55.0, 42.0, 34.0, 41.0, 23.0, 28.0, 13.0, 13.0, 9.0, 8.0, 4.0, 7.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9140625, -3.80633544921875, -3.6986083984375, -3.59088134765625, -3.483154296875, -3.37542724609375, -3.2677001953125, -3.15997314453125, -3.05224609375, -2.94451904296875, -2.8367919921875, -2.72906494140625, -2.621337890625, -2.51361083984375, -2.4058837890625, -2.29815673828125, -2.1904296875, -2.08270263671875, -1.9749755859375, -1.86724853515625, -1.759521484375, -1.65179443359375, -1.5440673828125, -1.43634033203125, -1.32861328125, -1.22088623046875, -1.1131591796875, -1.00543212890625, -0.897705078125, -0.78997802734375, -0.6822509765625, -0.57452392578125, -0.466796875, -0.35906982421875, -0.2513427734375, -0.14361572265625, -0.035888671875, 0.07183837890625, 0.1795654296875, 0.28729248046875, 0.39501953125, 0.50274658203125, 0.6104736328125, 0.71820068359375, 0.825927734375, 0.93365478515625, 1.0413818359375, 1.14910888671875, 1.2568359375, 1.36456298828125, 1.4722900390625, 1.58001708984375, 1.687744140625, 1.79547119140625, 1.9031982421875, 2.01092529296875, 2.11865234375, 2.22637939453125, 2.3341064453125, 2.44183349609375, 2.549560546875, 2.65728759765625, 2.7650146484375, 2.87274169921875, 2.98046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 15.0, 15.0, 33.0, 46.0, 68.0, 91.0, 183.0, 278.0, 511.0, 873.0, 1735.0, 4011.0, 12334.0, 60832.0, 631520.0, 291449.0, 30587.0, 7873.0, 3050.0, 1338.0, 704.0, 405.0, 201.0, 142.0, 91.0, 58.0, 31.0, 22.0, 11.0, 8.0, 9.0, 7.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6572265625, -1.5997161865234375, -1.542205810546875, -1.4846954345703125, -1.42718505859375, -1.3696746826171875, -1.312164306640625, -1.2546539306640625, -1.1971435546875, -1.1396331787109375, -1.082122802734375, -1.0246124267578125, -0.96710205078125, -0.9095916748046875, -0.852081298828125, -0.7945709228515625, -0.737060546875, -0.6795501708984375, -0.622039794921875, -0.5645294189453125, -0.50701904296875, -0.4495086669921875, -0.391998291015625, -0.3344879150390625, -0.2769775390625, -0.2194671630859375, -0.161956787109375, -0.1044464111328125, -0.04693603515625, 0.0105743408203125, 0.068084716796875, 0.1255950927734375, 0.18310546875, 0.2406158447265625, 0.298126220703125, 0.3556365966796875, 0.41314697265625, 0.4706573486328125, 0.528167724609375, 0.5856781005859375, 0.6431884765625, 0.7006988525390625, 0.758209228515625, 0.8157196044921875, 0.87322998046875, 0.9307403564453125, 0.988250732421875, 1.0457611083984375, 1.103271484375, 1.1607818603515625, 1.218292236328125, 1.2758026123046875, 1.33331298828125, 1.3908233642578125, 1.448333740234375, 1.5058441162109375, 1.5633544921875, 1.6208648681640625, 1.678375244140625, 1.7358856201171875, 1.79339599609375, 1.8509063720703125, 1.908416748046875, 1.9659271240234375, 2.0234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 11.0, 6.0, 5.0, 9.0, 16.0, 26.0, 37.0, 61.0, 77.0, 98.0, 120.0, 119.0, 103.0, 83.0, 73.0, 37.0, 30.0, 23.0, 19.0, 11.0, 10.0, 11.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000232696533203125, -0.00022565945982933044, -0.0002186223864555359, -0.00021158531308174133, -0.00020454823970794678, -0.00019751116633415222, -0.00019047409296035767, -0.0001834370195865631, -0.00017639994621276855, -0.000169362872838974, -0.00016232579946517944, -0.0001552887260913849, -0.00014825165271759033, -0.00014121457934379578, -0.00013417750597000122, -0.00012714043259620667, -0.00012010335922241211, -0.00011306628584861755, -0.000106029212474823, -9.899213910102844e-05, -9.195506572723389e-05, -8.491799235343933e-05, -7.788091897964478e-05, -7.084384560585022e-05, -6.380677223205566e-05, -5.676969885826111e-05, -4.973262548446655e-05, -4.2695552110672e-05, -3.565847873687744e-05, -2.8621405363082886e-05, -2.158433198928833e-05, -1.4547258615493774e-05, -7.510185241699219e-06, -4.731118679046631e-07, 6.563961505889893e-06, 1.3601034879684448e-05, 2.0638108253479004e-05, 2.767518162727356e-05, 3.4712255001068115e-05, 4.174932837486267e-05, 4.8786401748657227e-05, 5.582347512245178e-05, 6.286054849624634e-05, 6.98976218700409e-05, 7.693469524383545e-05, 8.397176861763e-05, 9.100884199142456e-05, 9.804591536521912e-05, 0.00010508298873901367, 0.00011212006211280823, 0.00011915713548660278, 0.00012619420886039734, 0.0001332312822341919, 0.00014026835560798645, 0.000147305428981781, 0.00015434250235557556, 0.00016137957572937012, 0.00016841664910316467, 0.00017545372247695923, 0.00018249079585075378, 0.00018952786922454834, 0.0001965649425983429, 0.00020360201597213745, 0.000210639089345932, 0.00021767616271972656]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 0.0, 3.0, 3.0, 14.0, 11.0, 18.0, 34.0, 60.0, 72.0, 161.0, 397.0, 923.0, 2404.0, 9979.0, 85885.0, 831754.0, 101609.0, 10705.0, 2766.0, 918.0, 384.0, 200.0, 95.0, 57.0, 37.0, 21.0, 11.0, 9.0, 7.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3359375, -2.266265869140625, -2.19659423828125, -2.126922607421875, -2.0572509765625, -1.987579345703125, -1.91790771484375, -1.848236083984375, -1.778564453125, -1.708892822265625, -1.63922119140625, -1.569549560546875, -1.4998779296875, -1.430206298828125, -1.36053466796875, -1.290863037109375, -1.22119140625, -1.151519775390625, -1.08184814453125, -1.012176513671875, -0.9425048828125, -0.872833251953125, -0.80316162109375, -0.733489990234375, -0.663818359375, -0.594146728515625, -0.52447509765625, -0.454803466796875, -0.3851318359375, -0.315460205078125, -0.24578857421875, -0.176116943359375, -0.1064453125, -0.036773681640625, 0.03289794921875, 0.102569580078125, 0.1722412109375, 0.241912841796875, 0.31158447265625, 0.381256103515625, 0.450927734375, 0.520599365234375, 0.59027099609375, 0.659942626953125, 0.7296142578125, 0.799285888671875, 0.86895751953125, 0.938629150390625, 1.00830078125, 1.077972412109375, 1.14764404296875, 1.217315673828125, 1.2869873046875, 1.356658935546875, 1.42633056640625, 1.496002197265625, 1.565673828125, 1.635345458984375, 1.70501708984375, 1.774688720703125, 1.8443603515625, 1.914031982421875, 1.98370361328125, 2.053375244140625, 2.123046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 5.0, 4.0, 4.0, 6.0, 5.0, 11.0, 10.0, 16.0, 26.0, 36.0, 55.0, 55.0, 93.0, 106.0, 126.0, 117.0, 89.0, 65.0, 40.0, 34.0, 19.0, 14.0, 13.0, 16.0, 10.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.705078125, -1.663848876953125, -1.62261962890625, -1.581390380859375, -1.5401611328125, -1.498931884765625, -1.45770263671875, -1.416473388671875, -1.375244140625, -1.334014892578125, -1.29278564453125, -1.251556396484375, -1.2103271484375, -1.169097900390625, -1.12786865234375, -1.086639404296875, -1.04541015625, -1.004180908203125, -0.96295166015625, -0.921722412109375, -0.8804931640625, -0.839263916015625, -0.79803466796875, -0.756805419921875, -0.715576171875, -0.674346923828125, -0.63311767578125, -0.591888427734375, -0.5506591796875, -0.509429931640625, -0.46820068359375, -0.426971435546875, -0.3857421875, -0.344512939453125, -0.30328369140625, -0.262054443359375, -0.2208251953125, -0.179595947265625, -0.13836669921875, -0.097137451171875, -0.055908203125, -0.014678955078125, 0.02655029296875, 0.067779541015625, 0.1090087890625, 0.150238037109375, 0.19146728515625, 0.232696533203125, 0.27392578125, 0.315155029296875, 0.35638427734375, 0.397613525390625, 0.4388427734375, 0.480072021484375, 0.52130126953125, 0.562530517578125, 0.603759765625, 0.644989013671875, 0.68621826171875, 0.727447509765625, 0.7686767578125, 0.809906005859375, 0.85113525390625, 0.892364501953125, 0.93359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 14.0, 35.0, 121.0, 416.0, 326.0, 66.0, 23.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-91.06198120117188, -89.33736419677734, -87.61274719238281, -85.88813018798828, -84.16350555419922, -82.43888854980469, -80.71427154541016, -78.98965454101562, -77.2650375366211, -75.54042053222656, -73.81580352783203, -72.0911865234375, -70.36656188964844, -68.6419448852539, -66.91732788085938, -65.19271087646484, -63.46809387207031, -61.74347686767578, -60.018856048583984, -58.29423904418945, -56.56962203979492, -54.845001220703125, -53.120384216308594, -51.39576721191406, -49.671146392822266, -47.946529388427734, -46.22190856933594, -44.497291564941406, -42.772674560546875, -41.048057556152344, -39.32343673706055, -37.598819732666016, -35.87420654296875, -34.14958953857422, -32.42496871948242, -30.70035171508789, -28.97573471069336, -27.251115798950195, -25.52649688720703, -23.8018798828125, -22.077259063720703, -20.35264015197754, -18.628023147583008, -16.903404235839844, -15.178787231445312, -13.454168319702148, -11.7295503616333, -10.004932403564453, -8.280315399169922, -6.555697441101074, -4.831079483032227, -3.1064610481262207, -1.381843090057373, 0.3427753448486328, 2.0673933029174805, 3.792011260986328, 5.516629219055176, 7.241247177124023, 8.965865135192871, 10.690483093261719, 12.415102005004883, 14.13971996307373, 15.864337921142578, 17.58895492553711, 19.313573837280273]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 9.0, 13.0, 6.0, 14.0, 10.0, 10.0, 16.0, 15.0, 18.0, 30.0, 26.0, 24.0, 21.0, 34.0, 37.0, 46.0, 47.0, 54.0, 43.0, 47.0, 45.0, 33.0, 45.0, 35.0, 31.0, 35.0, 31.0, 24.0, 26.0, 21.0, 20.0, 19.0, 18.0, 16.0, 20.0, 7.0, 14.0, 5.0, 2.0, 5.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.04270076751709, -13.597654342651367, -13.152607917785645, -12.707560539245605, -12.262514114379883, -11.81746768951416, -11.372421264648438, -10.927373886108398, -10.482327461242676, -10.037281036376953, -9.59223461151123, -9.147187232971191, -8.702140808105469, -8.257094383239746, -7.812047958374023, -7.367001056671143, -6.92195463180542, -6.476908206939697, -6.031861305236816, -5.586814880371094, -5.141767978668213, -4.69672155380249, -4.251674652099609, -3.8066282272338867, -3.361581563949585, -2.916534900665283, -2.4714882373809814, -2.0264415740966797, -1.5813950300216675, -1.1363484859466553, -0.6913018226623535, -0.24625515937805176, 0.19879150390625, 0.6438381671905518, 1.0888848304748535, 1.5339313745498657, 1.9789780378341675, 2.4240245819091797, 2.8690712451934814, 3.314117908477783, 3.759164571762085, 4.204211235046387, 4.649257659912109, 5.09430456161499, 5.539350986480713, 5.984397888183594, 6.429444313049316, 6.874490737915039, 7.31953763961792, 7.764584064483643, 8.209630966186523, 8.654677391052246, 9.099723815917969, 9.544771194458008, 9.98981761932373, 10.434864044189453, 10.879910469055176, 11.324956893920898, 11.770003318786621, 12.21505069732666, 12.660097122192383, 13.105143547058105, 13.550189971923828, 13.995237350463867, 14.44028377532959]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 9.0, 8.0, 10.0, 13.0, 25.0, 37.0, 51.0, 49.0, 93.0, 172.0, 208.0, 345.0, 535.0, 865.0, 1463.0, 2816.0, 5977.0, 15719.0, 55540.0, 426917.0, 3486366.0, 148085.0, 30406.0, 9903.0, 3970.0, 1937.0, 1077.0, 584.0, 392.0, 211.0, 149.0, 89.0, 76.0, 54.0, 22.0, 18.0, 17.0, 15.0, 10.0, 10.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-4.64453125, -4.509033203125, -4.37353515625, -4.238037109375, -4.1025390625, -3.967041015625, -3.83154296875, -3.696044921875, -3.560546875, -3.425048828125, -3.28955078125, -3.154052734375, -3.0185546875, -2.883056640625, -2.74755859375, -2.612060546875, -2.4765625, -2.341064453125, -2.20556640625, -2.070068359375, -1.9345703125, -1.799072265625, -1.66357421875, -1.528076171875, -1.392578125, -1.257080078125, -1.12158203125, -0.986083984375, -0.8505859375, -0.715087890625, -0.57958984375, -0.444091796875, -0.30859375, -0.173095703125, -0.03759765625, 0.097900390625, 0.2333984375, 0.368896484375, 0.50439453125, 0.639892578125, 0.775390625, 0.910888671875, 1.04638671875, 1.181884765625, 1.3173828125, 1.452880859375, 1.58837890625, 1.723876953125, 1.859375, 1.994873046875, 2.13037109375, 2.265869140625, 2.4013671875, 2.536865234375, 2.67236328125, 2.807861328125, 2.943359375, 3.078857421875, 3.21435546875, 3.349853515625, 3.4853515625, 3.620849609375, 3.75634765625, 3.891845703125, 4.02734375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 13.0, 17.0, 22.0, 19.0, 25.0, 38.0, 45.0, 51.0, 59.0, 70.0, 66.0, 73.0, 74.0, 68.0, 60.0, 56.0, 47.0, 44.0, 24.0, 33.0, 19.0, 19.0, 12.0, 17.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.022125244140625, -0.99346923828125, -0.964813232421875, -0.9361572265625, -0.907501220703125, -0.87884521484375, -0.850189208984375, -0.821533203125, -0.792877197265625, -0.76422119140625, -0.735565185546875, -0.7069091796875, -0.678253173828125, -0.64959716796875, -0.620941162109375, -0.59228515625, -0.563629150390625, -0.53497314453125, -0.506317138671875, -0.4776611328125, -0.449005126953125, -0.42034912109375, -0.391693115234375, -0.363037109375, -0.334381103515625, -0.30572509765625, -0.277069091796875, -0.2484130859375, -0.219757080078125, -0.19110107421875, -0.162445068359375, -0.1337890625, -0.105133056640625, -0.07647705078125, -0.047821044921875, -0.0191650390625, 0.009490966796875, 0.03814697265625, 0.066802978515625, 0.095458984375, 0.124114990234375, 0.15277099609375, 0.181427001953125, 0.2100830078125, 0.238739013671875, 0.26739501953125, 0.296051025390625, 0.32470703125, 0.353363037109375, 0.38201904296875, 0.410675048828125, 0.4393310546875, 0.467987060546875, 0.49664306640625, 0.525299072265625, 0.553955078125, 0.582611083984375, 0.61126708984375, 0.639923095703125, 0.6685791015625, 0.697235107421875, 0.72589111328125, 0.754547119140625, 0.783203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 0.0, 8.0, 7.0, 9.0, 10.0, 16.0, 18.0, 28.0, 59.0, 88.0, 106.0, 216.0, 346.0, 640.0, 1396.0, 3592.0, 12345.0, 75561.0, 3682197.0, 378288.0, 27736.0, 6832.0, 2441.0, 1060.0, 522.0, 299.0, 168.0, 90.0, 62.0, 57.0, 21.0, 14.0, 19.0, 11.0, 5.0, 6.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-6.5546875, -6.3660888671875, -6.177490234375, -5.9888916015625, -5.80029296875, -5.6116943359375, -5.423095703125, -5.2344970703125, -5.0458984375, -4.8572998046875, -4.668701171875, -4.4801025390625, -4.29150390625, -4.1029052734375, -3.914306640625, -3.7257080078125, -3.537109375, -3.3485107421875, -3.159912109375, -2.9713134765625, -2.78271484375, -2.5941162109375, -2.405517578125, -2.2169189453125, -2.0283203125, -1.8397216796875, -1.651123046875, -1.4625244140625, -1.27392578125, -1.0853271484375, -0.896728515625, -0.7081298828125, -0.51953125, -0.3309326171875, -0.142333984375, 0.0462646484375, 0.23486328125, 0.4234619140625, 0.612060546875, 0.8006591796875, 0.9892578125, 1.1778564453125, 1.366455078125, 1.5550537109375, 1.74365234375, 1.9322509765625, 2.120849609375, 2.3094482421875, 2.498046875, 2.6866455078125, 2.875244140625, 3.0638427734375, 3.25244140625, 3.4410400390625, 3.629638671875, 3.8182373046875, 4.0068359375, 4.1954345703125, 4.384033203125, 4.5726318359375, 4.76123046875, 4.9498291015625, 5.138427734375, 5.3270263671875, 5.515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 8.0, 7.0, 14.0, 20.0, 36.0, 40.0, 79.0, 150.0, 395.0, 1930.0, 830.0, 254.0, 127.0, 57.0, 42.0, 20.0, 17.0, 12.0, 6.0, 6.0, 7.0, 6.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.537109375, -2.45965576171875, -2.3822021484375, -2.30474853515625, -2.227294921875, -2.14984130859375, -2.0723876953125, -1.99493408203125, -1.91748046875, -1.84002685546875, -1.7625732421875, -1.68511962890625, -1.607666015625, -1.53021240234375, -1.4527587890625, -1.37530517578125, -1.2978515625, -1.22039794921875, -1.1429443359375, -1.06549072265625, -0.988037109375, -0.91058349609375, -0.8331298828125, -0.75567626953125, -0.67822265625, -0.60076904296875, -0.5233154296875, -0.44586181640625, -0.368408203125, -0.29095458984375, -0.2135009765625, -0.13604736328125, -0.05859375, 0.01885986328125, 0.0963134765625, 0.17376708984375, 0.251220703125, 0.32867431640625, 0.4061279296875, 0.48358154296875, 0.56103515625, 0.63848876953125, 0.7159423828125, 0.79339599609375, 0.870849609375, 0.94830322265625, 1.0257568359375, 1.10321044921875, 1.1806640625, 1.25811767578125, 1.3355712890625, 1.41302490234375, 1.490478515625, 1.56793212890625, 1.6453857421875, 1.72283935546875, 1.80029296875, 1.87774658203125, 1.9552001953125, 2.03265380859375, 2.110107421875, 2.18756103515625, 2.2650146484375, 2.34246826171875, 2.419921875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 15.0, 101.0, 531.0, 309.0, 38.0, 11.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.5164794921875, -26.19165802001953, -24.866838455200195, -23.542016983032227, -22.21719741821289, -20.892375946044922, -19.567554473876953, -18.242733001708984, -16.91791343688965, -15.593092918395996, -14.268272399902344, -12.943450927734375, -11.618630409240723, -10.29380989074707, -8.968988418579102, -7.644167900085449, -6.319347381591797, -4.9945268630981445, -3.669705867767334, -2.3448851108551025, -1.020064353942871, 0.30475616455078125, 1.6295771598815918, 2.9543981552124023, 4.279218673706055, 5.604039192199707, 6.928860187530518, 8.253681182861328, 9.57850170135498, 10.903322219848633, 12.228143692016602, 13.552964210510254, 14.87778091430664, 16.20260238647461, 17.527421951293945, 18.852243423461914, 20.17706298828125, 21.50188446044922, 22.826705932617188, 24.151527404785156, 25.476346969604492, 26.80116844177246, 28.125988006591797, 29.450809478759766, 30.775630950927734, 32.10044860839844, 33.425270080566406, 34.750091552734375, 36.074913024902344, 37.39973449707031, 38.72455596923828, 40.049373626708984, 41.37419509887695, 42.69901657104492, 44.02383804321289, 45.34865951538086, 46.67347717285156, 47.99829864501953, 49.3231201171875, 50.6479377746582, 51.97275924682617, 53.29758071899414, 54.62240219116211, 55.94722366333008, 57.27204513549805]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 11.0, 13.0, 19.0, 38.0, 35.0, 33.0, 55.0, 52.0, 51.0, 59.0, 85.0, 70.0, 66.0, 72.0, 59.0, 64.0, 58.0, 43.0, 28.0, 26.0, 20.0, 16.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.112067222595215, -8.796167373657227, -8.480266571044922, -8.164366722106934, -7.848465919494629, -7.532566070556641, -7.216665744781494, -6.900765419006348, -6.584865093231201, -6.268964767456055, -5.953064441680908, -5.637164115905762, -5.321264266967773, -5.005363464355469, -4.6894636154174805, -4.373563289642334, -4.0576629638671875, -3.741762638092041, -3.4258623123168945, -3.109962224960327, -2.7940618991851807, -2.478161573410034, -2.162261486053467, -1.8463611602783203, -1.5304608345031738, -1.2145605087280273, -0.8986603021621704, -0.5827600359916687, -0.266859769821167, 0.04904055595397949, 0.3649407625198364, 0.6808409690856934, 0.9967422485351562, 1.3126425743103027, 1.6285427808761597, 1.9444429874420166, 2.260343313217163, 2.5762436389923096, 2.892143726348877, 3.2080440521240234, 3.52394437789917, 3.8398447036743164, 4.155745029449463, 4.471645355224609, 4.787545204162598, 5.103446006774902, 5.419345855712891, 5.735246181488037, 6.051146507263184, 6.36704683303833, 6.682947158813477, 6.998847484588623, 7.3147478103637695, 7.630647659301758, 7.946547985076904, 8.26244831085205, 8.578348159790039, 8.894248008728027, 9.210148811340332, 9.52604866027832, 9.841949462890625, 10.157849311828613, 10.473750114440918, 10.789649963378906, 11.105550765991211]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 6.0, 9.0, 20.0, 24.0, 34.0, 44.0, 68.0, 85.0, 141.0, 166.0, 257.0, 469.0, 806.0, 1757.0, 3754.0, 9668.0, 29123.0, 105182.0, 409492.0, 357590.0, 88839.0, 25413.0, 8628.0, 3346.0, 1549.0, 831.0, 414.0, 278.0, 141.0, 117.0, 80.0, 55.0, 51.0, 26.0, 29.0, 9.0, 11.0, 12.0, 5.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.078125, -2.975311279296875, -2.87249755859375, -2.769683837890625, -2.6668701171875, -2.564056396484375, -2.46124267578125, -2.358428955078125, -2.255615234375, -2.152801513671875, -2.04998779296875, -1.947174072265625, -1.8443603515625, -1.741546630859375, -1.63873291015625, -1.535919189453125, -1.43310546875, -1.330291748046875, -1.22747802734375, -1.124664306640625, -1.0218505859375, -0.919036865234375, -0.81622314453125, -0.713409423828125, -0.610595703125, -0.507781982421875, -0.40496826171875, -0.302154541015625, -0.1993408203125, -0.096527099609375, 0.00628662109375, 0.109100341796875, 0.2119140625, 0.314727783203125, 0.41754150390625, 0.520355224609375, 0.6231689453125, 0.725982666015625, 0.82879638671875, 0.931610107421875, 1.034423828125, 1.137237548828125, 1.24005126953125, 1.342864990234375, 1.4456787109375, 1.548492431640625, 1.65130615234375, 1.754119873046875, 1.85693359375, 1.959747314453125, 2.06256103515625, 2.165374755859375, 2.2681884765625, 2.371002197265625, 2.47381591796875, 2.576629638671875, 2.679443359375, 2.782257080078125, 2.88507080078125, 2.987884521484375, 3.0906982421875, 3.193511962890625, 3.29632568359375, 3.399139404296875, 3.501953125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 5.0, 6.0, 10.0, 30.0, 25.0, 36.0, 57.0, 64.0, 78.0, 78.0, 89.0, 84.0, 89.0, 75.0, 75.0, 58.0, 46.0, 30.0, 24.0, 13.0, 9.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1326751708984375, -1.096405029296875, -1.0601348876953125, -1.02386474609375, -0.9875946044921875, -0.951324462890625, -0.9150543212890625, -0.8787841796875, -0.8425140380859375, -0.806243896484375, -0.7699737548828125, -0.73370361328125, -0.6974334716796875, -0.661163330078125, -0.6248931884765625, -0.588623046875, -0.5523529052734375, -0.516082763671875, -0.4798126220703125, -0.44354248046875, -0.4072723388671875, -0.371002197265625, -0.3347320556640625, -0.2984619140625, -0.2621917724609375, -0.225921630859375, -0.1896514892578125, -0.15338134765625, -0.1171112060546875, -0.080841064453125, -0.0445709228515625, -0.00830078125, 0.0279693603515625, 0.064239501953125, 0.1005096435546875, 0.13677978515625, 0.1730499267578125, 0.209320068359375, 0.2455902099609375, 0.2818603515625, 0.3181304931640625, 0.354400634765625, 0.3906707763671875, 0.42694091796875, 0.4632110595703125, 0.499481201171875, 0.5357513427734375, 0.572021484375, 0.6082916259765625, 0.644561767578125, 0.6808319091796875, 0.71710205078125, 0.7533721923828125, 0.789642333984375, 0.8259124755859375, 0.8621826171875, 0.8984527587890625, 0.934722900390625, 0.9709930419921875, 1.00726318359375, 1.0435333251953125, 1.079803466796875, 1.1160736083984375, 1.15234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 16.0, 16.0, 30.0, 64.0, 94.0, 159.0, 288.0, 591.0, 1074.0, 2302.0, 5080.0, 11643.0, 28399.0, 76855.0, 237427.0, 419288.0, 169487.0, 56937.0, 21669.0, 9153.0, 3991.0, 1900.0, 908.0, 491.0, 267.0, 160.0, 81.0, 56.0, 37.0, 18.0, 15.0, 15.0, 6.0, 7.0, 5.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.53125, -2.45965576171875, -2.3880615234375, -2.31646728515625, -2.244873046875, -2.17327880859375, -2.1016845703125, -2.03009033203125, -1.95849609375, -1.88690185546875, -1.8153076171875, -1.74371337890625, -1.672119140625, -1.60052490234375, -1.5289306640625, -1.45733642578125, -1.3857421875, -1.31414794921875, -1.2425537109375, -1.17095947265625, -1.099365234375, -1.02777099609375, -0.9561767578125, -0.88458251953125, -0.81298828125, -0.74139404296875, -0.6697998046875, -0.59820556640625, -0.526611328125, -0.45501708984375, -0.3834228515625, -0.31182861328125, -0.240234375, -0.16864013671875, -0.0970458984375, -0.02545166015625, 0.046142578125, 0.11773681640625, 0.1893310546875, 0.26092529296875, 0.33251953125, 0.40411376953125, 0.4757080078125, 0.54730224609375, 0.618896484375, 0.69049072265625, 0.7620849609375, 0.83367919921875, 0.9052734375, 0.97686767578125, 1.0484619140625, 1.12005615234375, 1.191650390625, 1.26324462890625, 1.3348388671875, 1.40643310546875, 1.47802734375, 1.54962158203125, 1.6212158203125, 1.69281005859375, 1.764404296875, 1.83599853515625, 1.9075927734375, 1.97918701171875, 2.05078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 7.0, 5.0, 8.0, 8.0, 11.0, 16.0, 18.0, 24.0, 17.0, 18.0, 21.0, 30.0, 29.0, 49.0, 37.0, 29.0, 40.0, 32.0, 35.0, 40.0, 51.0, 44.0, 38.0, 41.0, 40.0, 34.0, 39.0, 29.0, 30.0, 20.0, 20.0, 19.0, 19.0, 17.0, 18.0, 13.0, 8.0, 6.0, 5.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-2.75390625, -2.675018310546875, -2.59613037109375, -2.517242431640625, -2.4383544921875, -2.359466552734375, -2.28057861328125, -2.201690673828125, -2.122802734375, -2.043914794921875, -1.96502685546875, -1.886138916015625, -1.8072509765625, -1.728363037109375, -1.64947509765625, -1.570587158203125, -1.49169921875, -1.412811279296875, -1.33392333984375, -1.255035400390625, -1.1761474609375, -1.097259521484375, -1.01837158203125, -0.939483642578125, -0.860595703125, -0.781707763671875, -0.70281982421875, -0.623931884765625, -0.5450439453125, -0.466156005859375, -0.38726806640625, -0.308380126953125, -0.2294921875, -0.150604248046875, -0.07171630859375, 0.007171630859375, 0.0860595703125, 0.164947509765625, 0.24383544921875, 0.322723388671875, 0.401611328125, 0.480499267578125, 0.55938720703125, 0.638275146484375, 0.7171630859375, 0.796051025390625, 0.87493896484375, 0.953826904296875, 1.03271484375, 1.111602783203125, 1.19049072265625, 1.269378662109375, 1.3482666015625, 1.427154541015625, 1.50604248046875, 1.584930419921875, 1.663818359375, 1.742706298828125, 1.82159423828125, 1.900482177734375, 1.9793701171875, 2.058258056640625, 2.13714599609375, 2.216033935546875, 2.294921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 4.0, 10.0, 9.0, 17.0, 42.0, 69.0, 125.0, 244.0, 546.0, 1375.0, 3948.0, 14469.0, 304426.0, 693058.0, 22144.0, 5013.0, 1787.0, 677.0, 265.0, 148.0, 64.0, 46.0, 12.0, 18.0, 11.0, 7.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.60546875, -2.49273681640625, -2.3800048828125, -2.26727294921875, -2.154541015625, -2.04180908203125, -1.9290771484375, -1.81634521484375, -1.70361328125, -1.59088134765625, -1.4781494140625, -1.36541748046875, -1.252685546875, -1.13995361328125, -1.0272216796875, -0.91448974609375, -0.8017578125, -0.68902587890625, -0.5762939453125, -0.46356201171875, -0.350830078125, -0.23809814453125, -0.1253662109375, -0.01263427734375, 0.10009765625, 0.21282958984375, 0.3255615234375, 0.43829345703125, 0.551025390625, 0.66375732421875, 0.7764892578125, 0.88922119140625, 1.001953125, 1.11468505859375, 1.2274169921875, 1.34014892578125, 1.452880859375, 1.56561279296875, 1.6783447265625, 1.79107666015625, 1.90380859375, 2.01654052734375, 2.1292724609375, 2.24200439453125, 2.354736328125, 2.46746826171875, 2.5802001953125, 2.69293212890625, 2.8056640625, 2.91839599609375, 3.0311279296875, 3.14385986328125, 3.256591796875, 3.36932373046875, 3.4820556640625, 3.59478759765625, 3.70751953125, 3.82025146484375, 3.9329833984375, 4.04571533203125, 4.158447265625, 4.27117919921875, 4.3839111328125, 4.49664306640625, 4.609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 7.0, 8.0, 17.0, 17.0, 23.0, 39.0, 34.0, 67.0, 91.0, 127.0, 159.0, 122.0, 73.0, 65.0, 51.0, 24.0, 22.0, 14.0, 10.0, 5.0, 5.0, 5.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00031566619873046875, -0.00030676648020744324, -0.0002978667616844177, -0.0002889670431613922, -0.0002800673246383667, -0.0002711676061153412, -0.0002622678875923157, -0.00025336816906929016, -0.00024446845054626465, -0.00023556873202323914, -0.00022666901350021362, -0.0002177692949771881, -0.0002088695764541626, -0.00019996985793113708, -0.00019107013940811157, -0.00018217042088508606, -0.00017327070236206055, -0.00016437098383903503, -0.00015547126531600952, -0.000146571546792984, -0.0001376718282699585, -0.00012877210974693298, -0.00011987239122390747, -0.00011097267270088196, -0.00010207295417785645, -9.317323565483093e-05, -8.427351713180542e-05, -7.537379860877991e-05, -6.64740800857544e-05, -5.757436156272888e-05, -4.867464303970337e-05, -3.9774924516677856e-05, -3.0875205993652344e-05, -2.197548747062683e-05, -1.3075768947601318e-05, -4.176050424575806e-06, 4.723668098449707e-06, 1.362338662147522e-05, 2.2523105144500732e-05, 3.1422823667526245e-05, 4.032254219055176e-05, 4.922226071357727e-05, 5.812197923660278e-05, 6.70216977596283e-05, 7.592141628265381e-05, 8.482113480567932e-05, 9.372085332870483e-05, 0.00010262057185173035, 0.00011152029037475586, 0.00012042000889778137, 0.00012931972742080688, 0.0001382194459438324, 0.0001471191644668579, 0.00015601888298988342, 0.00016491860151290894, 0.00017381832003593445, 0.00018271803855895996, 0.00019161775708198547, 0.00020051747560501099, 0.0002094171941280365, 0.000218316912651062, 0.00022721663117408752, 0.00023611634969711304, 0.00024501606822013855, 0.00025391578674316406]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 11.0, 22.0, 32.0, 81.0, 177.0, 486.0, 1476.0, 6146.0, 272033.0, 756890.0, 8452.0, 1807.0, 544.0, 216.0, 85.0, 39.0, 20.0, 16.0, 8.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.10760498046875, -4.9378662109375, -4.76812744140625, -4.598388671875, -4.42864990234375, -4.2589111328125, -4.08917236328125, -3.91943359375, -3.74969482421875, -3.5799560546875, -3.41021728515625, -3.240478515625, -3.07073974609375, -2.9010009765625, -2.73126220703125, -2.5615234375, -2.39178466796875, -2.2220458984375, -2.05230712890625, -1.882568359375, -1.71282958984375, -1.5430908203125, -1.37335205078125, -1.20361328125, -1.03387451171875, -0.8641357421875, -0.69439697265625, -0.524658203125, -0.35491943359375, -0.1851806640625, -0.01544189453125, 0.154296875, 0.32403564453125, 0.4937744140625, 0.66351318359375, 0.833251953125, 1.00299072265625, 1.1727294921875, 1.34246826171875, 1.51220703125, 1.68194580078125, 1.8516845703125, 2.02142333984375, 2.191162109375, 2.36090087890625, 2.5306396484375, 2.70037841796875, 2.8701171875, 3.03985595703125, 3.2095947265625, 3.37933349609375, 3.549072265625, 3.71881103515625, 3.8885498046875, 4.05828857421875, 4.22802734375, 4.39776611328125, 4.5675048828125, 4.73724365234375, 4.906982421875, 5.07672119140625, 5.2464599609375, 5.41619873046875, 5.5859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 17.0, 21.0, 60.0, 110.0, 167.0, 181.0, 155.0, 120.0, 63.0, 22.0, 18.0, 11.0, 8.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.464599609375, -2.38623046875, -2.307861328125, -2.2294921875, -2.151123046875, -2.07275390625, -1.994384765625, -1.916015625, -1.837646484375, -1.75927734375, -1.680908203125, -1.6025390625, -1.524169921875, -1.44580078125, -1.367431640625, -1.2890625, -1.210693359375, -1.13232421875, -1.053955078125, -0.9755859375, -0.897216796875, -0.81884765625, -0.740478515625, -0.662109375, -0.583740234375, -0.50537109375, -0.427001953125, -0.3486328125, -0.270263671875, -0.19189453125, -0.113525390625, -0.03515625, 0.043212890625, 0.12158203125, 0.199951171875, 0.2783203125, 0.356689453125, 0.43505859375, 0.513427734375, 0.591796875, 0.670166015625, 0.74853515625, 0.826904296875, 0.9052734375, 0.983642578125, 1.06201171875, 1.140380859375, 1.21875, 1.297119140625, 1.37548828125, 1.453857421875, 1.5322265625, 1.610595703125, 1.68896484375, 1.767333984375, 1.845703125, 1.924072265625, 2.00244140625, 2.080810546875, 2.1591796875, 2.237548828125, 2.31591796875, 2.394287109375, 2.47265625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 9.0, 29.0, 194.0, 581.0, 162.0, 33.0, 5.0, 4.0, 1.0, 1.0, 1.0], "bins": [-149.15074157714844, -146.50848388671875, -143.8662109375, -141.2239532470703, -138.58169555664062, -135.93942260742188, -133.2971649169922, -130.6549072265625, -128.01263427734375, -125.37036895751953, -122.72811126708984, -120.08584594726562, -117.4435806274414, -114.80132293701172, -112.1590576171875, -109.51679992675781, -106.87454223632812, -104.2322769165039, -101.59001922607422, -98.94775390625, -96.30548858642578, -93.6632308959961, -91.02096557617188, -88.37870788574219, -85.73643493652344, -83.09416961669922, -80.45191192626953, -77.80964660644531, -75.1673812866211, -72.5251235961914, -69.88285827636719, -67.2406005859375, -64.59834289550781, -61.95608139038086, -59.31381607055664, -56.67155456542969, -54.029293060302734, -51.38703155517578, -48.74476623535156, -46.10250473022461, -43.46023941040039, -40.81797790527344, -38.17571258544922, -35.533451080322266, -32.89118957519531, -30.248926162719727, -27.60666275024414, -24.964401245117188, -22.3221378326416, -19.679874420166016, -17.037612915039062, -14.395349502563477, -11.753087043762207, -9.110824584960938, -6.468561172485352, -3.8262996673583984, -1.1840362548828125, 1.4582264423370361, 4.100489139556885, 6.7427520751953125, 9.385014533996582, 12.027276992797852, 14.669540405273438, 17.31180191040039, 19.954065322875977]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 4.0, 8.0, 10.0, 12.0, 11.0, 19.0, 17.0, 16.0, 20.0, 23.0, 29.0, 35.0, 38.0, 30.0, 53.0, 42.0, 42.0, 51.0, 55.0, 54.0, 39.0, 33.0, 34.0, 55.0, 29.0, 34.0, 20.0, 40.0, 25.0, 21.0, 19.0, 16.0, 11.0, 16.0, 13.0, 4.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.751077651977539, -15.216961860656738, -14.682846069335938, -14.148731231689453, -13.614615440368652, -13.080499649047852, -12.546384811401367, -12.012269020080566, -11.478153228759766, -10.944037437438965, -10.409921646118164, -9.87580680847168, -9.341691017150879, -8.807575225830078, -8.273460388183594, -7.739344596862793, -7.205228805541992, -6.671113014221191, -6.136997699737549, -5.602882385253906, -5.0687665939331055, -4.534650802612305, -4.000535488128662, -3.4664199352264404, -2.9323043823242188, -2.398188829421997, -1.8640732765197754, -1.3299577236175537, -0.795842170715332, -0.26172661781311035, 0.27238893508911133, 0.806504487991333, 1.3406219482421875, 1.8747375011444092, 2.408853054046631, 2.9429686069488525, 3.477084159851074, 4.011199951171875, 4.545315265655518, 5.07943058013916, 5.613546371459961, 6.147662162780762, 6.681777477264404, 7.215892791748047, 7.750008583068848, 8.284124374389648, 8.818239212036133, 9.352355003356934, 9.886470794677734, 10.420586585998535, 10.954702377319336, 11.48881721496582, 12.022933006286621, 12.557048797607422, 13.091163635253906, 13.625279426574707, 14.159395217895508, 14.693511009216309, 15.22762680053711, 15.761741638183594, 16.295856475830078, 16.829973220825195, 17.36408805847168, 17.898204803466797, 18.43231964111328]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 7.0, 5.0, 6.0, 15.0, 16.0, 14.0, 37.0, 47.0, 48.0, 79.0, 133.0, 222.0, 332.0, 689.0, 1437.0, 3308.0, 9112.0, 35210.0, 327622.0, 3698642.0, 90891.0, 16615.0, 5160.0, 2110.0, 1011.0, 568.0, 303.0, 190.0, 115.0, 96.0, 73.0, 47.0, 27.0, 34.0, 16.0, 14.0, 13.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.41796875, -3.3011474609375, -3.184326171875, -3.0675048828125, -2.95068359375, -2.8338623046875, -2.717041015625, -2.6002197265625, -2.4833984375, -2.3665771484375, -2.249755859375, -2.1329345703125, -2.01611328125, -1.8992919921875, -1.782470703125, -1.6656494140625, -1.548828125, -1.4320068359375, -1.315185546875, -1.1983642578125, -1.08154296875, -0.9647216796875, -0.847900390625, -0.7310791015625, -0.6142578125, -0.4974365234375, -0.380615234375, -0.2637939453125, -0.14697265625, -0.0301513671875, 0.086669921875, 0.2034912109375, 0.3203125, 0.4371337890625, 0.553955078125, 0.6707763671875, 0.78759765625, 0.9044189453125, 1.021240234375, 1.1380615234375, 1.2548828125, 1.3717041015625, 1.488525390625, 1.6053466796875, 1.72216796875, 1.8389892578125, 1.955810546875, 2.0726318359375, 2.189453125, 2.3062744140625, 2.423095703125, 2.5399169921875, 2.65673828125, 2.7735595703125, 2.890380859375, 3.0072021484375, 3.1240234375, 3.2408447265625, 3.357666015625, 3.4744873046875, 3.59130859375, 3.7081298828125, 3.824951171875, 3.9417724609375, 4.05859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 9.0, 16.0, 20.0, 25.0, 29.0, 26.0, 36.0, 59.0, 67.0, 63.0, 70.0, 77.0, 71.0, 88.0, 79.0, 49.0, 55.0, 39.0, 33.0, 29.0, 18.0, 8.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.1247711181640625, -1.090362548828125, -1.0559539794921875, -1.02154541015625, -0.9871368408203125, -0.952728271484375, -0.9183197021484375, -0.8839111328125, -0.8495025634765625, -0.815093994140625, -0.7806854248046875, -0.74627685546875, -0.7118682861328125, -0.677459716796875, -0.6430511474609375, -0.608642578125, -0.5742340087890625, -0.539825439453125, -0.5054168701171875, -0.47100830078125, -0.4365997314453125, -0.402191162109375, -0.3677825927734375, -0.3333740234375, -0.2989654541015625, -0.264556884765625, -0.2301483154296875, -0.19573974609375, -0.1613311767578125, -0.126922607421875, -0.0925140380859375, -0.05810546875, -0.0236968994140625, 0.010711669921875, 0.0451202392578125, 0.07952880859375, 0.1139373779296875, 0.148345947265625, 0.1827545166015625, 0.2171630859375, 0.2515716552734375, 0.285980224609375, 0.3203887939453125, 0.35479736328125, 0.3892059326171875, 0.423614501953125, 0.4580230712890625, 0.492431640625, 0.5268402099609375, 0.561248779296875, 0.5956573486328125, 0.63006591796875, 0.6644744873046875, 0.698883056640625, 0.7332916259765625, 0.7677001953125, 0.8021087646484375, 0.836517333984375, 0.8709259033203125, 0.90533447265625, 0.9397430419921875, 0.974151611328125, 1.0085601806640625, 1.04296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 5.0, 11.0, 25.0, 30.0, 48.0, 66.0, 130.0, 198.0, 433.0, 1981.0, 40759.0, 4122613.0, 25496.0, 1554.0, 423.0, 214.0, 122.0, 74.0, 38.0, 32.0, 15.0, 12.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59375, -5.231689453125, -4.86962890625, -4.507568359375, -4.1455078125, -3.783447265625, -3.42138671875, -3.059326171875, -2.697265625, -2.335205078125, -1.97314453125, -1.611083984375, -1.2490234375, -0.886962890625, -0.52490234375, -0.162841796875, 0.19921875, 0.561279296875, 0.92333984375, 1.285400390625, 1.6474609375, 2.009521484375, 2.37158203125, 2.733642578125, 3.095703125, 3.457763671875, 3.81982421875, 4.181884765625, 4.5439453125, 4.906005859375, 5.26806640625, 5.630126953125, 5.9921875, 6.354248046875, 6.71630859375, 7.078369140625, 7.4404296875, 7.802490234375, 8.16455078125, 8.526611328125, 8.888671875, 9.250732421875, 9.61279296875, 9.974853515625, 10.3369140625, 10.698974609375, 11.06103515625, 11.423095703125, 11.78515625, 12.147216796875, 12.50927734375, 12.871337890625, 13.2333984375, 13.595458984375, 13.95751953125, 14.319580078125, 14.681640625, 15.043701171875, 15.40576171875, 15.767822265625, 16.1298828125, 16.491943359375, 16.85400390625, 17.216064453125, 17.578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 13.0, 17.0, 39.0, 76.0, 191.0, 1308.0, 2010.0, 255.0, 84.0, 41.0, 13.0, 11.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.2664794921875, -2.179443359375, -2.0924072265625, -2.00537109375, -1.9183349609375, -1.831298828125, -1.7442626953125, -1.6572265625, -1.5701904296875, -1.483154296875, -1.3961181640625, -1.30908203125, -1.2220458984375, -1.135009765625, -1.0479736328125, -0.9609375, -0.8739013671875, -0.786865234375, -0.6998291015625, -0.61279296875, -0.5257568359375, -0.438720703125, -0.3516845703125, -0.2646484375, -0.1776123046875, -0.090576171875, -0.0035400390625, 0.08349609375, 0.1705322265625, 0.257568359375, 0.3446044921875, 0.431640625, 0.5186767578125, 0.605712890625, 0.6927490234375, 0.77978515625, 0.8668212890625, 0.953857421875, 1.0408935546875, 1.1279296875, 1.2149658203125, 1.302001953125, 1.3890380859375, 1.47607421875, 1.5631103515625, 1.650146484375, 1.7371826171875, 1.82421875, 1.9112548828125, 1.998291015625, 2.0853271484375, 2.17236328125, 2.2593994140625, 2.346435546875, 2.4334716796875, 2.5205078125, 2.6075439453125, 2.694580078125, 2.7816162109375, 2.86865234375, 2.9556884765625, 3.042724609375, 3.1297607421875, 3.216796875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 10.0, 23.0, 88.0, 304.0, 354.0, 156.0, 50.0, 15.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.165985107421875, -20.46157455444336, -19.757165908813477, -19.05275535583496, -18.348344802856445, -17.643936157226562, -16.939525604248047, -16.23511505126953, -15.530705451965332, -14.826295852661133, -14.121885299682617, -13.417475700378418, -12.713066101074219, -12.008655548095703, -11.304245948791504, -10.599836349487305, -9.895425796508789, -9.19101619720459, -8.486605644226074, -7.782196044921875, -7.077785968780518, -6.37337589263916, -5.668966293334961, -4.9645562171936035, -4.260146141052246, -3.5557360649108887, -2.8513262271881104, -2.146916389465332, -1.4425063133239746, -0.7380962371826172, -0.03368663787841797, 0.6707234382629395, 1.3751335144042969, 2.0795435905456543, 2.7839534282684326, 3.488363265991211, 4.192773342132568, 4.897183418273926, 5.601593017578125, 6.306003093719482, 7.01041316986084, 7.714823246002197, 8.419233322143555, 9.123642921447754, 9.828052520751953, 10.532463073730469, 11.236872673034668, 11.941282272338867, 12.645692825317383, 13.350102424621582, 14.054512977600098, 14.758922576904297, 15.463333129882812, 16.167743682861328, 16.87215232849121, 17.576562881469727, 18.28097152709961, 18.985382080078125, 19.689790725708008, 20.394201278686523, 21.09861183166504, 21.803020477294922, 22.507431030273438, 23.211841583251953, 23.91625213623047]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 1.0, 5.0, 4.0, 19.0, 13.0, 24.0, 17.0, 29.0, 33.0, 46.0, 66.0, 60.0, 64.0, 61.0, 71.0, 65.0, 67.0, 59.0, 68.0, 60.0, 38.0, 35.0, 23.0, 16.0, 21.0, 8.0, 7.0, 5.0, 5.0, 9.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.95045280456543, -5.712652206420898, -5.474851608276367, -5.237051010131836, -4.999250411987305, -4.761449813842773, -4.523649215698242, -4.285848617553711, -4.04804801940918, -3.8102474212646484, -3.572446823120117, -3.334646224975586, -3.0968456268310547, -2.8590450286865234, -2.6212446689605713, -2.38344407081604, -2.145643711090088, -1.9078431129455566, -1.6700425148010254, -1.4322420358657837, -1.1944414377212524, -0.9566408395767212, -0.7188403606414795, -0.48103976249694824, -0.243239164352417, -0.00543859601020813, 0.23236197233200073, 0.4701625108718872, 0.7079631090164185, 0.9457637071609497, 1.1835641860961914, 1.4213647842407227, 1.659165382385254, 1.8969659805297852, 2.1347665786743164, 2.3725671768188477, 2.610367774963379, 2.84816837310791, 3.0859687328338623, 3.3237693309783936, 3.561569929122925, 3.799370527267456, 4.037170886993408, 4.2749714851379395, 4.512772083282471, 4.750572681427002, 4.988373279571533, 5.2261738777160645, 5.463974475860596, 5.701775074005127, 5.939575672149658, 6.1773762702941895, 6.415176868438721, 6.652977466583252, 6.890777587890625, 7.128578186035156, 7.3663787841796875, 7.604179382324219, 7.84197998046875, 8.079780578613281, 8.317581176757812, 8.555381774902344, 8.793182373046875, 9.030982971191406, 9.268783569335938]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 13.0, 16.0, 11.0, 17.0, 17.0, 39.0, 64.0, 72.0, 97.0, 164.0, 277.0, 434.0, 701.0, 1285.0, 2351.0, 4712.0, 10155.0, 23332.0, 57600.0, 160905.0, 390101.0, 248386.0, 86640.0, 33536.0, 14321.0, 6420.0, 3060.0, 1588.0, 827.0, 462.0, 333.0, 180.0, 134.0, 91.0, 70.0, 34.0, 27.0, 23.0, 15.0, 5.0, 9.0, 9.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.564453125, -2.478118896484375, -2.39178466796875, -2.305450439453125, -2.2191162109375, -2.132781982421875, -2.04644775390625, -1.960113525390625, -1.873779296875, -1.787445068359375, -1.70111083984375, -1.614776611328125, -1.5284423828125, -1.442108154296875, -1.35577392578125, -1.269439697265625, -1.18310546875, -1.096771240234375, -1.01043701171875, -0.924102783203125, -0.8377685546875, -0.751434326171875, -0.66510009765625, -0.578765869140625, -0.492431640625, -0.406097412109375, -0.31976318359375, -0.233428955078125, -0.1470947265625, -0.060760498046875, 0.02557373046875, 0.111907958984375, 0.1982421875, 0.284576416015625, 0.37091064453125, 0.457244873046875, 0.5435791015625, 0.629913330078125, 0.71624755859375, 0.802581787109375, 0.888916015625, 0.975250244140625, 1.06158447265625, 1.147918701171875, 1.2342529296875, 1.320587158203125, 1.40692138671875, 1.493255615234375, 1.57958984375, 1.665924072265625, 1.75225830078125, 1.838592529296875, 1.9249267578125, 2.011260986328125, 2.09759521484375, 2.183929443359375, 2.270263671875, 2.356597900390625, 2.44293212890625, 2.529266357421875, 2.6156005859375, 2.701934814453125, 2.78826904296875, 2.874603271484375, 2.9609375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 8.0, 12.0, 18.0, 30.0, 22.0, 31.0, 52.0, 47.0, 50.0, 70.0, 81.0, 87.0, 88.0, 75.0, 73.0, 61.0, 32.0, 33.0, 42.0, 31.0, 18.0, 8.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.3079376220703125, -1.271148681640625, -1.2343597412109375, -1.19757080078125, -1.1607818603515625, -1.123992919921875, -1.0872039794921875, -1.0504150390625, -1.0136260986328125, -0.976837158203125, -0.9400482177734375, -0.90325927734375, -0.8664703369140625, -0.829681396484375, -0.7928924560546875, -0.756103515625, -0.7193145751953125, -0.682525634765625, -0.6457366943359375, -0.60894775390625, -0.5721588134765625, -0.535369873046875, -0.4985809326171875, -0.4617919921875, -0.4250030517578125, -0.388214111328125, -0.3514251708984375, -0.31463623046875, -0.2778472900390625, -0.241058349609375, -0.2042694091796875, -0.16748046875, -0.1306915283203125, -0.093902587890625, -0.0571136474609375, -0.02032470703125, 0.0164642333984375, 0.053253173828125, 0.0900421142578125, 0.1268310546875, 0.1636199951171875, 0.200408935546875, 0.2371978759765625, 0.27398681640625, 0.3107757568359375, 0.347564697265625, 0.3843536376953125, 0.421142578125, 0.4579315185546875, 0.494720458984375, 0.5315093994140625, 0.56829833984375, 0.6050872802734375, 0.641876220703125, 0.6786651611328125, 0.7154541015625, 0.7522430419921875, 0.789031982421875, 0.8258209228515625, 0.86260986328125, 0.8993988037109375, 0.936187744140625, 0.9729766845703125, 1.009765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 9.0, 7.0, 7.0, 10.0, 12.0, 20.0, 29.0, 42.0, 85.0, 97.0, 199.0, 329.0, 578.0, 1206.0, 2399.0, 5332.0, 13028.0, 34723.0, 114653.0, 379519.0, 342991.0, 100717.0, 31272.0, 11702.0, 4975.0, 2172.0, 1073.0, 549.0, 310.0, 176.0, 113.0, 62.0, 45.0, 26.0, 19.0, 14.0, 14.0, 7.0, 2.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-3.064453125, -2.97418212890625, -2.8839111328125, -2.79364013671875, -2.703369140625, -2.61309814453125, -2.5228271484375, -2.43255615234375, -2.34228515625, -2.25201416015625, -2.1617431640625, -2.07147216796875, -1.981201171875, -1.89093017578125, -1.8006591796875, -1.71038818359375, -1.6201171875, -1.52984619140625, -1.4395751953125, -1.34930419921875, -1.259033203125, -1.16876220703125, -1.0784912109375, -0.98822021484375, -0.89794921875, -0.80767822265625, -0.7174072265625, -0.62713623046875, -0.536865234375, -0.44659423828125, -0.3563232421875, -0.26605224609375, -0.17578125, -0.08551025390625, 0.0047607421875, 0.09503173828125, 0.185302734375, 0.27557373046875, 0.3658447265625, 0.45611572265625, 0.54638671875, 0.63665771484375, 0.7269287109375, 0.81719970703125, 0.907470703125, 0.99774169921875, 1.0880126953125, 1.17828369140625, 1.2685546875, 1.35882568359375, 1.4490966796875, 1.53936767578125, 1.629638671875, 1.71990966796875, 1.8101806640625, 1.90045166015625, 1.99072265625, 2.08099365234375, 2.1712646484375, 2.26153564453125, 2.351806640625, 2.44207763671875, 2.5323486328125, 2.62261962890625, 2.712890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 4.0, 4.0, 16.0, 8.0, 14.0, 16.0, 25.0, 20.0, 26.0, 34.0, 43.0, 45.0, 50.0, 48.0, 57.0, 45.0, 43.0, 61.0, 46.0, 57.0, 46.0, 54.0, 43.0, 31.0, 32.0, 26.0, 21.0, 17.0, 15.0, 14.0, 4.0, 5.0, 3.0, 7.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.4688720703125, -4.340087890625, -4.2113037109375, -4.08251953125, -3.9537353515625, -3.824951171875, -3.6961669921875, -3.5673828125, -3.4385986328125, -3.309814453125, -3.1810302734375, -3.05224609375, -2.9234619140625, -2.794677734375, -2.6658935546875, -2.537109375, -2.4083251953125, -2.279541015625, -2.1507568359375, -2.02197265625, -1.8931884765625, -1.764404296875, -1.6356201171875, -1.5068359375, -1.3780517578125, -1.249267578125, -1.1204833984375, -0.99169921875, -0.8629150390625, -0.734130859375, -0.6053466796875, -0.4765625, -0.3477783203125, -0.218994140625, -0.0902099609375, 0.03857421875, 0.1673583984375, 0.296142578125, 0.4249267578125, 0.5537109375, 0.6824951171875, 0.811279296875, 0.9400634765625, 1.06884765625, 1.1976318359375, 1.326416015625, 1.4552001953125, 1.583984375, 1.7127685546875, 1.841552734375, 1.9703369140625, 2.09912109375, 2.2279052734375, 2.356689453125, 2.4854736328125, 2.6142578125, 2.7430419921875, 2.871826171875, 3.0006103515625, 3.12939453125, 3.2581787109375, 3.386962890625, 3.5157470703125, 3.64453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 11.0, 8.0, 11.0, 19.0, 26.0, 33.0, 53.0, 75.0, 124.0, 192.0, 394.0, 749.0, 1904.0, 5246.0, 20748.0, 164889.0, 715171.0, 114946.0, 16338.0, 4353.0, 1632.0, 715.0, 364.0, 191.0, 110.0, 54.0, 64.0, 34.0, 20.0, 14.0, 11.0, 13.0, 10.0, 13.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.226043701171875, -2.15521240234375, -2.084381103515625, -2.0135498046875, -1.942718505859375, -1.87188720703125, -1.801055908203125, -1.730224609375, -1.659393310546875, -1.58856201171875, -1.517730712890625, -1.4468994140625, -1.376068115234375, -1.30523681640625, -1.234405517578125, -1.16357421875, -1.092742919921875, -1.02191162109375, -0.951080322265625, -0.8802490234375, -0.809417724609375, -0.73858642578125, -0.667755126953125, -0.596923828125, -0.526092529296875, -0.45526123046875, -0.384429931640625, -0.3135986328125, -0.242767333984375, -0.17193603515625, -0.101104736328125, -0.0302734375, 0.040557861328125, 0.11138916015625, 0.182220458984375, 0.2530517578125, 0.323883056640625, 0.39471435546875, 0.465545654296875, 0.536376953125, 0.607208251953125, 0.67803955078125, 0.748870849609375, 0.8197021484375, 0.890533447265625, 0.96136474609375, 1.032196044921875, 1.10302734375, 1.173858642578125, 1.24468994140625, 1.315521240234375, 1.3863525390625, 1.457183837890625, 1.52801513671875, 1.598846435546875, 1.669677734375, 1.740509033203125, 1.81134033203125, 1.882171630859375, 1.9530029296875, 2.023834228515625, 2.09466552734375, 2.165496826171875, 2.236328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 9.0, 6.0, 12.0, 18.0, 32.0, 23.0, 43.0, 78.0, 86.0, 117.0, 122.0, 112.0, 98.0, 68.0, 39.0, 33.0, 20.0, 18.0, 9.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0003829002380371094, -0.0003738868981599808, -0.00036487355828285217, -0.00035586021840572357, -0.00034684687852859497, -0.00033783353865146637, -0.00032882019877433777, -0.00031980685889720917, -0.00031079351902008057, -0.00030178017914295197, -0.00029276683926582336, -0.00028375349938869476, -0.00027474015951156616, -0.00026572681963443756, -0.00025671347975730896, -0.00024770013988018036, -0.00023868680000305176, -0.00022967346012592316, -0.00022066012024879456, -0.00021164678037166595, -0.00020263344049453735, -0.00019362010061740875, -0.00018460676074028015, -0.00017559342086315155, -0.00016658008098602295, -0.00015756674110889435, -0.00014855340123176575, -0.00013954006135463715, -0.00013052672147750854, -0.00012151338160037994, -0.00011250004172325134, -0.00010348670184612274, -9.447336196899414e-05, -8.546002209186554e-05, -7.644668221473694e-05, -6.743334233760834e-05, -5.8420002460479736e-05, -4.9406662583351135e-05, -4.0393322706222534e-05, -3.137998282909393e-05, -2.2366642951965332e-05, -1.3353303074836731e-05, -4.33996319770813e-06, 4.673376679420471e-06, 1.3686716556549072e-05, 2.2700056433677673e-05, 3.1713396310806274e-05, 4.0726736187934875e-05, 4.9740076065063477e-05, 5.875341594219208e-05, 6.776675581932068e-05, 7.678009569644928e-05, 8.579343557357788e-05, 9.480677545070648e-05, 0.00010382011532783508, 0.00011283345520496368, 0.00012184679508209229, 0.00013086013495922089, 0.0001398734748363495, 0.0001488868147134781, 0.0001579001545906067, 0.0001669134944677353, 0.0001759268343448639, 0.0001849401742219925, 0.0001939535140991211]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 4.0, 8.0, 19.0, 26.0, 49.0, 115.0, 230.0, 771.0, 2415.0, 10201.0, 72782.0, 735343.0, 201682.0, 19213.0, 3839.0, 1112.0, 389.0, 166.0, 71.0, 38.0, 25.0, 8.0, 11.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.43487548828125, -2.3580322265625, -2.28118896484375, -2.204345703125, -2.12750244140625, -2.0506591796875, -1.97381591796875, -1.89697265625, -1.82012939453125, -1.7432861328125, -1.66644287109375, -1.589599609375, -1.51275634765625, -1.4359130859375, -1.35906982421875, -1.2822265625, -1.20538330078125, -1.1285400390625, -1.05169677734375, -0.974853515625, -0.89801025390625, -0.8211669921875, -0.74432373046875, -0.66748046875, -0.59063720703125, -0.5137939453125, -0.43695068359375, -0.360107421875, -0.28326416015625, -0.2064208984375, -0.12957763671875, -0.052734375, 0.02410888671875, 0.1009521484375, 0.17779541015625, 0.254638671875, 0.33148193359375, 0.4083251953125, 0.48516845703125, 0.56201171875, 0.63885498046875, 0.7156982421875, 0.79254150390625, 0.869384765625, 0.94622802734375, 1.0230712890625, 1.09991455078125, 1.1767578125, 1.25360107421875, 1.3304443359375, 1.40728759765625, 1.484130859375, 1.56097412109375, 1.6378173828125, 1.71466064453125, 1.79150390625, 1.86834716796875, 1.9451904296875, 2.02203369140625, 2.098876953125, 2.17572021484375, 2.2525634765625, 2.32940673828125, 2.40625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 2.0, 4.0, 7.0, 6.0, 14.0, 7.0, 17.0, 14.0, 31.0, 29.0, 50.0, 61.0, 72.0, 78.0, 104.0, 76.0, 84.0, 78.0, 51.0, 45.0, 34.0, 28.0, 18.0, 24.0, 12.0, 13.0, 7.0, 11.0, 9.0, 1.0, 5.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0], "bins": [-2.078125, -2.02862548828125, -1.9791259765625, -1.92962646484375, -1.880126953125, -1.83062744140625, -1.7811279296875, -1.73162841796875, -1.68212890625, -1.63262939453125, -1.5831298828125, -1.53363037109375, -1.484130859375, -1.43463134765625, -1.3851318359375, -1.33563232421875, -1.2861328125, -1.23663330078125, -1.1871337890625, -1.13763427734375, -1.088134765625, -1.03863525390625, -0.9891357421875, -0.93963623046875, -0.89013671875, -0.84063720703125, -0.7911376953125, -0.74163818359375, -0.692138671875, -0.64263916015625, -0.5931396484375, -0.54364013671875, -0.494140625, -0.44464111328125, -0.3951416015625, -0.34564208984375, -0.296142578125, -0.24664306640625, -0.1971435546875, -0.14764404296875, -0.09814453125, -0.04864501953125, 0.0008544921875, 0.05035400390625, 0.099853515625, 0.14935302734375, 0.1988525390625, 0.24835205078125, 0.2978515625, 0.34735107421875, 0.3968505859375, 0.44635009765625, 0.495849609375, 0.54534912109375, 0.5948486328125, 0.64434814453125, 0.69384765625, 0.74334716796875, 0.7928466796875, 0.84234619140625, 0.891845703125, 0.94134521484375, 0.9908447265625, 1.04034423828125, 1.08984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 24.0, 156.0, 611.0, 184.0, 28.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.2753143310547, -144.61911010742188, -140.96290588378906, -137.30670166015625, -133.65049743652344, -129.99429321289062, -126.33808898925781, -122.68189239501953, -119.02568817138672, -115.3694839477539, -111.7132797241211, -108.05707550048828, -104.40087127685547, -100.74467468261719, -97.08847045898438, -93.43226623535156, -89.77606201171875, -86.11985778808594, -82.46365356445312, -78.80744934082031, -75.1512451171875, -71.49504089355469, -67.83883666992188, -64.1826400756836, -60.52642822265625, -56.87022399902344, -53.214019775390625, -49.55781555175781, -45.901615142822266, -42.24541091918945, -38.58920669555664, -34.933006286621094, -31.27680206298828, -27.62059783935547, -23.96439552307129, -20.308191299438477, -16.651988983154297, -12.995784759521484, -9.339580535888672, -5.683378219604492, -2.0271739959716797, 1.6290295124053955, 5.285233020782471, 8.941436767578125, 12.597640037536621, 16.253843307495117, 19.91004753112793, 23.56624984741211, 27.222454071044922, 30.878658294677734, 34.53486251831055, 38.191062927246094, 41.847267150878906, 45.50347137451172, 49.15967559814453, 52.815879821777344, 56.472084045410156, 60.12828826904297, 63.78449249267578, 67.4406967163086, 71.0969009399414, 74.75309753417969, 78.4093017578125, 82.06550598144531, 85.72171020507812]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 10.0, 11.0, 9.0, 7.0, 24.0, 12.0, 14.0, 33.0, 29.0, 37.0, 32.0, 29.0, 38.0, 55.0, 42.0, 42.0, 47.0, 57.0, 51.0, 46.0, 40.0, 32.0, 36.0, 40.0, 36.0, 34.0, 31.0, 25.0, 23.0, 13.0, 11.0, 10.0, 10.0, 7.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.484071731567383, -26.738187789916992, -25.99230194091797, -25.246417999267578, -24.500534057617188, -23.754650115966797, -23.008764266967773, -22.262880325317383, -21.51699447631836, -20.77111053466797, -20.025224685668945, -19.279340744018555, -18.533456802368164, -17.78757095336914, -17.04168701171875, -16.29580307006836, -15.549919128417969, -14.804034233093262, -14.058150291442871, -13.312265396118164, -12.566381454467773, -11.820496559143066, -11.07461166381836, -10.328727722167969, -9.582842826843262, -8.836957931518555, -8.091073989868164, -7.345189094543457, -6.599304676055908, -5.853420257568359, -5.107535362243652, -4.3616509437561035, -3.6157684326171875, -2.8698840141296387, -2.1239993572235107, -1.3781147003173828, -0.632230281829834, 0.11365413665771484, 0.8595390319824219, 1.6054234504699707, 2.3513078689575195, 3.0971922874450684, 3.8430769443511963, 4.588961601257324, 5.334846019744873, 6.080730438232422, 6.826615333557129, 7.572499752044678, 8.318384170532227, 9.064269065856934, 9.810153007507324, 10.556037902832031, 11.301921844482422, 12.047806739807129, 12.793691635131836, 13.539575576782227, 14.285460472106934, 15.03134536743164, 15.777229309082031, 16.523113250732422, 17.268999099731445, 18.014883041381836, 18.76076889038086, 19.50665283203125, 20.25253677368164]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 8.0, 2.0, 4.0, 8.0, 9.0, 8.0, 11.0, 18.0, 17.0, 31.0, 42.0, 69.0, 125.0, 179.0, 323.0, 554.0, 861.0, 1686.0, 3442.0, 7407.0, 19456.0, 72068.0, 1367221.0, 2606526.0, 78792.0, 20617.0, 7670.0, 3409.0, 1681.0, 831.0, 511.0, 273.0, 159.0, 102.0, 59.0, 37.0, 21.0, 15.0, 11.0, 6.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.61328125, -4.498016357421875, -4.38275146484375, -4.267486572265625, -4.1522216796875, -4.036956787109375, -3.92169189453125, -3.806427001953125, -3.691162109375, -3.575897216796875, -3.46063232421875, -3.345367431640625, -3.2301025390625, -3.114837646484375, -2.99957275390625, -2.884307861328125, -2.76904296875, -2.653778076171875, -2.53851318359375, -2.423248291015625, -2.3079833984375, -2.192718505859375, -2.07745361328125, -1.962188720703125, -1.846923828125, -1.731658935546875, -1.61639404296875, -1.501129150390625, -1.3858642578125, -1.270599365234375, -1.15533447265625, -1.040069580078125, -0.9248046875, -0.809539794921875, -0.69427490234375, -0.579010009765625, -0.4637451171875, -0.348480224609375, -0.23321533203125, -0.117950439453125, -0.002685546875, 0.112579345703125, 0.22784423828125, 0.343109130859375, 0.4583740234375, 0.573638916015625, 0.68890380859375, 0.804168701171875, 0.91943359375, 1.034698486328125, 1.14996337890625, 1.265228271484375, 1.3804931640625, 1.495758056640625, 1.61102294921875, 1.726287841796875, 1.841552734375, 1.956817626953125, 2.07208251953125, 2.187347412109375, 2.3026123046875, 2.417877197265625, 2.53314208984375, 2.648406982421875, 2.763671875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 9.0, 13.0, 15.0, 22.0, 27.0, 34.0, 32.0, 45.0, 59.0, 62.0, 76.0, 95.0, 81.0, 83.0, 66.0, 61.0, 56.0, 45.0, 32.0, 25.0, 24.0, 17.0, 10.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.185546875, -2.13470458984375, -2.0838623046875, -2.03302001953125, -1.982177734375, -1.93133544921875, -1.8804931640625, -1.82965087890625, -1.77880859375, -1.72796630859375, -1.6771240234375, -1.62628173828125, -1.575439453125, -1.52459716796875, -1.4737548828125, -1.42291259765625, -1.3720703125, -1.32122802734375, -1.2703857421875, -1.21954345703125, -1.168701171875, -1.11785888671875, -1.0670166015625, -1.01617431640625, -0.96533203125, -0.91448974609375, -0.8636474609375, -0.81280517578125, -0.761962890625, -0.71112060546875, -0.6602783203125, -0.60943603515625, -0.55859375, -0.50775146484375, -0.4569091796875, -0.40606689453125, -0.355224609375, -0.30438232421875, -0.2535400390625, -0.20269775390625, -0.15185546875, -0.10101318359375, -0.0501708984375, 0.00067138671875, 0.051513671875, 0.10235595703125, 0.1531982421875, 0.20404052734375, 0.2548828125, 0.30572509765625, 0.3565673828125, 0.40740966796875, 0.458251953125, 0.50909423828125, 0.5599365234375, 0.61077880859375, 0.66162109375, 0.71246337890625, 0.7633056640625, 0.81414794921875, 0.864990234375, 0.91583251953125, 0.9666748046875, 1.01751708984375, 1.068359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 10.0, 7.0, 18.0, 52.0, 129.0, 465.0, 1502.0, 7443.0, 113519.0, 4011906.0, 52144.0, 5405.0, 1174.0, 317.0, 113.0, 33.0, 24.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.5655517578125, -8.263916015625, -7.9622802734375, -7.66064453125, -7.3590087890625, -7.057373046875, -6.7557373046875, -6.4541015625, -6.1524658203125, -5.850830078125, -5.5491943359375, -5.24755859375, -4.9459228515625, -4.644287109375, -4.3426513671875, -4.041015625, -3.7393798828125, -3.437744140625, -3.1361083984375, -2.83447265625, -2.5328369140625, -2.231201171875, -1.9295654296875, -1.6279296875, -1.3262939453125, -1.024658203125, -0.7230224609375, -0.42138671875, -0.1197509765625, 0.181884765625, 0.4835205078125, 0.78515625, 1.0867919921875, 1.388427734375, 1.6900634765625, 1.99169921875, 2.2933349609375, 2.594970703125, 2.8966064453125, 3.1982421875, 3.4998779296875, 3.801513671875, 4.1031494140625, 4.40478515625, 4.7064208984375, 5.008056640625, 5.3096923828125, 5.611328125, 5.9129638671875, 6.214599609375, 6.5162353515625, 6.81787109375, 7.1195068359375, 7.421142578125, 7.7227783203125, 8.0244140625, 8.3260498046875, 8.627685546875, 8.9293212890625, 9.23095703125, 9.5325927734375, 9.834228515625, 10.1358642578125, 10.4375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 12.0, 21.0, 21.0, 18.0, 35.0, 79.0, 118.0, 207.0, 573.0, 2114.0, 436.0, 180.0, 96.0, 52.0, 27.0, 16.0, 14.0, 12.0, 3.0, 5.0, 4.0, 3.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.1513671875, -2.078125, -2.0048828125, -1.931640625, -1.8583984375, -1.78515625, -1.7119140625, -1.638671875, -1.5654296875, -1.4921875, -1.4189453125, -1.345703125, -1.2724609375, -1.19921875, -1.1259765625, -1.052734375, -0.9794921875, -0.90625, -0.8330078125, -0.759765625, -0.6865234375, -0.61328125, -0.5400390625, -0.466796875, -0.3935546875, -0.3203125, -0.2470703125, -0.173828125, -0.1005859375, -0.02734375, 0.0458984375, 0.119140625, 0.1923828125, 0.265625, 0.3388671875, 0.412109375, 0.4853515625, 0.55859375, 0.6318359375, 0.705078125, 0.7783203125, 0.8515625, 0.9248046875, 0.998046875, 1.0712890625, 1.14453125, 1.2177734375, 1.291015625, 1.3642578125, 1.4375, 1.5107421875, 1.583984375, 1.6572265625, 1.73046875, 1.8037109375, 1.876953125, 1.9501953125, 2.0234375, 2.0966796875, 2.169921875, 2.2431640625, 2.31640625, 2.3896484375, 2.462890625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 18.0, 37.0, 118.0, 272.0, 310.0, 146.0, 54.0, 24.0, 11.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.700407028198242, -19.023239135742188, -18.346073150634766, -17.668907165527344, -16.99173927307129, -16.314571380615234, -15.637405395507812, -14.960238456726074, -14.283071517944336, -13.605904579162598, -12.92873764038086, -12.251570701599121, -11.574403762817383, -10.897236824035645, -10.220069885253906, -9.542902946472168, -8.86573600769043, -8.188569068908691, -7.511402130126953, -6.834235191345215, -6.157068252563477, -5.479901313781738, -4.802734375, -4.125567436218262, -3.4484004974365234, -2.771233558654785, -2.094066619873047, -1.4168996810913086, -0.7397327423095703, -0.06256580352783203, 0.6146011352539062, 1.2917680740356445, 1.9689369201660156, 2.646103858947754, 3.323270797729492, 4.0004377365112305, 4.677604675292969, 5.354771614074707, 6.031938552856445, 6.709105491638184, 7.386272430419922, 8.06343936920166, 8.740606307983398, 9.417773246765137, 10.094940185546875, 10.772107124328613, 11.449274063110352, 12.12644100189209, 12.803607940673828, 13.480774879455566, 14.157941818237305, 14.835108757019043, 15.512275695800781, 16.189441680908203, 16.866609573364258, 17.543777465820312, 18.220943450927734, 18.898109436035156, 19.57527732849121, 20.252445220947266, 20.929611206054688, 21.60677719116211, 22.283945083618164, 22.96111297607422, 23.63827896118164]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 6.0, 5.0, 5.0, 14.0, 12.0, 13.0, 25.0, 28.0, 32.0, 39.0, 28.0, 52.0, 53.0, 75.0, 78.0, 69.0, 56.0, 70.0, 55.0, 50.0, 32.0, 51.0, 31.0, 30.0, 17.0, 19.0, 17.0, 5.0, 13.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.306209087371826, -6.028374195098877, -5.750539779663086, -5.472704887390137, -5.1948699951171875, -4.917035102844238, -4.639200210571289, -4.361365795135498, -4.083530902862549, -3.8056960105895996, -3.5278613567352295, -3.2500267028808594, -2.97219181060791, -2.694356918334961, -2.416522264480591, -2.1386876106262207, -1.8608527183532715, -1.5830179452896118, -1.3051831722259521, -1.0273483991622925, -0.7495136260986328, -0.47167885303497314, -0.19384407997131348, 0.08399069309234619, 0.36182546615600586, 0.6396602392196655, 0.9174950122833252, 1.1953297853469849, 1.4731645584106445, 1.7509993314743042, 2.028834104537964, 2.306668758392334, 2.584503173828125, 2.862338066101074, 3.1401727199554443, 3.4180073738098145, 3.6958422660827637, 3.973677158355713, 4.251511573791504, 4.529346466064453, 4.807181358337402, 5.085016250610352, 5.362851142883301, 5.640685558319092, 5.918520450592041, 6.19635534286499, 6.474189758300781, 6.7520246505737305, 7.02985954284668, 7.307694435119629, 7.585529327392578, 7.863363742828369, 8.141199111938477, 8.41903305053711, 8.696867942810059, 8.974702835083008, 9.252537727355957, 9.530372619628906, 9.808207511901855, 10.086042404174805, 10.363876342773438, 10.641711235046387, 10.919546127319336, 11.197381019592285, 11.475215911865234]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 13.0, 20.0, 23.0, 31.0, 55.0, 77.0, 109.0, 159.0, 266.0, 399.0, 724.0, 1176.0, 2232.0, 4173.0, 8351.0, 17923.0, 41455.0, 109724.0, 337828.0, 336601.0, 109992.0, 41385.0, 18023.0, 8278.0, 4207.0, 2236.0, 1172.0, 747.0, 421.0, 268.0, 165.0, 103.0, 77.0, 51.0, 28.0, 21.0, 13.0, 8.0, 11.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.125, -3.02734375, -2.9296875, -2.83203125, -2.734375, -2.63671875, -2.5390625, -2.44140625, -2.34375, -2.24609375, -2.1484375, -2.05078125, -1.953125, -1.85546875, -1.7578125, -1.66015625, -1.5625, -1.46484375, -1.3671875, -1.26953125, -1.171875, -1.07421875, -0.9765625, -0.87890625, -0.78125, -0.68359375, -0.5859375, -0.48828125, -0.390625, -0.29296875, -0.1953125, -0.09765625, 0.0, 0.09765625, 0.1953125, 0.29296875, 0.390625, 0.48828125, 0.5859375, 0.68359375, 0.78125, 0.87890625, 0.9765625, 1.07421875, 1.171875, 1.26953125, 1.3671875, 1.46484375, 1.5625, 1.66015625, 1.7578125, 1.85546875, 1.953125, 2.05078125, 2.1484375, 2.24609375, 2.34375, 2.44140625, 2.5390625, 2.63671875, 2.734375, 2.83203125, 2.9296875, 3.02734375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 4.0, 7.0, 10.0, 8.0, 10.0, 15.0, 19.0, 31.0, 24.0, 32.0, 38.0, 39.0, 53.0, 60.0, 70.0, 62.0, 72.0, 54.0, 56.0, 46.0, 63.0, 41.0, 39.0, 39.0, 24.0, 20.0, 21.0, 9.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.447265625, -1.406158447265625, -1.36505126953125, -1.323944091796875, -1.2828369140625, -1.241729736328125, -1.20062255859375, -1.159515380859375, -1.118408203125, -1.077301025390625, -1.03619384765625, -0.995086669921875, -0.9539794921875, -0.912872314453125, -0.87176513671875, -0.830657958984375, -0.78955078125, -0.748443603515625, -0.70733642578125, -0.666229248046875, -0.6251220703125, -0.584014892578125, -0.54290771484375, -0.501800537109375, -0.460693359375, -0.419586181640625, -0.37847900390625, -0.337371826171875, -0.2962646484375, -0.255157470703125, -0.21405029296875, -0.172943115234375, -0.1318359375, -0.090728759765625, -0.04962158203125, -0.008514404296875, 0.0325927734375, 0.073699951171875, 0.11480712890625, 0.155914306640625, 0.197021484375, 0.238128662109375, 0.27923583984375, 0.320343017578125, 0.3614501953125, 0.402557373046875, 0.44366455078125, 0.484771728515625, 0.52587890625, 0.566986083984375, 0.60809326171875, 0.649200439453125, 0.6903076171875, 0.731414794921875, 0.77252197265625, 0.813629150390625, 0.854736328125, 0.895843505859375, 0.93695068359375, 0.978057861328125, 1.0191650390625, 1.060272216796875, 1.10137939453125, 1.142486572265625, 1.18359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 13.0, 12.0, 23.0, 32.0, 44.0, 79.0, 110.0, 186.0, 386.0, 903.0, 2380.0, 7324.0, 26556.0, 128879.0, 610965.0, 215081.0, 39840.0, 10298.0, 3149.0, 1150.0, 478.0, 261.0, 128.0, 79.0, 56.0, 31.0, 16.0, 16.0, 15.0, 12.0, 5.0, 8.0, 2.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.43359375, -5.2767333984375, -5.119873046875, -4.9630126953125, -4.80615234375, -4.6492919921875, -4.492431640625, -4.3355712890625, -4.1787109375, -4.0218505859375, -3.864990234375, -3.7081298828125, -3.55126953125, -3.3944091796875, -3.237548828125, -3.0806884765625, -2.923828125, -2.7669677734375, -2.610107421875, -2.4532470703125, -2.29638671875, -2.1395263671875, -1.982666015625, -1.8258056640625, -1.6689453125, -1.5120849609375, -1.355224609375, -1.1983642578125, -1.04150390625, -0.8846435546875, -0.727783203125, -0.5709228515625, -0.4140625, -0.2572021484375, -0.100341796875, 0.0565185546875, 0.21337890625, 0.3702392578125, 0.527099609375, 0.6839599609375, 0.8408203125, 0.9976806640625, 1.154541015625, 1.3114013671875, 1.46826171875, 1.6251220703125, 1.781982421875, 1.9388427734375, 2.095703125, 2.2525634765625, 2.409423828125, 2.5662841796875, 2.72314453125, 2.8800048828125, 3.036865234375, 3.1937255859375, 3.3505859375, 3.5074462890625, 3.664306640625, 3.8211669921875, 3.97802734375, 4.1348876953125, 4.291748046875, 4.4486083984375, 4.60546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 7.0, 6.0, 5.0, 14.0, 10.0, 11.0, 10.0, 23.0, 16.0, 26.0, 32.0, 39.0, 53.0, 42.0, 65.0, 60.0, 41.0, 46.0, 54.0, 63.0, 51.0, 46.0, 51.0, 42.0, 35.0, 31.0, 25.0, 22.0, 18.0, 7.0, 8.0, 6.0, 13.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.41796875, -5.24658203125, -5.0751953125, -4.90380859375, -4.732421875, -4.56103515625, -4.3896484375, -4.21826171875, -4.046875, -3.87548828125, -3.7041015625, -3.53271484375, -3.361328125, -3.18994140625, -3.0185546875, -2.84716796875, -2.67578125, -2.50439453125, -2.3330078125, -2.16162109375, -1.990234375, -1.81884765625, -1.6474609375, -1.47607421875, -1.3046875, -1.13330078125, -0.9619140625, -0.79052734375, -0.619140625, -0.44775390625, -0.2763671875, -0.10498046875, 0.06640625, 0.23779296875, 0.4091796875, 0.58056640625, 0.751953125, 0.92333984375, 1.0947265625, 1.26611328125, 1.4375, 1.60888671875, 1.7802734375, 1.95166015625, 2.123046875, 2.29443359375, 2.4658203125, 2.63720703125, 2.80859375, 2.97998046875, 3.1513671875, 3.32275390625, 3.494140625, 3.66552734375, 3.8369140625, 4.00830078125, 4.1796875, 4.35107421875, 4.5224609375, 4.69384765625, 4.865234375, 5.03662109375, 5.2080078125, 5.37939453125, 5.55078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 13.0, 22.0, 58.0, 160.0, 494.0, 2378.0, 38872.0, 988468.0, 15979.0, 1495.0, 378.0, 105.0, 57.0, 26.0, 10.0, 7.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.66485595703125, -7.4039306640625, -7.14300537109375, -6.882080078125, -6.62115478515625, -6.3602294921875, -6.09930419921875, -5.83837890625, -5.57745361328125, -5.3165283203125, -5.05560302734375, -4.794677734375, -4.53375244140625, -4.2728271484375, -4.01190185546875, -3.7509765625, -3.49005126953125, -3.2291259765625, -2.96820068359375, -2.707275390625, -2.44635009765625, -2.1854248046875, -1.92449951171875, -1.66357421875, -1.40264892578125, -1.1417236328125, -0.88079833984375, -0.619873046875, -0.35894775390625, -0.0980224609375, 0.16290283203125, 0.423828125, 0.68475341796875, 0.9456787109375, 1.20660400390625, 1.467529296875, 1.72845458984375, 1.9893798828125, 2.25030517578125, 2.51123046875, 2.77215576171875, 3.0330810546875, 3.29400634765625, 3.554931640625, 3.81585693359375, 4.0767822265625, 4.33770751953125, 4.5986328125, 4.85955810546875, 5.1204833984375, 5.38140869140625, 5.642333984375, 5.90325927734375, 6.1641845703125, 6.42510986328125, 6.68603515625, 6.94696044921875, 7.2078857421875, 7.46881103515625, 7.729736328125, 7.99066162109375, 8.2515869140625, 8.51251220703125, 8.7734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 9.0, 20.0, 42.0, 63.0, 114.0, 219.0, 213.0, 144.0, 61.0, 32.0, 26.0, 12.0, 4.0, 8.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004799365997314453, -0.0004639439284801483, -0.0004479512572288513, -0.0004319585859775543, -0.0004159659147262573, -0.00039997324347496033, -0.00038398057222366333, -0.00036798790097236633, -0.00035199522972106934, -0.00033600255846977234, -0.00032000988721847534, -0.00030401721596717834, -0.00028802454471588135, -0.00027203187346458435, -0.00025603920221328735, -0.00024004653096199036, -0.00022405385971069336, -0.00020806118845939636, -0.00019206851720809937, -0.00017607584595680237, -0.00016008317470550537, -0.00014409050345420837, -0.00012809783220291138, -0.00011210516095161438, -9.611248970031738e-05, -8.011981844902039e-05, -6.412714719772339e-05, -4.813447594642639e-05, -3.2141804695129395e-05, -1.6149133443832397e-05, -1.564621925354004e-07, 1.5836209058761597e-05, 3.1828880310058594e-05, 4.782155156135559e-05, 6.381422281265259e-05, 7.980689406394958e-05, 9.579956531524658e-05, 0.00011179223656654358, 0.00012778490781784058, 0.00014377757906913757, 0.00015977025032043457, 0.00017576292157173157, 0.00019175559282302856, 0.00020774826407432556, 0.00022374093532562256, 0.00023973360657691956, 0.00025572627782821655, 0.00027171894907951355, 0.00028771162033081055, 0.00030370429158210754, 0.00031969696283340454, 0.00033568963408470154, 0.00035168230533599854, 0.00036767497658729553, 0.00038366764783859253, 0.0003996603190898895, 0.0004156529903411865, 0.0004316456615924835, 0.0004476383328437805, 0.0004636310040950775, 0.0004796236753463745, 0.0004956163465976715, 0.0005116090178489685, 0.0005276016891002655, 0.0005435943603515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 18.0, 32.0, 39.0, 81.0, 152.0, 304.0, 828.0, 3542.0, 46862.0, 974128.0, 19113.0, 2266.0, 643.0, 235.0, 138.0, 72.0, 29.0, 21.0, 16.0, 6.0, 2.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.08203125, -6.86981201171875, -6.6575927734375, -6.44537353515625, -6.233154296875, -6.02093505859375, -5.8087158203125, -5.59649658203125, -5.38427734375, -5.17205810546875, -4.9598388671875, -4.74761962890625, -4.535400390625, -4.32318115234375, -4.1109619140625, -3.89874267578125, -3.6865234375, -3.47430419921875, -3.2620849609375, -3.04986572265625, -2.837646484375, -2.62542724609375, -2.4132080078125, -2.20098876953125, -1.98876953125, -1.77655029296875, -1.5643310546875, -1.35211181640625, -1.139892578125, -0.92767333984375, -0.7154541015625, -0.50323486328125, -0.291015625, -0.07879638671875, 0.1334228515625, 0.34564208984375, 0.557861328125, 0.77008056640625, 0.9822998046875, 1.19451904296875, 1.40673828125, 1.61895751953125, 1.8311767578125, 2.04339599609375, 2.255615234375, 2.46783447265625, 2.6800537109375, 2.89227294921875, 3.1044921875, 3.31671142578125, 3.5289306640625, 3.74114990234375, 3.953369140625, 4.16558837890625, 4.3778076171875, 4.59002685546875, 4.80224609375, 5.01446533203125, 5.2266845703125, 5.43890380859375, 5.651123046875, 5.86334228515625, 6.0755615234375, 6.28778076171875, 6.5]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 12.0, 26.0, 44.0, 132.0, 335.0, 279.0, 105.0, 23.0, 11.0, 12.0, 9.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.5374755859375, -7.348388671875, -7.1593017578125, -6.97021484375, -6.7811279296875, -6.592041015625, -6.4029541015625, -6.2138671875, -6.0247802734375, -5.835693359375, -5.6466064453125, -5.45751953125, -5.2684326171875, -5.079345703125, -4.8902587890625, -4.701171875, -4.5120849609375, -4.322998046875, -4.1339111328125, -3.94482421875, -3.7557373046875, -3.566650390625, -3.3775634765625, -3.1884765625, -2.9993896484375, -2.810302734375, -2.6212158203125, -2.43212890625, -2.2430419921875, -2.053955078125, -1.8648681640625, -1.67578125, -1.4866943359375, -1.297607421875, -1.1085205078125, -0.91943359375, -0.7303466796875, -0.541259765625, -0.3521728515625, -0.1630859375, 0.0260009765625, 0.215087890625, 0.4041748046875, 0.59326171875, 0.7823486328125, 0.971435546875, 1.1605224609375, 1.349609375, 1.5386962890625, 1.727783203125, 1.9168701171875, 2.10595703125, 2.2950439453125, 2.484130859375, 2.6732177734375, 2.8623046875, 3.0513916015625, 3.240478515625, 3.4295654296875, 3.61865234375, 3.8077392578125, 3.996826171875, 4.1859130859375, 4.375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 10.0, 46.0, 114.0, 301.0, 308.0, 140.0, 62.0, 14.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.95260620117188, -106.82132720947266, -104.69004821777344, -102.55876922607422, -100.427490234375, -98.29621124267578, -96.16493225097656, -94.03365325927734, -91.90237426757812, -89.7710952758789, -87.63981628417969, -85.50853729248047, -83.37725830078125, -81.24597930908203, -79.11470031738281, -76.9834213256836, -74.85214233398438, -72.72086334228516, -70.58958435058594, -68.45830535888672, -66.3270263671875, -64.19574737548828, -62.06446838378906, -59.933189392089844, -57.801910400390625, -55.670631408691406, -53.53935241699219, -51.40807342529297, -49.27679443359375, -47.14551544189453, -45.01423645019531, -42.882957458496094, -40.751678466796875, -38.620399475097656, -36.48912048339844, -34.35784149169922, -32.2265625, -30.09528350830078, -27.964004516601562, -25.832725524902344, -23.701448440551758, -21.57016944885254, -19.43889045715332, -17.3076114654541, -15.176332473754883, -13.045053482055664, -10.913774490356445, -8.782495498657227, -6.651216506958008, -4.519937515258789, -2.3886585235595703, -0.25737953186035156, 1.8738994598388672, 4.005178451538086, 6.136457443237305, 8.267736434936523, 10.399015426635742, 12.530294418334961, 14.66157341003418, 16.7928524017334, 18.924131393432617, 21.055410385131836, 23.186689376831055, 25.317968368530273, 27.449247360229492]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 11.0, 13.0, 10.0, 15.0, 15.0, 23.0, 22.0, 37.0, 24.0, 29.0, 42.0, 44.0, 34.0, 34.0, 36.0, 37.0, 33.0, 42.0, 52.0, 53.0, 43.0, 43.0, 37.0, 34.0, 18.0, 22.0, 30.0, 24.0, 21.0, 20.0, 15.0, 17.0, 13.0, 5.0, 10.0, 11.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-24.015832901000977, -23.306915283203125, -22.597999572753906, -21.889083862304688, -21.180166244506836, -20.471248626708984, -19.762332916259766, -19.053417205810547, -18.344499588012695, -17.635581970214844, -16.926666259765625, -16.217750549316406, -15.508832931518555, -14.79991626739502, -14.090999603271484, -13.38208293914795, -12.673166275024414, -11.964249610900879, -11.255332946777344, -10.546416282653809, -9.837499618530273, -9.128582954406738, -8.419666290283203, -7.710749626159668, -7.001832962036133, -6.292916297912598, -5.5839996337890625, -4.875082969665527, -4.166166305541992, -3.457249641418457, -2.748332977294922, -2.0394163131713867, -1.3305015563964844, -0.6215848922729492, 0.08733177185058594, 0.7962484359741211, 1.5051651000976562, 2.2140817642211914, 2.9229984283447266, 3.6319150924682617, 4.340831756591797, 5.049748420715332, 5.758665084838867, 6.467581748962402, 7.1764984130859375, 7.885415077209473, 8.594331741333008, 9.303248405456543, 10.012165069580078, 10.721081733703613, 11.429998397827148, 12.138915061950684, 12.847831726074219, 13.556748390197754, 14.265665054321289, 14.974581718444824, 15.68349838256836, 16.392414093017578, 17.10133171081543, 17.81024932861328, 18.5191650390625, 19.22808074951172, 19.93699836730957, 20.645915985107422, 21.35483169555664]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 1.0, 2.0, 5.0, 9.0, 7.0, 15.0, 26.0, 17.0, 32.0, 62.0, 79.0, 105.0, 151.0, 244.0, 428.0, 593.0, 1036.0, 1867.0, 3493.0, 7273.0, 18145.0, 58425.0, 490520.0, 3480464.0, 88536.0, 23870.0, 9246.0, 4334.0, 2148.0, 1175.0, 706.0, 411.0, 267.0, 187.0, 117.0, 85.0, 57.0, 36.0, 23.0, 26.0, 22.0, 14.0, 4.0, 4.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.072265625, -2.973602294921875, -2.87493896484375, -2.776275634765625, -2.6776123046875, -2.578948974609375, -2.48028564453125, -2.381622314453125, -2.282958984375, -2.184295654296875, -2.08563232421875, -1.986968994140625, -1.8883056640625, -1.789642333984375, -1.69097900390625, -1.592315673828125, -1.49365234375, -1.394989013671875, -1.29632568359375, -1.197662353515625, -1.0989990234375, -1.000335693359375, -0.90167236328125, -0.803009033203125, -0.704345703125, -0.605682373046875, -0.50701904296875, -0.408355712890625, -0.3096923828125, -0.211029052734375, -0.11236572265625, -0.013702392578125, 0.0849609375, 0.183624267578125, 0.28228759765625, 0.380950927734375, 0.4796142578125, 0.578277587890625, 0.67694091796875, 0.775604248046875, 0.874267578125, 0.972930908203125, 1.07159423828125, 1.170257568359375, 1.2689208984375, 1.367584228515625, 1.46624755859375, 1.564910888671875, 1.66357421875, 1.762237548828125, 1.86090087890625, 1.959564208984375, 2.0582275390625, 2.156890869140625, 2.25555419921875, 2.354217529296875, 2.452880859375, 2.551544189453125, 2.65020751953125, 2.748870849609375, 2.8475341796875, 2.946197509765625, 3.04486083984375, 3.143524169921875, 3.2421875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 19.0, 10.0, 6.0, 10.0, 14.0, 15.0, 20.0, 22.0, 35.0, 38.0, 32.0, 31.0, 43.0, 57.0, 53.0, 49.0, 61.0, 61.0, 47.0, 52.0, 52.0, 47.0, 42.0, 33.0, 30.0, 21.0, 22.0, 12.0, 12.0, 13.0, 4.0, 5.0, 6.0, 7.0, 1.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30078125, -1.26165771484375, -1.2225341796875, -1.18341064453125, -1.144287109375, -1.10516357421875, -1.0660400390625, -1.02691650390625, -0.98779296875, -0.94866943359375, -0.9095458984375, -0.87042236328125, -0.831298828125, -0.79217529296875, -0.7530517578125, -0.71392822265625, -0.6748046875, -0.63568115234375, -0.5965576171875, -0.55743408203125, -0.518310546875, -0.47918701171875, -0.4400634765625, -0.40093994140625, -0.36181640625, -0.32269287109375, -0.2835693359375, -0.24444580078125, -0.205322265625, -0.16619873046875, -0.1270751953125, -0.08795166015625, -0.048828125, -0.00970458984375, 0.0294189453125, 0.06854248046875, 0.107666015625, 0.14678955078125, 0.1859130859375, 0.22503662109375, 0.26416015625, 0.30328369140625, 0.3424072265625, 0.38153076171875, 0.420654296875, 0.45977783203125, 0.4989013671875, 0.53802490234375, 0.5771484375, 0.61627197265625, 0.6553955078125, 0.69451904296875, 0.733642578125, 0.77276611328125, 0.8118896484375, 0.85101318359375, 0.89013671875, 0.92926025390625, 0.9683837890625, 1.00750732421875, 1.046630859375, 1.08575439453125, 1.1248779296875, 1.16400146484375, 1.203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 12.0, 7.0, 8.0, 35.0, 48.0, 59.0, 93.0, 322.0, 8134.0, 4170901.0, 13907.0, 454.0, 126.0, 86.0, 44.0, 26.0, 20.0, 10.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -10.892333984375, -10.14404296875, -9.395751953125, -8.6474609375, -7.899169921875, -7.15087890625, -6.402587890625, -5.654296875, -4.906005859375, -4.15771484375, -3.409423828125, -2.6611328125, -1.912841796875, -1.16455078125, -0.416259765625, 0.33203125, 1.080322265625, 1.82861328125, 2.576904296875, 3.3251953125, 4.073486328125, 4.82177734375, 5.570068359375, 6.318359375, 7.066650390625, 7.81494140625, 8.563232421875, 9.3115234375, 10.059814453125, 10.80810546875, 11.556396484375, 12.3046875, 13.052978515625, 13.80126953125, 14.549560546875, 15.2978515625, 16.046142578125, 16.79443359375, 17.542724609375, 18.291015625, 19.039306640625, 19.78759765625, 20.535888671875, 21.2841796875, 22.032470703125, 22.78076171875, 23.529052734375, 24.27734375, 25.025634765625, 25.77392578125, 26.522216796875, 27.2705078125, 28.018798828125, 28.76708984375, 29.515380859375, 30.263671875, 31.011962890625, 31.76025390625, 32.508544921875, 33.2568359375, 34.005126953125, 34.75341796875, 35.501708984375, 36.25]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 13.0, 23.0, 38.0, 92.0, 363.0, 3179.0, 252.0, 67.0, 28.0, 8.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.908203125, -1.765716552734375, -1.62322998046875, -1.480743408203125, -1.3382568359375, -1.195770263671875, -1.05328369140625, -0.910797119140625, -0.768310546875, -0.625823974609375, -0.48333740234375, -0.340850830078125, -0.1983642578125, -0.055877685546875, 0.08660888671875, 0.229095458984375, 0.37158203125, 0.514068603515625, 0.65655517578125, 0.799041748046875, 0.9415283203125, 1.084014892578125, 1.22650146484375, 1.368988037109375, 1.511474609375, 1.653961181640625, 1.79644775390625, 1.938934326171875, 2.0814208984375, 2.223907470703125, 2.36639404296875, 2.508880615234375, 2.6513671875, 2.793853759765625, 2.93634033203125, 3.078826904296875, 3.2213134765625, 3.363800048828125, 3.50628662109375, 3.648773193359375, 3.791259765625, 3.933746337890625, 4.07623291015625, 4.218719482421875, 4.3612060546875, 4.503692626953125, 4.64617919921875, 4.788665771484375, 4.93115234375, 5.073638916015625, 5.21612548828125, 5.358612060546875, 5.5010986328125, 5.643585205078125, 5.78607177734375, 5.928558349609375, 6.071044921875, 6.213531494140625, 6.35601806640625, 6.498504638671875, 6.6409912109375, 6.783477783203125, 6.92596435546875, 7.068450927734375, 7.2109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 11.0, 25.0, 45.0, 102.0, 156.0, 203.0, 165.0, 124.0, 74.0, 31.0, 25.0, 8.0, 7.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.504908561706543, -12.05265998840332, -11.600411415100098, -11.148162841796875, -10.695914268493652, -10.24366569519043, -9.79141616821289, -9.339168548583984, -8.886919021606445, -8.434670448303223, -7.982421875, -7.530173301696777, -7.077924728393555, -6.625676155090332, -6.173427104949951, -5.7211785316467285, -5.268930435180664, -4.816681861877441, -4.364433288574219, -3.912184476852417, -3.4599359035491943, -3.0076873302459717, -2.55543851852417, -2.1031899452209473, -1.6509413719177246, -1.198692798614502, -0.7464441061019897, -0.29419541358947754, 0.15805315971374512, 0.6103017330169678, 1.0625505447387695, 1.5147991180419922, 1.9670467376708984, 2.419295310974121, 2.8715438842773438, 3.3237926959991455, 3.776041269302368, 4.228289604187012, 4.680538654327393, 5.132787227630615, 5.585035800933838, 6.0372843742370605, 6.489532947540283, 6.941781997680664, 7.394030570983887, 7.846279144287109, 8.298527717590332, 8.750776290893555, 9.203024864196777, 9.6552734375, 10.107522010803223, 10.559770584106445, 11.012019157409668, 11.46426773071289, 11.91651725769043, 12.368764877319336, 12.821014404296875, 13.273262977600098, 13.72551155090332, 14.177760124206543, 14.630008697509766, 15.082257270812988, 15.534505844116211, 15.98675537109375, 16.439002990722656]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 12.0, 12.0, 13.0, 16.0, 17.0, 25.0, 27.0, 34.0, 34.0, 24.0, 42.0, 39.0, 38.0, 46.0, 51.0, 42.0, 46.0, 35.0, 45.0, 54.0, 45.0, 44.0, 36.0, 33.0, 23.0, 25.0, 24.0, 19.0, 18.0, 8.0, 10.0, 9.0, 7.0, 13.0, 2.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.29758071899414, -8.067474365234375, -7.837368488311768, -7.607262134552002, -7.3771562576293945, -7.147049903869629, -6.916943550109863, -6.686837673187256, -6.456731796264648, -6.226625442504883, -5.996519565582275, -5.76641321182251, -5.536307334899902, -5.306200981140137, -5.076094627380371, -4.845988750457764, -4.615882396697998, -4.385776042938232, -4.155670166015625, -3.9255638122558594, -3.695457935333252, -3.4653515815734863, -3.2352454662323, -3.0051393508911133, -2.7750332355499268, -2.5449271202087402, -2.3148210048675537, -2.084714889526367, -1.8546086549758911, -1.6245025396347046, -1.3943963050842285, -1.164290189743042, -0.9341835975646973, -0.7040774822235107, -0.47397130727767944, -0.24386513233184814, -0.013759016990661621, 0.2163470983505249, 0.446453332901001, 0.6765594482421875, 0.906665563583374, 1.1367716789245605, 1.366877794265747, 1.5969840288162231, 1.8270901441574097, 2.0571961402893066, 2.2873024940490723, 2.517408609390259, 2.7475147247314453, 2.977620840072632, 3.2077269554138184, 3.437833309173584, 3.6679391860961914, 3.898045539855957, 4.128151893615723, 4.35825777053833, 4.5883636474609375, 4.818470001220703, 5.0485758781433105, 5.278682231903076, 5.508788108825684, 5.738894462585449, 5.969000816345215, 6.199106693267822, 6.429213047027588]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 0.0, 5.0, 3.0, 6.0, 5.0, 18.0, 19.0, 32.0, 42.0, 75.0, 106.0, 169.0, 297.0, 599.0, 1051.0, 2075.0, 4088.0, 8555.0, 19437.0, 47490.0, 127704.0, 363671.0, 299945.0, 102950.0, 39192.0, 16165.0, 7352.0, 3595.0, 1756.0, 896.0, 526.0, 270.0, 178.0, 102.0, 62.0, 38.0, 25.0, 16.0, 11.0, 6.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.66796875, -3.55975341796875, -3.4515380859375, -3.34332275390625, -3.235107421875, -3.12689208984375, -3.0186767578125, -2.91046142578125, -2.80224609375, -2.69403076171875, -2.5858154296875, -2.47760009765625, -2.369384765625, -2.26116943359375, -2.1529541015625, -2.04473876953125, -1.9365234375, -1.82830810546875, -1.7200927734375, -1.61187744140625, -1.503662109375, -1.39544677734375, -1.2872314453125, -1.17901611328125, -1.07080078125, -0.96258544921875, -0.8543701171875, -0.74615478515625, -0.637939453125, -0.52972412109375, -0.4215087890625, -0.31329345703125, -0.205078125, -0.09686279296875, 0.0113525390625, 0.11956787109375, 0.227783203125, 0.33599853515625, 0.4442138671875, 0.55242919921875, 0.66064453125, 0.76885986328125, 0.8770751953125, 0.98529052734375, 1.093505859375, 1.20172119140625, 1.3099365234375, 1.41815185546875, 1.5263671875, 1.63458251953125, 1.7427978515625, 1.85101318359375, 1.959228515625, 2.06744384765625, 2.1756591796875, 2.28387451171875, 2.39208984375, 2.50030517578125, 2.6085205078125, 2.71673583984375, 2.824951171875, 2.93316650390625, 3.0413818359375, 3.14959716796875, 3.2578125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 11.0, 11.0, 8.0, 11.0, 10.0, 22.0, 21.0, 30.0, 28.0, 25.0, 27.0, 41.0, 43.0, 46.0, 39.0, 49.0, 42.0, 45.0, 55.0, 46.0, 54.0, 46.0, 35.0, 39.0, 30.0, 28.0, 26.0, 26.0, 14.0, 11.0, 11.0, 14.0, 9.0, 8.0, 5.0, 1.0, 4.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.283203125, -1.244293212890625, -1.20538330078125, -1.166473388671875, -1.1275634765625, -1.088653564453125, -1.04974365234375, -1.010833740234375, -0.971923828125, -0.933013916015625, -0.89410400390625, -0.855194091796875, -0.8162841796875, -0.777374267578125, -0.73846435546875, -0.699554443359375, -0.66064453125, -0.621734619140625, -0.58282470703125, -0.543914794921875, -0.5050048828125, -0.466094970703125, -0.42718505859375, -0.388275146484375, -0.349365234375, -0.310455322265625, -0.27154541015625, -0.232635498046875, -0.1937255859375, -0.154815673828125, -0.11590576171875, -0.076995849609375, -0.0380859375, 0.000823974609375, 0.03973388671875, 0.078643798828125, 0.1175537109375, 0.156463623046875, 0.19537353515625, 0.234283447265625, 0.273193359375, 0.312103271484375, 0.35101318359375, 0.389923095703125, 0.4288330078125, 0.467742919921875, 0.50665283203125, 0.545562744140625, 0.58447265625, 0.623382568359375, 0.66229248046875, 0.701202392578125, 0.7401123046875, 0.779022216796875, 0.81793212890625, 0.856842041015625, 0.895751953125, 0.934661865234375, 0.97357177734375, 1.012481689453125, 1.0513916015625, 1.090301513671875, 1.12921142578125, 1.168121337890625, 1.20703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 7.0, 10.0, 8.0, 11.0, 12.0, 19.0, 40.0, 60.0, 94.0, 257.0, 782.0, 2949.0, 14300.0, 91227.0, 663475.0, 237039.0, 30513.0, 5616.0, 1338.0, 406.0, 144.0, 67.0, 45.0, 22.0, 27.0, 16.0, 11.0, 7.0, 8.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.81640625, -6.57904052734375, -6.3416748046875, -6.10430908203125, -5.866943359375, -5.62957763671875, -5.3922119140625, -5.15484619140625, -4.91748046875, -4.68011474609375, -4.4427490234375, -4.20538330078125, -3.968017578125, -3.73065185546875, -3.4932861328125, -3.25592041015625, -3.0185546875, -2.78118896484375, -2.5438232421875, -2.30645751953125, -2.069091796875, -1.83172607421875, -1.5943603515625, -1.35699462890625, -1.11962890625, -0.88226318359375, -0.6448974609375, -0.40753173828125, -0.170166015625, 0.06719970703125, 0.3045654296875, 0.54193115234375, 0.779296875, 1.01666259765625, 1.2540283203125, 1.49139404296875, 1.728759765625, 1.96612548828125, 2.2034912109375, 2.44085693359375, 2.67822265625, 2.91558837890625, 3.1529541015625, 3.39031982421875, 3.627685546875, 3.86505126953125, 4.1024169921875, 4.33978271484375, 4.5771484375, 4.81451416015625, 5.0518798828125, 5.28924560546875, 5.526611328125, 5.76397705078125, 6.0013427734375, 6.23870849609375, 6.47607421875, 6.71343994140625, 6.9508056640625, 7.18817138671875, 7.425537109375, 7.66290283203125, 7.9002685546875, 8.13763427734375, 8.375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 3.0, 7.0, 8.0, 11.0, 9.0, 8.0, 12.0, 16.0, 15.0, 20.0, 16.0, 25.0, 20.0, 33.0, 29.0, 38.0, 35.0, 45.0, 36.0, 34.0, 37.0, 47.0, 29.0, 41.0, 35.0, 42.0, 39.0, 36.0, 35.0, 26.0, 25.0, 25.0, 23.0, 17.0, 15.0, 16.0, 14.0, 12.0, 9.0, 7.0, 9.0, 10.0, 5.0, 8.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-4.4609375, -4.31494140625, -4.1689453125, -4.02294921875, -3.876953125, -3.73095703125, -3.5849609375, -3.43896484375, -3.29296875, -3.14697265625, -3.0009765625, -2.85498046875, -2.708984375, -2.56298828125, -2.4169921875, -2.27099609375, -2.125, -1.97900390625, -1.8330078125, -1.68701171875, -1.541015625, -1.39501953125, -1.2490234375, -1.10302734375, -0.95703125, -0.81103515625, -0.6650390625, -0.51904296875, -0.373046875, -0.22705078125, -0.0810546875, 0.06494140625, 0.2109375, 0.35693359375, 0.5029296875, 0.64892578125, 0.794921875, 0.94091796875, 1.0869140625, 1.23291015625, 1.37890625, 1.52490234375, 1.6708984375, 1.81689453125, 1.962890625, 2.10888671875, 2.2548828125, 2.40087890625, 2.546875, 2.69287109375, 2.8388671875, 2.98486328125, 3.130859375, 3.27685546875, 3.4228515625, 3.56884765625, 3.71484375, 3.86083984375, 4.0068359375, 4.15283203125, 4.298828125, 4.44482421875, 4.5908203125, 4.73681640625, 4.8828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 4.0, 4.0, 12.0, 7.0, 17.0, 25.0, 54.0, 72.0, 180.0, 547.0, 2467.0, 30690.0, 1003670.0, 8718.0, 1397.0, 365.0, 148.0, 66.0, 41.0, 27.0, 14.0, 10.0, 7.0, 7.0, 1.0, 1.0, 5.0, 1.0, 4.0], "bins": [-15.2265625, -14.90484619140625, -14.5831298828125, -14.26141357421875, -13.939697265625, -13.61798095703125, -13.2962646484375, -12.97454833984375, -12.65283203125, -12.33111572265625, -12.0093994140625, -11.68768310546875, -11.365966796875, -11.04425048828125, -10.7225341796875, -10.40081787109375, -10.0791015625, -9.75738525390625, -9.4356689453125, -9.11395263671875, -8.792236328125, -8.47052001953125, -8.1488037109375, -7.82708740234375, -7.50537109375, -7.18365478515625, -6.8619384765625, -6.54022216796875, -6.218505859375, -5.89678955078125, -5.5750732421875, -5.25335693359375, -4.931640625, -4.60992431640625, -4.2882080078125, -3.96649169921875, -3.644775390625, -3.32305908203125, -3.0013427734375, -2.67962646484375, -2.35791015625, -2.03619384765625, -1.7144775390625, -1.39276123046875, -1.071044921875, -0.74932861328125, -0.4276123046875, -0.10589599609375, 0.2158203125, 0.53753662109375, 0.8592529296875, 1.18096923828125, 1.502685546875, 1.82440185546875, 2.1461181640625, 2.46783447265625, 2.78955078125, 3.11126708984375, 3.4329833984375, 3.75469970703125, 4.076416015625, 4.39813232421875, 4.7198486328125, 5.04156494140625, 5.36328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 13.0, 12.0, 31.0, 55.0, 84.0, 136.0, 222.0, 192.0, 94.0, 62.0, 33.0, 18.0, 10.0, 14.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005717277526855469, -0.0005547478795051575, -0.0005377680063247681, -0.0005207881331443787, -0.0005038082599639893, -0.00048682838678359985, -0.00046984851360321045, -0.00045286864042282104, -0.00043588876724243164, -0.00041890889406204224, -0.00040192902088165283, -0.00038494914770126343, -0.000367969274520874, -0.0003509894013404846, -0.0003340095281600952, -0.0003170296549797058, -0.0003000497817993164, -0.000283069908618927, -0.0002660900354385376, -0.0002491101622581482, -0.0002321302890777588, -0.00021515041589736938, -0.00019817054271697998, -0.00018119066953659058, -0.00016421079635620117, -0.00014723092317581177, -0.00013025104999542236, -0.00011327117681503296, -9.629130363464355e-05, -7.931143045425415e-05, -6.233155727386475e-05, -4.535168409347534e-05, -2.8371810913085938e-05, -1.1391937732696533e-05, 5.587935447692871e-06, 2.2567808628082275e-05, 3.954768180847168e-05, 5.6527554988861084e-05, 7.350742816925049e-05, 9.048730134963989e-05, 0.0001074671745300293, 0.0001244470477104187, 0.0001414269208908081, 0.0001584067940711975, 0.00017538666725158691, 0.00019236654043197632, 0.00020934641361236572, 0.00022632628679275513, 0.00024330615997314453, 0.00026028603315353394, 0.00027726590633392334, 0.00029424577951431274, 0.00031122565269470215, 0.00032820552587509155, 0.00034518539905548096, 0.00036216527223587036, 0.00037914514541625977, 0.00039612501859664917, 0.0004131048917770386, 0.000430084764957428, 0.0004470646381378174, 0.0004640445113182068, 0.0004810243844985962, 0.0004980042576789856, 0.000514984130859375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 6.0, 26.0, 51.0, 189.0, 724.0, 4688.0, 723348.0, 314573.0, 3980.0, 672.0, 171.0, 45.0, 28.0, 14.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28515625, -6.99322509765625, -6.7012939453125, -6.40936279296875, -6.117431640625, -5.82550048828125, -5.5335693359375, -5.24163818359375, -4.94970703125, -4.65777587890625, -4.3658447265625, -4.07391357421875, -3.781982421875, -3.49005126953125, -3.1981201171875, -2.90618896484375, -2.6142578125, -2.32232666015625, -2.0303955078125, -1.73846435546875, -1.446533203125, -1.15460205078125, -0.8626708984375, -0.57073974609375, -0.27880859375, 0.01312255859375, 0.3050537109375, 0.59698486328125, 0.888916015625, 1.18084716796875, 1.4727783203125, 1.76470947265625, 2.056640625, 2.34857177734375, 2.6405029296875, 2.93243408203125, 3.224365234375, 3.51629638671875, 3.8082275390625, 4.10015869140625, 4.39208984375, 4.68402099609375, 4.9759521484375, 5.26788330078125, 5.559814453125, 5.85174560546875, 6.1436767578125, 6.43560791015625, 6.7275390625, 7.01947021484375, 7.3114013671875, 7.60333251953125, 7.895263671875, 8.18719482421875, 8.4791259765625, 8.77105712890625, 9.06298828125, 9.35491943359375, 9.6468505859375, 9.93878173828125, 10.230712890625, 10.52264404296875, 10.8145751953125, 11.10650634765625, 11.3984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 5.0, 4.0, 7.0, 4.0, 8.0, 24.0, 39.0, 98.0, 155.0, 222.0, 160.0, 117.0, 69.0, 37.0, 15.0, 13.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8828125, -2.770263671875, -2.65771484375, -2.545166015625, -2.4326171875, -2.320068359375, -2.20751953125, -2.094970703125, -1.982421875, -1.869873046875, -1.75732421875, -1.644775390625, -1.5322265625, -1.419677734375, -1.30712890625, -1.194580078125, -1.08203125, -0.969482421875, -0.85693359375, -0.744384765625, -0.6318359375, -0.519287109375, -0.40673828125, -0.294189453125, -0.181640625, -0.069091796875, 0.04345703125, 0.156005859375, 0.2685546875, 0.381103515625, 0.49365234375, 0.606201171875, 0.71875, 0.831298828125, 0.94384765625, 1.056396484375, 1.1689453125, 1.281494140625, 1.39404296875, 1.506591796875, 1.619140625, 1.731689453125, 1.84423828125, 1.956787109375, 2.0693359375, 2.181884765625, 2.29443359375, 2.406982421875, 2.51953125, 2.632080078125, 2.74462890625, 2.857177734375, 2.9697265625, 3.082275390625, 3.19482421875, 3.307373046875, 3.419921875, 3.532470703125, 3.64501953125, 3.757568359375, 3.8701171875, 3.982666015625, 4.09521484375, 4.207763671875, 4.3203125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [3.0, 6.0, 5.0, 20.0, 57.0, 170.0, 322.0, 252.0, 112.0, 43.0, 14.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.072458267211914, -12.796661376953125, -10.520864486694336, -8.245067596435547, -5.969270706176758, -3.6934738159179688, -1.4176769256591797, 0.8581199645996094, 3.1339168548583984, 5.4097137451171875, 7.685510635375977, 9.961307525634766, 12.237104415893555, 14.512901306152344, 16.788698196411133, 19.064495086669922, 21.34029197692871, 23.6160888671875, 25.89188575744629, 28.167682647705078, 30.443479537963867, 32.719276428222656, 34.99507141113281, 37.270870208740234, 39.546669006347656, 41.82246398925781, 44.098262786865234, 46.374061584472656, 48.64985656738281, 50.92565155029297, 53.20145034790039, 55.47724914550781, 57.75303649902344, 60.028831481933594, 62.304630279541016, 64.58042907714844, 66.8562240600586, 69.13201904296875, 71.40782165527344, 73.6836166381836, 75.95941162109375, 78.2352066040039, 80.51100158691406, 82.78680419921875, 85.0625991821289, 87.33839416503906, 89.61419677734375, 91.8899917602539, 94.16578674316406, 96.44158172607422, 98.71737670898438, 100.99317932128906, 103.26897430419922, 105.54476928710938, 107.82057189941406, 110.09636688232422, 112.37216186523438, 114.64795684814453, 116.92375183105469, 119.19955444335938, 121.47534942626953, 123.75114440917969, 126.02694702148438, 128.302734375, 130.5785369873047]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 9.0, 9.0, 3.0, 10.0, 13.0, 10.0, 18.0, 30.0, 18.0, 16.0, 27.0, 31.0, 29.0, 24.0, 42.0, 41.0, 44.0, 50.0, 45.0, 38.0, 33.0, 35.0, 46.0, 43.0, 34.0, 32.0, 38.0, 29.0, 26.0, 26.0, 17.0, 22.0, 26.0, 11.0, 9.0, 14.0, 17.0, 9.0, 5.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.151662826538086, -24.38291358947754, -23.614166259765625, -22.845417022705078, -22.07666778564453, -21.307918548583984, -20.539169311523438, -19.770421981811523, -19.001672744750977, -18.23292350769043, -17.464176177978516, -16.69542694091797, -15.926677703857422, -15.157928466796875, -14.389180183410645, -13.620431900024414, -12.851682662963867, -12.08293342590332, -11.31418514251709, -10.54543685913086, -9.776687622070312, -9.007938385009766, -8.239190101623535, -7.4704413414001465, -6.701692581176758, -5.932943820953369, -5.1641950607299805, -4.395446300506592, -3.626697540283203, -2.8579487800598145, -2.089200019836426, -1.320451259613037, -0.5517024993896484, 0.21704626083374023, 0.9857950210571289, 1.7545437812805176, 2.5232925415039062, 3.292041301727295, 4.060790061950684, 4.829538822174072, 5.598287582397461, 6.36703634262085, 7.135785102844238, 7.904533863067627, 8.673282623291016, 9.442031860351562, 10.210780143737793, 10.979528427124023, 11.74827766418457, 12.517026901245117, 13.285775184631348, 14.054523468017578, 14.823272705078125, 15.592021942138672, 16.36077117919922, 17.129518508911133, 17.89826774597168, 18.667016983032227, 19.43576431274414, 20.204513549804688, 20.973262786865234, 21.74201202392578, 22.510761260986328, 23.279508590698242, 24.04825782775879]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 12.0, 13.0, 34.0, 40.0, 37.0, 97.0, 133.0, 246.0, 355.0, 666.0, 1391.0, 2607.0, 6027.0, 17235.0, 75550.0, 3918876.0, 132714.0, 23700.0, 7811.0, 3180.0, 1516.0, 807.0, 470.0, 258.0, 165.0, 129.0, 60.0, 46.0, 28.0, 15.0, 11.0, 14.0, 11.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.25408935546875, -6.0277099609375, -5.80133056640625, -5.574951171875, -5.34857177734375, -5.1221923828125, -4.89581298828125, -4.66943359375, -4.44305419921875, -4.2166748046875, -3.99029541015625, -3.763916015625, -3.53753662109375, -3.3111572265625, -3.08477783203125, -2.8583984375, -2.63201904296875, -2.4056396484375, -2.17926025390625, -1.952880859375, -1.72650146484375, -1.5001220703125, -1.27374267578125, -1.04736328125, -0.82098388671875, -0.5946044921875, -0.36822509765625, -0.141845703125, 0.08453369140625, 0.3109130859375, 0.53729248046875, 0.763671875, 0.99005126953125, 1.2164306640625, 1.44281005859375, 1.669189453125, 1.89556884765625, 2.1219482421875, 2.34832763671875, 2.57470703125, 2.80108642578125, 3.0274658203125, 3.25384521484375, 3.480224609375, 3.70660400390625, 3.9329833984375, 4.15936279296875, 4.3857421875, 4.61212158203125, 4.8385009765625, 5.06488037109375, 5.291259765625, 5.51763916015625, 5.7440185546875, 5.97039794921875, 6.19677734375, 6.42315673828125, 6.6495361328125, 6.87591552734375, 7.102294921875, 7.32867431640625, 7.5550537109375, 7.78143310546875, 8.0078125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 2.0, 9.0, 6.0, 9.0, 12.0, 12.0, 15.0, 26.0, 34.0, 25.0, 37.0, 33.0, 44.0, 45.0, 39.0, 46.0, 38.0, 58.0, 55.0, 56.0, 49.0, 50.0, 46.0, 46.0, 31.0, 23.0, 29.0, 34.0, 12.0, 17.0, 17.0, 8.0, 8.0, 5.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4365234375, -1.3884124755859375, -1.340301513671875, -1.2921905517578125, -1.24407958984375, -1.1959686279296875, -1.147857666015625, -1.0997467041015625, -1.0516357421875, -1.0035247802734375, -0.955413818359375, -0.9073028564453125, -0.85919189453125, -0.8110809326171875, -0.762969970703125, -0.7148590087890625, -0.666748046875, -0.6186370849609375, -0.570526123046875, -0.5224151611328125, -0.47430419921875, -0.4261932373046875, -0.378082275390625, -0.3299713134765625, -0.2818603515625, -0.2337493896484375, -0.185638427734375, -0.1375274658203125, -0.08941650390625, -0.0413055419921875, 0.006805419921875, 0.0549163818359375, 0.10302734375, 0.1511383056640625, 0.199249267578125, 0.2473602294921875, 0.29547119140625, 0.3435821533203125, 0.391693115234375, 0.4398040771484375, 0.4879150390625, 0.5360260009765625, 0.584136962890625, 0.6322479248046875, 0.68035888671875, 0.7284698486328125, 0.776580810546875, 0.8246917724609375, 0.872802734375, 0.9209136962890625, 0.969024658203125, 1.0171356201171875, 1.06524658203125, 1.1133575439453125, 1.161468505859375, 1.2095794677734375, 1.2576904296875, 1.3058013916015625, 1.353912353515625, 1.4020233154296875, 1.45013427734375, 1.4982452392578125, 1.546356201171875, 1.5944671630859375, 1.642578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 1.0, 1.0, 9.0, 19.0, 52.0, 124.0, 303.0, 918.0, 3381.0, 23135.0, 4000210.0, 154430.0, 9003.0, 1765.0, 585.0, 212.0, 81.0, 30.0, 12.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.484375, -14.9971923828125, -14.510009765625, -14.0228271484375, -13.53564453125, -13.0484619140625, -12.561279296875, -12.0740966796875, -11.5869140625, -11.0997314453125, -10.612548828125, -10.1253662109375, -9.63818359375, -9.1510009765625, -8.663818359375, -8.1766357421875, -7.689453125, -7.2022705078125, -6.715087890625, -6.2279052734375, -5.74072265625, -5.2535400390625, -4.766357421875, -4.2791748046875, -3.7919921875, -3.3048095703125, -2.817626953125, -2.3304443359375, -1.84326171875, -1.3560791015625, -0.868896484375, -0.3817138671875, 0.10546875, 0.5926513671875, 1.079833984375, 1.5670166015625, 2.05419921875, 2.5413818359375, 3.028564453125, 3.5157470703125, 4.0029296875, 4.4901123046875, 4.977294921875, 5.4644775390625, 5.95166015625, 6.4388427734375, 6.926025390625, 7.4132080078125, 7.900390625, 8.3875732421875, 8.874755859375, 9.3619384765625, 9.84912109375, 10.3363037109375, 10.823486328125, 11.3106689453125, 11.7978515625, 12.2850341796875, 12.772216796875, 13.2593994140625, 13.74658203125, 14.2337646484375, 14.720947265625, 15.2081298828125, 15.6953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 1.0, 8.0, 3.0, 14.0, 16.0, 26.0, 36.0, 44.0, 67.0, 173.0, 2808.0, 562.0, 130.0, 65.0, 41.0, 12.0, 9.0, 9.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.212890625, -3.11187744140625, -3.0108642578125, -2.90985107421875, -2.808837890625, -2.70782470703125, -2.6068115234375, -2.50579833984375, -2.40478515625, -2.30377197265625, -2.2027587890625, -2.10174560546875, -2.000732421875, -1.89971923828125, -1.7987060546875, -1.69769287109375, -1.5966796875, -1.49566650390625, -1.3946533203125, -1.29364013671875, -1.192626953125, -1.09161376953125, -0.9906005859375, -0.88958740234375, -0.78857421875, -0.68756103515625, -0.5865478515625, -0.48553466796875, -0.384521484375, -0.28350830078125, -0.1824951171875, -0.08148193359375, 0.01953125, 0.12054443359375, 0.2215576171875, 0.32257080078125, 0.423583984375, 0.52459716796875, 0.6256103515625, 0.72662353515625, 0.82763671875, 0.92864990234375, 1.0296630859375, 1.13067626953125, 1.231689453125, 1.33270263671875, 1.4337158203125, 1.53472900390625, 1.6357421875, 1.73675537109375, 1.8377685546875, 1.93878173828125, 2.039794921875, 2.14080810546875, 2.2418212890625, 2.34283447265625, 2.44384765625, 2.54486083984375, 2.6458740234375, 2.74688720703125, 2.847900390625, 2.94891357421875, 3.0499267578125, 3.15093994140625, 3.251953125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 8.0, 13.0, 37.0, 78.0, 177.0, 262.0, 246.0, 114.0, 36.0, 14.0, 4.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.7468204498291, -17.033931732177734, -16.321043014526367, -15.608153343200684, -14.895264625549316, -14.18237590789795, -13.469486236572266, -12.756597518920898, -12.043708801269531, -11.330820083618164, -10.617931365966797, -9.905041694641113, -9.192152976989746, -8.479264259338379, -7.7663750648498535, -7.053485870361328, -6.340597152709961, -5.627708435058594, -4.914819240570068, -4.201930046081543, -3.489041328430176, -2.7761523723602295, -2.063263416290283, -1.3503742218017578, -0.6374855041503906, 0.07540345191955566, 0.788292407989502, 1.5011813640594482, 2.2140703201293945, 2.926959276199341, 3.639848232269287, 4.3527374267578125, 5.06562614440918, 5.778514862060547, 6.491404056549072, 7.204293251037598, 7.917181968688965, 8.630070686340332, 9.342960357666016, 10.055849075317383, 10.76873779296875, 11.481626510620117, 12.194515228271484, 12.907404899597168, 13.620293617248535, 14.333182334899902, 15.046072006225586, 15.758960723876953, 16.47184944152832, 17.184738159179688, 17.897626876831055, 18.610515594482422, 19.323406219482422, 20.03629493713379, 20.749183654785156, 21.462072372436523, 22.17496109008789, 22.887849807739258, 23.600738525390625, 24.313627243041992, 25.02651596069336, 25.73940658569336, 26.452295303344727, 27.165184020996094, 27.87807273864746]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 11.0, 4.0, 9.0, 15.0, 23.0, 25.0, 26.0, 30.0, 31.0, 31.0, 31.0, 39.0, 41.0, 32.0, 41.0, 46.0, 43.0, 48.0, 44.0, 63.0, 33.0, 32.0, 39.0, 39.0, 34.0, 24.0, 33.0, 26.0, 14.0, 19.0, 17.0, 10.0, 12.0, 3.0, 3.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.619104862213135, -6.378561973571777, -6.13801908493042, -5.8974761962890625, -5.656933307647705, -5.416390419006348, -5.17584753036499, -4.935304641723633, -4.694761753082275, -4.454218864440918, -4.2136759757995605, -3.973133087158203, -3.7325901985168457, -3.4920473098754883, -3.251504421234131, -3.0109615325927734, -2.770418643951416, -2.5298757553100586, -2.289332866668701, -2.0487899780273438, -1.8082470893859863, -1.567704200744629, -1.3271613121032715, -1.086618423461914, -0.8460755348205566, -0.6055326461791992, -0.3649897575378418, -0.12444686889648438, 0.11609601974487305, 0.35663890838623047, 0.5971817970275879, 0.8377246856689453, 1.078268051147461, 1.3188109397888184, 1.5593538284301758, 1.7998967170715332, 2.0404396057128906, 2.280982494354248, 2.5215253829956055, 2.762068271636963, 3.0026111602783203, 3.2431540489196777, 3.483696937561035, 3.7242398262023926, 3.96478271484375, 4.205325603485107, 4.445868492126465, 4.686411380767822, 4.92695426940918, 5.167497158050537, 5.4080400466918945, 5.648582935333252, 5.889125823974609, 6.129668712615967, 6.370211601257324, 6.610754489898682, 6.851297378540039, 7.0918402671813965, 7.332383155822754, 7.572926044464111, 7.813468933105469, 8.054012298583984, 8.294554710388184, 8.535097122192383, 8.775640487670898]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 6.0, 9.0, 11.0, 21.0, 19.0, 44.0, 59.0, 96.0, 122.0, 176.0, 327.0, 484.0, 841.0, 1302.0, 2373.0, 4339.0, 8610.0, 17960.0, 41369.0, 102849.0, 277466.0, 353332.0, 136723.0, 54217.0, 23116.0, 10654.0, 5195.0, 2768.0, 1596.0, 949.0, 544.0, 335.0, 235.0, 139.0, 78.0, 62.0, 42.0, 32.0, 20.0, 10.0, 7.0, 8.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.96551513671875, -3.8294677734375, -3.69342041015625, -3.557373046875, -3.42132568359375, -3.2852783203125, -3.14923095703125, -3.01318359375, -2.87713623046875, -2.7410888671875, -2.60504150390625, -2.468994140625, -2.33294677734375, -2.1968994140625, -2.06085205078125, -1.9248046875, -1.78875732421875, -1.6527099609375, -1.51666259765625, -1.380615234375, -1.24456787109375, -1.1085205078125, -0.97247314453125, -0.83642578125, -0.70037841796875, -0.5643310546875, -0.42828369140625, -0.292236328125, -0.15618896484375, -0.0201416015625, 0.11590576171875, 0.251953125, 0.38800048828125, 0.5240478515625, 0.66009521484375, 0.796142578125, 0.93218994140625, 1.0682373046875, 1.20428466796875, 1.34033203125, 1.47637939453125, 1.6124267578125, 1.74847412109375, 1.884521484375, 2.02056884765625, 2.1566162109375, 2.29266357421875, 2.4287109375, 2.56475830078125, 2.7008056640625, 2.83685302734375, 2.972900390625, 3.10894775390625, 3.2449951171875, 3.38104248046875, 3.51708984375, 3.65313720703125, 3.7891845703125, 3.92523193359375, 4.061279296875, 4.19732666015625, 4.3333740234375, 4.46942138671875, 4.60546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 6.0, 8.0, 8.0, 15.0, 12.0, 19.0, 23.0, 26.0, 27.0, 33.0, 45.0, 45.0, 38.0, 52.0, 45.0, 43.0, 46.0, 61.0, 61.0, 44.0, 37.0, 47.0, 36.0, 27.0, 32.0, 34.0, 19.0, 24.0, 14.0, 12.0, 8.0, 15.0, 16.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5234375, -1.4725189208984375, -1.421600341796875, -1.3706817626953125, -1.31976318359375, -1.2688446044921875, -1.217926025390625, -1.1670074462890625, -1.1160888671875, -1.0651702880859375, -1.014251708984375, -0.9633331298828125, -0.91241455078125, -0.8614959716796875, -0.810577392578125, -0.7596588134765625, -0.708740234375, -0.6578216552734375, -0.606903076171875, -0.5559844970703125, -0.50506591796875, -0.4541473388671875, -0.403228759765625, -0.3523101806640625, -0.3013916015625, -0.2504730224609375, -0.199554443359375, -0.1486358642578125, -0.09771728515625, -0.0467987060546875, 0.004119873046875, 0.0550384521484375, 0.10595703125, 0.1568756103515625, 0.207794189453125, 0.2587127685546875, 0.30963134765625, 0.3605499267578125, 0.411468505859375, 0.4623870849609375, 0.5133056640625, 0.5642242431640625, 0.615142822265625, 0.6660614013671875, 0.71697998046875, 0.7678985595703125, 0.818817138671875, 0.8697357177734375, 0.920654296875, 0.9715728759765625, 1.022491455078125, 1.0734100341796875, 1.12432861328125, 1.1752471923828125, 1.226165771484375, 1.2770843505859375, 1.3280029296875, 1.3789215087890625, 1.429840087890625, 1.4807586669921875, 1.53167724609375, 1.5825958251953125, 1.633514404296875, 1.6844329833984375, 1.7353515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 2.0, 5.0, 7.0, 9.0, 9.0, 18.0, 20.0, 24.0, 22.0, 60.0, 102.0, 125.0, 281.0, 540.0, 1166.0, 3353.0, 10997.0, 45008.0, 298514.0, 578492.0, 83443.0, 18094.0, 4972.0, 1770.0, 701.0, 327.0, 184.0, 79.0, 72.0, 44.0, 29.0, 21.0, 11.0, 12.0, 11.0, 6.0, 7.0, 0.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.265625, -8.0087890625, -7.751953125, -7.4951171875, -7.23828125, -6.9814453125, -6.724609375, -6.4677734375, -6.2109375, -5.9541015625, -5.697265625, -5.4404296875, -5.18359375, -4.9267578125, -4.669921875, -4.4130859375, -4.15625, -3.8994140625, -3.642578125, -3.3857421875, -3.12890625, -2.8720703125, -2.615234375, -2.3583984375, -2.1015625, -1.8447265625, -1.587890625, -1.3310546875, -1.07421875, -0.8173828125, -0.560546875, -0.3037109375, -0.046875, 0.2099609375, 0.466796875, 0.7236328125, 0.98046875, 1.2373046875, 1.494140625, 1.7509765625, 2.0078125, 2.2646484375, 2.521484375, 2.7783203125, 3.03515625, 3.2919921875, 3.548828125, 3.8056640625, 4.0625, 4.3193359375, 4.576171875, 4.8330078125, 5.08984375, 5.3466796875, 5.603515625, 5.8603515625, 6.1171875, 6.3740234375, 6.630859375, 6.8876953125, 7.14453125, 7.4013671875, 7.658203125, 7.9150390625, 8.171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 8.0, 10.0, 18.0, 22.0, 25.0, 22.0, 41.0, 52.0, 54.0, 73.0, 69.0, 72.0, 68.0, 66.0, 67.0, 56.0, 51.0, 38.0, 38.0, 28.0, 28.0, 19.0, 16.0, 12.0, 15.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.34375, -11.994140625, -11.64453125, -11.294921875, -10.9453125, -10.595703125, -10.24609375, -9.896484375, -9.546875, -9.197265625, -8.84765625, -8.498046875, -8.1484375, -7.798828125, -7.44921875, -7.099609375, -6.75, -6.400390625, -6.05078125, -5.701171875, -5.3515625, -5.001953125, -4.65234375, -4.302734375, -3.953125, -3.603515625, -3.25390625, -2.904296875, -2.5546875, -2.205078125, -1.85546875, -1.505859375, -1.15625, -0.806640625, -0.45703125, -0.107421875, 0.2421875, 0.591796875, 0.94140625, 1.291015625, 1.640625, 1.990234375, 2.33984375, 2.689453125, 3.0390625, 3.388671875, 3.73828125, 4.087890625, 4.4375, 4.787109375, 5.13671875, 5.486328125, 5.8359375, 6.185546875, 6.53515625, 6.884765625, 7.234375, 7.583984375, 7.93359375, 8.283203125, 8.6328125, 8.982421875, 9.33203125, 9.681640625, 10.03125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 6.0, 7.0, 15.0, 48.0, 66.0, 129.0, 321.0, 822.0, 3156.0, 25469.0, 984486.0, 29154.0, 3340.0, 924.0, 335.0, 141.0, 69.0, 29.0, 17.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6640625, -12.2862548828125, -11.908447265625, -11.5306396484375, -11.15283203125, -10.7750244140625, -10.397216796875, -10.0194091796875, -9.6416015625, -9.2637939453125, -8.885986328125, -8.5081787109375, -8.13037109375, -7.7525634765625, -7.374755859375, -6.9969482421875, -6.619140625, -6.2413330078125, -5.863525390625, -5.4857177734375, -5.10791015625, -4.7301025390625, -4.352294921875, -3.9744873046875, -3.5966796875, -3.2188720703125, -2.841064453125, -2.4632568359375, -2.08544921875, -1.7076416015625, -1.329833984375, -0.9520263671875, -0.57421875, -0.1964111328125, 0.181396484375, 0.5592041015625, 0.93701171875, 1.3148193359375, 1.692626953125, 2.0704345703125, 2.4482421875, 2.8260498046875, 3.203857421875, 3.5816650390625, 3.95947265625, 4.3372802734375, 4.715087890625, 5.0928955078125, 5.470703125, 5.8485107421875, 6.226318359375, 6.6041259765625, 6.98193359375, 7.3597412109375, 7.737548828125, 8.1153564453125, 8.4931640625, 8.8709716796875, 9.248779296875, 9.6265869140625, 10.00439453125, 10.3822021484375, 10.760009765625, 11.1378173828125, 11.515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 17.0, 14.0, 27.0, 40.0, 88.0, 149.0, 248.0, 180.0, 111.0, 61.0, 26.0, 9.0, 5.0, 8.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010576248168945312, -0.0010309815406799316, -0.001004338264465332, -0.0009776949882507324, -0.0009510517120361328, -0.0009244084358215332, -0.0008977651596069336, -0.000871121883392334, -0.0008444786071777344, -0.0008178353309631348, -0.0007911920547485352, -0.0007645487785339355, -0.0007379055023193359, -0.0007112622261047363, -0.0006846189498901367, -0.0006579756736755371, -0.0006313323974609375, -0.0006046891212463379, -0.0005780458450317383, -0.0005514025688171387, -0.0005247592926025391, -0.0004981160163879395, -0.00047147274017333984, -0.00044482946395874023, -0.0004181861877441406, -0.000391542911529541, -0.0003648996353149414, -0.0003382563591003418, -0.0003116130828857422, -0.0002849698066711426, -0.00025832653045654297, -0.00023168325424194336, -0.00020503997802734375, -0.00017839670181274414, -0.00015175342559814453, -0.00012511014938354492, -9.846687316894531e-05, -7.18235969543457e-05, -4.5180320739746094e-05, -1.8537044525146484e-05, 8.106231689453125e-06, 3.4749507904052734e-05, 6.139278411865234e-05, 8.803606033325195e-05, 0.00011467933654785156, 0.00014132261276245117, 0.00016796588897705078, 0.0001946091651916504, 0.00022125244140625, 0.0002478957176208496, 0.0002745389938354492, 0.00030118227005004883, 0.00032782554626464844, 0.00035446882247924805, 0.00038111209869384766, 0.00040775537490844727, 0.0004343986511230469, 0.0004610419273376465, 0.0004876852035522461, 0.0005143284797668457, 0.0005409717559814453, 0.0005676150321960449, 0.0005942583084106445, 0.0006209015846252441, 0.0006475448608398438]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 3.0, 8.0, 13.0, 25.0, 49.0, 131.0, 402.0, 1812.0, 14595.0, 929767.0, 96091.0, 4428.0, 833.0, 214.0, 84.0, 40.0, 25.0, 9.0, 7.0, 0.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2578125, -6.924072265625, -6.59033203125, -6.256591796875, -5.9228515625, -5.589111328125, -5.25537109375, -4.921630859375, -4.587890625, -4.254150390625, -3.92041015625, -3.586669921875, -3.2529296875, -2.919189453125, -2.58544921875, -2.251708984375, -1.91796875, -1.584228515625, -1.25048828125, -0.916748046875, -0.5830078125, -0.249267578125, 0.08447265625, 0.418212890625, 0.751953125, 1.085693359375, 1.41943359375, 1.753173828125, 2.0869140625, 2.420654296875, 2.75439453125, 3.088134765625, 3.421875, 3.755615234375, 4.08935546875, 4.423095703125, 4.7568359375, 5.090576171875, 5.42431640625, 5.758056640625, 6.091796875, 6.425537109375, 6.75927734375, 7.093017578125, 7.4267578125, 7.760498046875, 8.09423828125, 8.427978515625, 8.76171875, 9.095458984375, 9.42919921875, 9.762939453125, 10.0966796875, 10.430419921875, 10.76416015625, 11.097900390625, 11.431640625, 11.765380859375, 12.09912109375, 12.432861328125, 12.7666015625, 13.100341796875, 13.43408203125, 13.767822265625, 14.1015625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 13.0, 11.0, 33.0, 36.0, 78.0, 112.0, 214.0, 185.0, 101.0, 66.0, 43.0, 27.0, 13.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.233642578125, -5.02197265625, -4.810302734375, -4.5986328125, -4.386962890625, -4.17529296875, -3.963623046875, -3.751953125, -3.540283203125, -3.32861328125, -3.116943359375, -2.9052734375, -2.693603515625, -2.48193359375, -2.270263671875, -2.05859375, -1.846923828125, -1.63525390625, -1.423583984375, -1.2119140625, -1.000244140625, -0.78857421875, -0.576904296875, -0.365234375, -0.153564453125, 0.05810546875, 0.269775390625, 0.4814453125, 0.693115234375, 0.90478515625, 1.116455078125, 1.328125, 1.539794921875, 1.75146484375, 1.963134765625, 2.1748046875, 2.386474609375, 2.59814453125, 2.809814453125, 3.021484375, 3.233154296875, 3.44482421875, 3.656494140625, 3.8681640625, 4.079833984375, 4.29150390625, 4.503173828125, 4.71484375, 4.926513671875, 5.13818359375, 5.349853515625, 5.5615234375, 5.773193359375, 5.98486328125, 6.196533203125, 6.408203125, 6.619873046875, 6.83154296875, 7.043212890625, 7.2548828125, 7.466552734375, 7.67822265625, 7.889892578125, 8.1015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 14.0, 68.0, 242.0, 460.0, 166.0, 47.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.6890411376953, -177.04290771484375, -171.39678955078125, -165.7506561279297, -160.10452270507812, -154.45840454101562, -148.81227111816406, -143.1661376953125, -137.52001953125, -131.87388610839844, -126.22776794433594, -120.58163452148438, -114.93550872802734, -109.28938293457031, -103.64324951171875, -97.99712371826172, -92.35099792480469, -86.70487213134766, -81.05874633789062, -75.41261291503906, -69.76648712158203, -64.120361328125, -58.4742317199707, -52.828102111816406, -47.181976318359375, -41.535850524902344, -35.88972091674805, -30.243593215942383, -24.59746551513672, -18.951337814331055, -13.30521011352539, -7.659080505371094, -2.0129547119140625, 3.6331729888916016, 9.279300689697266, 14.92542839050293, 20.571556091308594, 26.217683792114258, 31.863811492919922, 37.50994110107422, 43.15606689453125, 48.80219268798828, 54.44832229614258, 60.094451904296875, 65.7405776977539, 71.38670349121094, 77.0328369140625, 82.67896270751953, 88.32508850097656, 93.9712142944336, 99.61734008789062, 105.26347351074219, 110.90959930419922, 116.55572509765625, 122.20185852050781, 127.84798431396484, 133.49411010742188, 139.14024353027344, 144.78636169433594, 150.4324951171875, 156.07861328125, 161.72474670410156, 167.37088012695312, 173.01699829101562, 178.6631317138672]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 5.0, 1.0, 2.0, 8.0, 5.0, 6.0, 11.0, 14.0, 11.0, 13.0, 14.0, 26.0, 27.0, 26.0, 29.0, 34.0, 46.0, 30.0, 43.0, 27.0, 57.0, 58.0, 43.0, 45.0, 34.0, 42.0, 52.0, 58.0, 33.0, 34.0, 26.0, 24.0, 18.0, 18.0, 15.0, 14.0, 16.0, 10.0, 5.0, 4.0, 7.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.800453186035156, -45.3001823425293, -43.79991149902344, -42.29964065551758, -40.79936981201172, -39.299095153808594, -37.798824310302734, -36.298553466796875, -34.798282623291016, -33.298011779785156, -31.797740936279297, -30.297468185424805, -28.797197341918945, -27.296926498413086, -25.796653747558594, -24.296382904052734, -22.796112060546875, -21.295841217041016, -19.795570373535156, -18.295297622680664, -16.795026779174805, -15.294755935668945, -13.79448413848877, -12.294212341308594, -10.793941497802734, -9.293670654296875, -7.793398857116699, -6.293127536773682, -4.792856216430664, -3.2925848960876465, -1.792313575744629, -0.2920417785644531, 1.2082290649414062, 2.708500385284424, 4.208771705627441, 5.709043025970459, 7.209314346313477, 8.709585189819336, 10.209856986999512, 11.710128784179688, 13.210399627685547, 14.710670471191406, 16.210941314697266, 17.711214065551758, 19.211484909057617, 20.711755752563477, 22.21202850341797, 23.712299346923828, 25.212570190429688, 26.712841033935547, 28.213111877441406, 29.7133846282959, 31.213655471801758, 32.71392822265625, 34.21419906616211, 35.71446990966797, 37.21474075317383, 38.71501159667969, 40.21528244018555, 41.715553283691406, 43.21582794189453, 44.71609878540039, 46.21636962890625, 47.71664047241211, 49.21691131591797]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 15.0, 17.0, 19.0, 34.0, 49.0, 63.0, 94.0, 145.0, 194.0, 255.0, 406.0, 648.0, 946.0, 1591.0, 2804.0, 5072.0, 9900.0, 21853.0, 61831.0, 576853.0, 3379351.0, 80844.0, 26209.0, 11314.0, 5762.0, 3111.0, 1739.0, 1073.0, 640.0, 454.0, 291.0, 188.0, 147.0, 98.0, 80.0, 55.0, 32.0, 26.0, 19.0, 15.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.609375, -5.43463134765625, -5.2598876953125, -5.08514404296875, -4.910400390625, -4.73565673828125, -4.5609130859375, -4.38616943359375, -4.21142578125, -4.03668212890625, -3.8619384765625, -3.68719482421875, -3.512451171875, -3.33770751953125, -3.1629638671875, -2.98822021484375, -2.8134765625, -2.63873291015625, -2.4639892578125, -2.28924560546875, -2.114501953125, -1.93975830078125, -1.7650146484375, -1.59027099609375, -1.41552734375, -1.24078369140625, -1.0660400390625, -0.89129638671875, -0.716552734375, -0.54180908203125, -0.3670654296875, -0.19232177734375, -0.017578125, 0.15716552734375, 0.3319091796875, 0.50665283203125, 0.681396484375, 0.85614013671875, 1.0308837890625, 1.20562744140625, 1.38037109375, 1.55511474609375, 1.7298583984375, 1.90460205078125, 2.079345703125, 2.25408935546875, 2.4288330078125, 2.60357666015625, 2.7783203125, 2.95306396484375, 3.1278076171875, 3.30255126953125, 3.477294921875, 3.65203857421875, 3.8267822265625, 4.00152587890625, 4.17626953125, 4.35101318359375, 4.5257568359375, 4.70050048828125, 4.875244140625, 5.04998779296875, 5.2247314453125, 5.39947509765625, 5.57421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 6.0, 4.0, 8.0, 12.0, 14.0, 15.0, 16.0, 28.0, 23.0, 24.0, 31.0, 38.0, 39.0, 42.0, 36.0, 36.0, 42.0, 50.0, 51.0, 40.0, 42.0, 51.0, 52.0, 49.0, 30.0, 34.0, 25.0, 31.0, 14.0, 25.0, 13.0, 17.0, 13.0, 4.0, 10.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.125, -2.059295654296875, -1.99359130859375, -1.927886962890625, -1.8621826171875, -1.796478271484375, -1.73077392578125, -1.665069580078125, -1.599365234375, -1.533660888671875, -1.46795654296875, -1.402252197265625, -1.3365478515625, -1.270843505859375, -1.20513916015625, -1.139434814453125, -1.07373046875, -1.008026123046875, -0.94232177734375, -0.876617431640625, -0.8109130859375, -0.745208740234375, -0.67950439453125, -0.613800048828125, -0.548095703125, -0.482391357421875, -0.41668701171875, -0.350982666015625, -0.2852783203125, -0.219573974609375, -0.15386962890625, -0.088165283203125, -0.0224609375, 0.043243408203125, 0.10894775390625, 0.174652099609375, 0.2403564453125, 0.306060791015625, 0.37176513671875, 0.437469482421875, 0.503173828125, 0.568878173828125, 0.63458251953125, 0.700286865234375, 0.7659912109375, 0.831695556640625, 0.89739990234375, 0.963104248046875, 1.02880859375, 1.094512939453125, 1.16021728515625, 1.225921630859375, 1.2916259765625, 1.357330322265625, 1.42303466796875, 1.488739013671875, 1.554443359375, 1.620147705078125, 1.68585205078125, 1.751556396484375, 1.8172607421875, 1.882965087890625, 1.94866943359375, 2.014373779296875, 2.080078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 11.0, 26.0, 18.0, 46.0, 75.0, 100.0, 221.0, 411.0, 757.0, 1668.0, 4466.0, 18250.0, 221368.0, 3890456.0, 43861.0, 7749.0, 2537.0, 1076.0, 551.0, 263.0, 146.0, 98.0, 48.0, 33.0, 18.0, 7.0, 10.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1171875, -13.6341552734375, -13.151123046875, -12.6680908203125, -12.18505859375, -11.7020263671875, -11.218994140625, -10.7359619140625, -10.2529296875, -9.7698974609375, -9.286865234375, -8.8038330078125, -8.32080078125, -7.8377685546875, -7.354736328125, -6.8717041015625, -6.388671875, -5.9056396484375, -5.422607421875, -4.9395751953125, -4.45654296875, -3.9735107421875, -3.490478515625, -3.0074462890625, -2.5244140625, -2.0413818359375, -1.558349609375, -1.0753173828125, -0.59228515625, -0.1092529296875, 0.373779296875, 0.8568115234375, 1.33984375, 1.8228759765625, 2.305908203125, 2.7889404296875, 3.27197265625, 3.7550048828125, 4.238037109375, 4.7210693359375, 5.2041015625, 5.6871337890625, 6.170166015625, 6.6531982421875, 7.13623046875, 7.6192626953125, 8.102294921875, 8.5853271484375, 9.068359375, 9.5513916015625, 10.034423828125, 10.5174560546875, 11.00048828125, 11.4835205078125, 11.966552734375, 12.4495849609375, 12.9326171875, 13.4156494140625, 13.898681640625, 14.3817138671875, 14.86474609375, 15.3477783203125, 15.830810546875, 16.3138427734375, 16.796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 9.0, 24.0, 34.0, 61.0, 162.0, 2276.0, 1209.0, 137.0, 45.0, 38.0, 13.0, 20.0, 8.0, 6.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.052490234375, -7.79248046875, -7.532470703125, -7.2724609375, -7.012451171875, -6.75244140625, -6.492431640625, -6.232421875, -5.972412109375, -5.71240234375, -5.452392578125, -5.1923828125, -4.932373046875, -4.67236328125, -4.412353515625, -4.15234375, -3.892333984375, -3.63232421875, -3.372314453125, -3.1123046875, -2.852294921875, -2.59228515625, -2.332275390625, -2.072265625, -1.812255859375, -1.55224609375, -1.292236328125, -1.0322265625, -0.772216796875, -0.51220703125, -0.252197265625, 0.0078125, 0.267822265625, 0.52783203125, 0.787841796875, 1.0478515625, 1.307861328125, 1.56787109375, 1.827880859375, 2.087890625, 2.347900390625, 2.60791015625, 2.867919921875, 3.1279296875, 3.387939453125, 3.64794921875, 3.907958984375, 4.16796875, 4.427978515625, 4.68798828125, 4.947998046875, 5.2080078125, 5.468017578125, 5.72802734375, 5.988037109375, 6.248046875, 6.508056640625, 6.76806640625, 7.028076171875, 7.2880859375, 7.548095703125, 7.80810546875, 8.068115234375, 8.328125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 32.0, 79.0, 211.0, 332.0, 226.0, 76.0, 20.0, 11.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.95905303955078, -45.25733947753906, -43.555625915527344, -41.853912353515625, -40.15220260620117, -38.45048904418945, -36.748775482177734, -35.047061920166016, -33.34535217285156, -31.643638610839844, -29.941926956176758, -28.24021339416504, -26.538501739501953, -24.836788177490234, -23.135074615478516, -21.433361053466797, -19.731647491455078, -18.02993392944336, -16.328222274780273, -14.626508712768555, -12.924796104431152, -11.22308349609375, -9.521369934082031, -7.819657325744629, -6.117944717407227, -4.416232109069824, -2.7145190238952637, -1.0128059387207031, 0.6889066696166992, 2.3906192779541016, 4.09233283996582, 5.794045448303223, 7.495758056640625, 9.197470664978027, 10.89918327331543, 12.600896835327148, 14.30260944366455, 16.004322052001953, 17.706035614013672, 19.40774917602539, 21.109460830688477, 22.811174392700195, 24.51288604736328, 26.214599609375, 27.91631317138672, 29.618024826049805, 31.319738388061523, 33.02145004272461, 34.72316360473633, 36.42487716674805, 38.126590728759766, 39.82830047607422, 41.53001403808594, 43.231727600097656, 44.933441162109375, 46.635154724121094, 48.33686828613281, 50.03858184814453, 51.74029541015625, 53.44200897216797, 55.14371871948242, 56.84543228149414, 58.54714584350586, 60.24885940551758, 61.95056915283203]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 9.0, 11.0, 5.0, 15.0, 19.0, 18.0, 17.0, 24.0, 16.0, 28.0, 27.0, 31.0, 46.0, 33.0, 51.0, 49.0, 46.0, 47.0, 38.0, 41.0, 38.0, 58.0, 47.0, 40.0, 34.0, 26.0, 29.0, 28.0, 20.0, 21.0, 22.0, 11.0, 11.0, 7.0, 13.0, 6.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-17.317501068115234, -16.852710723876953, -16.38791847229004, -15.923128128051758, -15.45833683013916, -14.993545532226562, -14.528755187988281, -14.063963890075684, -13.599172592163086, -13.134381294250488, -12.669590950012207, -12.20479965209961, -11.740008354187012, -11.275217056274414, -10.810426712036133, -10.345635414123535, -9.880845069885254, -9.416053771972656, -8.951263427734375, -8.486472129821777, -8.02168083190918, -7.55689001083374, -7.092099189758301, -6.627307891845703, -6.162517070770264, -5.697726249694824, -5.232934951782227, -4.768144130706787, -4.303353309631348, -3.83856201171875, -3.3737711906433105, -2.908980131149292, -2.4441890716552734, -1.9793980121612549, -1.5146070718765259, -1.0498161315917969, -0.5850250720977783, -0.12023401260375977, 0.3445568084716797, 0.8093478679656982, 1.2741389274597168, 1.7389299869537354, 2.203721046447754, 2.6685118675231934, 3.133302927017212, 3.5980939865112305, 4.06288480758667, 4.527675628662109, 4.992466926574707, 5.4572577476501465, 5.922049045562744, 6.386839866638184, 6.851631164550781, 7.316421985626221, 7.78121280670166, 8.246004104614258, 8.710794448852539, 9.175585746765137, 9.640376091003418, 10.105167388916016, 10.569958686828613, 11.034749984741211, 11.499540328979492, 11.96433162689209, 12.429122924804688]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 7.0, 6.0, 12.0, 9.0, 10.0, 24.0, 28.0, 44.0, 79.0, 89.0, 139.0, 200.0, 337.0, 466.0, 657.0, 1029.0, 1437.0, 2072.0, 3096.0, 4934.0, 7589.0, 11988.0, 19369.0, 32224.0, 55589.0, 100417.0, 183773.0, 245224.0, 162626.0, 88236.0, 49128.0, 28849.0, 17602.0, 10865.0, 7018.0, 4292.0, 2976.0, 1965.0, 1353.0, 897.0, 600.0, 439.0, 269.0, 173.0, 109.0, 110.0, 67.0, 50.0, 23.0, 24.0, 12.0, 7.0, 12.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.591796875, -3.477386474609375, -3.36297607421875, -3.248565673828125, -3.1341552734375, -3.019744873046875, -2.90533447265625, -2.790924072265625, -2.676513671875, -2.562103271484375, -2.44769287109375, -2.333282470703125, -2.2188720703125, -2.104461669921875, -1.99005126953125, -1.875640869140625, -1.76123046875, -1.646820068359375, -1.53240966796875, -1.417999267578125, -1.3035888671875, -1.189178466796875, -1.07476806640625, -0.960357666015625, -0.845947265625, -0.731536865234375, -0.61712646484375, -0.502716064453125, -0.3883056640625, -0.273895263671875, -0.15948486328125, -0.045074462890625, 0.0693359375, 0.183746337890625, 0.29815673828125, 0.412567138671875, 0.5269775390625, 0.641387939453125, 0.75579833984375, 0.870208740234375, 0.984619140625, 1.099029541015625, 1.21343994140625, 1.327850341796875, 1.4422607421875, 1.556671142578125, 1.67108154296875, 1.785491943359375, 1.89990234375, 2.014312744140625, 2.12872314453125, 2.243133544921875, 2.3575439453125, 2.471954345703125, 2.58636474609375, 2.700775146484375, 2.815185546875, 2.929595947265625, 3.04400634765625, 3.158416748046875, 3.2728271484375, 3.387237548828125, 3.50164794921875, 3.616058349609375, 3.73046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 5.0, 10.0, 10.0, 13.0, 20.0, 15.0, 20.0, 27.0, 20.0, 26.0, 35.0, 34.0, 34.0, 44.0, 41.0, 35.0, 50.0, 42.0, 50.0, 49.0, 39.0, 49.0, 36.0, 36.0, 39.0, 30.0, 27.0, 30.0, 25.0, 20.0, 13.0, 10.0, 11.0, 6.0, 8.0, 6.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.359375, -2.287689208984375, -2.21600341796875, -2.144317626953125, -2.0726318359375, -2.000946044921875, -1.92926025390625, -1.857574462890625, -1.785888671875, -1.714202880859375, -1.64251708984375, -1.570831298828125, -1.4991455078125, -1.427459716796875, -1.35577392578125, -1.284088134765625, -1.21240234375, -1.140716552734375, -1.06903076171875, -0.997344970703125, -0.9256591796875, -0.853973388671875, -0.78228759765625, -0.710601806640625, -0.638916015625, -0.567230224609375, -0.49554443359375, -0.423858642578125, -0.3521728515625, -0.280487060546875, -0.20880126953125, -0.137115478515625, -0.0654296875, 0.006256103515625, 0.07794189453125, 0.149627685546875, 0.2213134765625, 0.292999267578125, 0.36468505859375, 0.436370849609375, 0.508056640625, 0.579742431640625, 0.65142822265625, 0.723114013671875, 0.7947998046875, 0.866485595703125, 0.93817138671875, 1.009857177734375, 1.08154296875, 1.153228759765625, 1.22491455078125, 1.296600341796875, 1.3682861328125, 1.439971923828125, 1.51165771484375, 1.583343505859375, 1.655029296875, 1.726715087890625, 1.79840087890625, 1.870086669921875, 1.9417724609375, 2.013458251953125, 2.08514404296875, 2.156829833984375, 2.228515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 20.0, 30.0, 25.0, 46.0, 69.0, 114.0, 186.0, 337.0, 576.0, 1051.0, 2020.0, 4441.0, 10252.0, 26730.0, 83066.0, 332452.0, 425511.0, 106133.0, 33138.0, 12194.0, 4977.0, 2426.0, 1201.0, 623.0, 388.0, 187.0, 127.0, 55.0, 43.0, 28.0, 24.0, 13.0, 11.0, 11.0, 8.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.9609375, -8.690185546875, -8.41943359375, -8.148681640625, -7.8779296875, -7.607177734375, -7.33642578125, -7.065673828125, -6.794921875, -6.524169921875, -6.25341796875, -5.982666015625, -5.7119140625, -5.441162109375, -5.17041015625, -4.899658203125, -4.62890625, -4.358154296875, -4.08740234375, -3.816650390625, -3.5458984375, -3.275146484375, -3.00439453125, -2.733642578125, -2.462890625, -2.192138671875, -1.92138671875, -1.650634765625, -1.3798828125, -1.109130859375, -0.83837890625, -0.567626953125, -0.296875, -0.026123046875, 0.24462890625, 0.515380859375, 0.7861328125, 1.056884765625, 1.32763671875, 1.598388671875, 1.869140625, 2.139892578125, 2.41064453125, 2.681396484375, 2.9521484375, 3.222900390625, 3.49365234375, 3.764404296875, 4.03515625, 4.305908203125, 4.57666015625, 4.847412109375, 5.1181640625, 5.388916015625, 5.65966796875, 5.930419921875, 6.201171875, 6.471923828125, 6.74267578125, 7.013427734375, 7.2841796875, 7.554931640625, 7.82568359375, 8.096435546875, 8.3671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 5.0, 6.0, 10.0, 10.0, 20.0, 18.0, 25.0, 33.0, 28.0, 37.0, 40.0, 53.0, 38.0, 57.0, 60.0, 65.0, 57.0, 50.0, 50.0, 45.0, 53.0, 43.0, 46.0, 24.0, 20.0, 20.0, 14.0, 13.0, 9.0, 12.0, 11.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.3125, -17.813232421875, -17.31396484375, -16.814697265625, -16.3154296875, -15.816162109375, -15.31689453125, -14.817626953125, -14.318359375, -13.819091796875, -13.31982421875, -12.820556640625, -12.3212890625, -11.822021484375, -11.32275390625, -10.823486328125, -10.32421875, -9.824951171875, -9.32568359375, -8.826416015625, -8.3271484375, -7.827880859375, -7.32861328125, -6.829345703125, -6.330078125, -5.830810546875, -5.33154296875, -4.832275390625, -4.3330078125, -3.833740234375, -3.33447265625, -2.835205078125, -2.3359375, -1.836669921875, -1.33740234375, -0.838134765625, -0.3388671875, 0.160400390625, 0.65966796875, 1.158935546875, 1.658203125, 2.157470703125, 2.65673828125, 3.156005859375, 3.6552734375, 4.154541015625, 4.65380859375, 5.153076171875, 5.65234375, 6.151611328125, 6.65087890625, 7.150146484375, 7.6494140625, 8.148681640625, 8.64794921875, 9.147216796875, 9.646484375, 10.145751953125, 10.64501953125, 11.144287109375, 11.6435546875, 12.142822265625, 12.64208984375, 13.141357421875, 13.640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 14.0, 17.0, 8.0, 29.0, 41.0, 74.0, 115.0, 209.0, 470.0, 1207.0, 4951.0, 33603.0, 569768.0, 407265.0, 24998.0, 3853.0, 1034.0, 421.0, 218.0, 110.0, 57.0, 34.0, 24.0, 14.0, 10.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.1812744140625, -7.932861328125, -7.6844482421875, -7.43603515625, -7.1876220703125, -6.939208984375, -6.6907958984375, -6.4423828125, -6.1939697265625, -5.945556640625, -5.6971435546875, -5.44873046875, -5.2003173828125, -4.951904296875, -4.7034912109375, -4.455078125, -4.2066650390625, -3.958251953125, -3.7098388671875, -3.46142578125, -3.2130126953125, -2.964599609375, -2.7161865234375, -2.4677734375, -2.2193603515625, -1.970947265625, -1.7225341796875, -1.47412109375, -1.2257080078125, -0.977294921875, -0.7288818359375, -0.48046875, -0.2320556640625, 0.016357421875, 0.2647705078125, 0.51318359375, 0.7615966796875, 1.010009765625, 1.2584228515625, 1.5068359375, 1.7552490234375, 2.003662109375, 2.2520751953125, 2.50048828125, 2.7489013671875, 2.997314453125, 3.2457275390625, 3.494140625, 3.7425537109375, 3.990966796875, 4.2393798828125, 4.48779296875, 4.7362060546875, 4.984619140625, 5.2330322265625, 5.4814453125, 5.7298583984375, 5.978271484375, 6.2266845703125, 6.47509765625, 6.7235107421875, 6.971923828125, 7.2203369140625, 7.46875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 10.0, 29.0, 36.0, 50.0, 128.0, 163.0, 185.0, 128.0, 108.0, 73.0, 37.0, 27.0, 8.0, 5.0, 9.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005888938903808594, -0.0005531683564186096, -0.0005174428224563599, -0.0004817172884941101, -0.00044599175453186035, -0.0004102662205696106, -0.00037454068660736084, -0.0003388151526451111, -0.00030308961868286133, -0.00026736408472061157, -0.00023163855075836182, -0.00019591301679611206, -0.0001601874828338623, -0.00012446194887161255, -8.873641490936279e-05, -5.301088094711304e-05, -1.728534698486328e-05, 1.8440186977386475e-05, 5.416572093963623e-05, 8.989125490188599e-05, 0.00012561678886413574, 0.0001613423228263855, 0.00019706785678863525, 0.000232793390750885, 0.00026851892471313477, 0.0003042444586753845, 0.0003399699926376343, 0.00037569552659988403, 0.0004114210605621338, 0.00044714659452438354, 0.0004828721284866333, 0.0005185976624488831, 0.0005543231964111328, 0.0005900487303733826, 0.0006257742643356323, 0.0006614997982978821, 0.0006972253322601318, 0.0007329508662223816, 0.0007686764001846313, 0.0008044019341468811, 0.0008401274681091309, 0.0008758530020713806, 0.0009115785360336304, 0.0009473040699958801, 0.0009830296039581299, 0.0010187551379203796, 0.0010544806718826294, 0.0010902062058448792, 0.001125931739807129, 0.0011616572737693787, 0.0011973828077316284, 0.0012331083416938782, 0.001268833875656128, 0.0013045594096183777, 0.0013402849435806274, 0.0013760104775428772, 0.001411736011505127, 0.0014474615454673767, 0.0014831870794296265, 0.0015189126133918762, 0.001554638147354126, 0.0015903636813163757, 0.0016260892152786255, 0.0016618147492408752, 0.001697540283203125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 10.0, 4.0, 11.0, 11.0, 20.0, 25.0, 36.0, 63.0, 93.0, 138.0, 262.0, 513.0, 1476.0, 5098.0, 25700.0, 221730.0, 671279.0, 102291.0, 14443.0, 3395.0, 1006.0, 413.0, 208.0, 115.0, 65.0, 52.0, 40.0, 27.0, 14.0, 10.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21875, -4.0379638671875, -3.857177734375, -3.6763916015625, -3.49560546875, -3.3148193359375, -3.134033203125, -2.9532470703125, -2.7724609375, -2.5916748046875, -2.410888671875, -2.2301025390625, -2.04931640625, -1.8685302734375, -1.687744140625, -1.5069580078125, -1.326171875, -1.1453857421875, -0.964599609375, -0.7838134765625, -0.60302734375, -0.4222412109375, -0.241455078125, -0.0606689453125, 0.1201171875, 0.3009033203125, 0.481689453125, 0.6624755859375, 0.84326171875, 1.0240478515625, 1.204833984375, 1.3856201171875, 1.56640625, 1.7471923828125, 1.927978515625, 2.1087646484375, 2.28955078125, 2.4703369140625, 2.651123046875, 2.8319091796875, 3.0126953125, 3.1934814453125, 3.374267578125, 3.5550537109375, 3.73583984375, 3.9166259765625, 4.097412109375, 4.2781982421875, 4.458984375, 4.6397705078125, 4.820556640625, 5.0013427734375, 5.18212890625, 5.3629150390625, 5.543701171875, 5.7244873046875, 5.9052734375, 6.0860595703125, 6.266845703125, 6.4476318359375, 6.62841796875, 6.8092041015625, 6.989990234375, 7.1707763671875, 7.3515625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 7.0, 7.0, 19.0, 35.0, 44.0, 72.0, 101.0, 129.0, 163.0, 125.0, 101.0, 66.0, 42.0, 28.0, 30.0, 10.0, 6.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6796875, -12.37432861328125, -12.0689697265625, -11.76361083984375, -11.458251953125, -11.15289306640625, -10.8475341796875, -10.54217529296875, -10.23681640625, -9.93145751953125, -9.6260986328125, -9.32073974609375, -9.015380859375, -8.71002197265625, -8.4046630859375, -8.09930419921875, -7.7939453125, -7.48858642578125, -7.1832275390625, -6.87786865234375, -6.572509765625, -6.26715087890625, -5.9617919921875, -5.65643310546875, -5.35107421875, -5.04571533203125, -4.7403564453125, -4.43499755859375, -4.129638671875, -3.82427978515625, -3.5189208984375, -3.21356201171875, -2.908203125, -2.60284423828125, -2.2974853515625, -1.99212646484375, -1.686767578125, -1.38140869140625, -1.0760498046875, -0.77069091796875, -0.46533203125, -0.15997314453125, 0.1453857421875, 0.45074462890625, 0.756103515625, 1.06146240234375, 1.3668212890625, 1.67218017578125, 1.9775390625, 2.28289794921875, 2.5882568359375, 2.89361572265625, 3.198974609375, 3.50433349609375, 3.8096923828125, 4.11505126953125, 4.42041015625, 4.72576904296875, 5.0311279296875, 5.33648681640625, 5.641845703125, 5.94720458984375, 6.2525634765625, 6.55792236328125, 6.86328125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 12.0, 14.0, 28.0, 69.0, 175.0, 277.0, 216.0, 123.0, 48.0, 22.0, 12.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.73076629638672, -59.09770584106445, -54.46464157104492, -49.831581115722656, -45.198516845703125, -40.56545639038086, -35.932395935058594, -31.299331665039062, -26.666271209716797, -22.0332088470459, -17.400146484375, -12.767086029052734, -8.134023666381836, -3.5009613037109375, 1.1320991516113281, 5.765163421630859, 10.398223876953125, 15.031286239624023, 19.664348602294922, 24.297409057617188, 28.930471420288086, 33.563533782958984, 38.19659423828125, 42.82965850830078, 47.46271896362305, 52.09577941894531, 56.728843688964844, 61.36190414428711, 65.99496459960938, 70.6280288696289, 75.26109313964844, 79.89414978027344, 84.5272216796875, 89.16028594970703, 93.79334259033203, 98.42640686035156, 103.0594711303711, 107.69253540039062, 112.32559204101562, 116.95865631103516, 121.59172058105469, 126.22478485107422, 130.85784912109375, 135.49090576171875, 140.12396240234375, 144.7570343017578, 149.3900909423828, 154.02316284179688, 158.65621948242188, 163.28927612304688, 167.92234802246094, 172.55540466308594, 177.18846130371094, 181.821533203125, 186.45458984375, 191.087646484375, 195.720703125, 200.353759765625, 204.98683166503906, 209.61988830566406, 214.25294494628906, 218.88601684570312, 223.51907348632812, 228.15213012695312, 232.7852020263672]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 8.0, 11.0, 13.0, 12.0, 13.0, 12.0, 8.0, 24.0, 25.0, 32.0, 27.0, 29.0, 33.0, 37.0, 39.0, 38.0, 56.0, 47.0, 45.0, 49.0, 47.0, 55.0, 43.0, 29.0, 32.0, 40.0, 31.0, 24.0, 16.0, 26.0, 20.0, 15.0, 13.0, 9.0, 5.0, 5.0, 4.0, 4.0, 7.0, 1.0, 0.0, 2.0, 2.0, 4.0], "bins": [-89.3072509765625, -86.95874786376953, -84.61024475097656, -82.26174926757812, -79.91324615478516, -77.56474304199219, -75.21623992919922, -72.86773681640625, -70.51923370361328, -68.17073059082031, -65.82222747802734, -63.47372817993164, -61.12522506713867, -58.77672576904297, -56.42822265625, -54.07971954345703, -51.73122024536133, -49.38271713256836, -47.034217834472656, -44.68571472167969, -42.33721160888672, -39.98870849609375, -37.64020919799805, -35.29170608520508, -32.943206787109375, -30.59470558166504, -28.24620246887207, -25.897701263427734, -23.549198150634766, -21.20069694519043, -18.852195739746094, -16.503692626953125, -14.15518569946289, -11.806683540344238, -9.458181381225586, -7.10968017578125, -4.761178016662598, -2.4126758575439453, -0.06417465209960938, 2.2843284606933594, 4.632829666137695, 6.981331825256348, 9.329833984375, 11.678335189819336, 14.026837348937988, 16.37533950805664, 18.723840713500977, 21.072343826293945, 23.42084503173828, 25.769346237182617, 28.117849349975586, 30.466350555419922, 32.81485366821289, 35.163352966308594, 37.51185607910156, 39.86035919189453, 42.2088623046875, 44.55736541748047, 46.90586471557617, 49.25436782836914, 51.60287094116211, 53.95137023925781, 56.29987335205078, 58.64837646484375, 60.99687576293945]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 4.0, 13.0, 5.0, 11.0, 12.0, 14.0, 22.0, 22.0, 38.0, 42.0, 58.0, 92.0, 153.0, 261.0, 520.0, 1108.0, 2417.0, 6213.0, 34678.0, 4122899.0, 17330.0, 4526.0, 1958.0, 875.0, 409.0, 205.0, 99.0, 77.0, 47.0, 34.0, 24.0, 25.0, 18.0, 13.0, 14.0, 10.0, 15.0, 7.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.46875, -12.071044921875, -11.67333984375, -11.275634765625, -10.8779296875, -10.480224609375, -10.08251953125, -9.684814453125, -9.287109375, -8.889404296875, -8.49169921875, -8.093994140625, -7.6962890625, -7.298583984375, -6.90087890625, -6.503173828125, -6.10546875, -5.707763671875, -5.31005859375, -4.912353515625, -4.5146484375, -4.116943359375, -3.71923828125, -3.321533203125, -2.923828125, -2.526123046875, -2.12841796875, -1.730712890625, -1.3330078125, -0.935302734375, -0.53759765625, -0.139892578125, 0.2578125, 0.655517578125, 1.05322265625, 1.450927734375, 1.8486328125, 2.246337890625, 2.64404296875, 3.041748046875, 3.439453125, 3.837158203125, 4.23486328125, 4.632568359375, 5.0302734375, 5.427978515625, 5.82568359375, 6.223388671875, 6.62109375, 7.018798828125, 7.41650390625, 7.814208984375, 8.2119140625, 8.609619140625, 9.00732421875, 9.405029296875, 9.802734375, 10.200439453125, 10.59814453125, 10.995849609375, 11.3935546875, 11.791259765625, 12.18896484375, 12.586669921875, 12.984375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 12.0, 12.0, 11.0, 8.0, 10.0, 14.0, 25.0, 25.0, 37.0, 46.0, 44.0, 52.0, 50.0, 58.0, 42.0, 60.0, 53.0, 49.0, 54.0, 55.0, 54.0, 38.0, 25.0, 33.0, 23.0, 21.0, 20.0, 17.0, 8.0, 9.0, 6.0, 10.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.271240234375, -4.14404296875, -4.016845703125, -3.8896484375, -3.762451171875, -3.63525390625, -3.508056640625, -3.380859375, -3.253662109375, -3.12646484375, -2.999267578125, -2.8720703125, -2.744873046875, -2.61767578125, -2.490478515625, -2.36328125, -2.236083984375, -2.10888671875, -1.981689453125, -1.8544921875, -1.727294921875, -1.60009765625, -1.472900390625, -1.345703125, -1.218505859375, -1.09130859375, -0.964111328125, -0.8369140625, -0.709716796875, -0.58251953125, -0.455322265625, -0.328125, -0.200927734375, -0.07373046875, 0.053466796875, 0.1806640625, 0.307861328125, 0.43505859375, 0.562255859375, 0.689453125, 0.816650390625, 0.94384765625, 1.071044921875, 1.1982421875, 1.325439453125, 1.45263671875, 1.579833984375, 1.70703125, 1.834228515625, 1.96142578125, 2.088623046875, 2.2158203125, 2.343017578125, 2.47021484375, 2.597412109375, 2.724609375, 2.851806640625, 2.97900390625, 3.106201171875, 3.2333984375, 3.360595703125, 3.48779296875, 3.614990234375, 3.7421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 2.0, 3.0, 8.0, 16.0, 13.0, 20.0, 30.0, 32.0, 56.0, 89.0, 106.0, 223.0, 541.0, 1276.0, 4219.0, 72932.0, 4105515.0, 6137.0, 1736.0, 610.0, 278.0, 149.0, 80.0, 53.0, 45.0, 20.0, 19.0, 13.0, 15.0, 16.0, 5.0, 9.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.1875, -30.955078125, -29.72265625, -28.490234375, -27.2578125, -26.025390625, -24.79296875, -23.560546875, -22.328125, -21.095703125, -19.86328125, -18.630859375, -17.3984375, -16.166015625, -14.93359375, -13.701171875, -12.46875, -11.236328125, -10.00390625, -8.771484375, -7.5390625, -6.306640625, -5.07421875, -3.841796875, -2.609375, -1.376953125, -0.14453125, 1.087890625, 2.3203125, 3.552734375, 4.78515625, 6.017578125, 7.25, 8.482421875, 9.71484375, 10.947265625, 12.1796875, 13.412109375, 14.64453125, 15.876953125, 17.109375, 18.341796875, 19.57421875, 20.806640625, 22.0390625, 23.271484375, 24.50390625, 25.736328125, 26.96875, 28.201171875, 29.43359375, 30.666015625, 31.8984375, 33.130859375, 34.36328125, 35.595703125, 36.828125, 38.060546875, 39.29296875, 40.525390625, 41.7578125, 42.990234375, 44.22265625, 45.455078125, 46.6875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 6.0, 13.0, 40.0, 3903.0, 78.0, 22.0, 8.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.7308349609375, -4.461669921875, -4.1925048828125, -3.92333984375, -3.6541748046875, -3.385009765625, -3.1158447265625, -2.8466796875, -2.5775146484375, -2.308349609375, -2.0391845703125, -1.77001953125, -1.5008544921875, -1.231689453125, -0.9625244140625, -0.693359375, -0.4241943359375, -0.155029296875, 0.1141357421875, 0.38330078125, 0.6524658203125, 0.921630859375, 1.1907958984375, 1.4599609375, 1.7291259765625, 1.998291015625, 2.2674560546875, 2.53662109375, 2.8057861328125, 3.074951171875, 3.3441162109375, 3.61328125, 3.8824462890625, 4.151611328125, 4.4207763671875, 4.68994140625, 4.9591064453125, 5.228271484375, 5.4974365234375, 5.7666015625, 6.0357666015625, 6.304931640625, 6.5740966796875, 6.84326171875, 7.1124267578125, 7.381591796875, 7.6507568359375, 7.919921875, 8.1890869140625, 8.458251953125, 8.7274169921875, 8.99658203125, 9.2657470703125, 9.534912109375, 9.8040771484375, 10.0732421875, 10.3424072265625, 10.611572265625, 10.8807373046875, 11.14990234375, 11.4190673828125, 11.688232421875, 11.9573974609375, 12.2265625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 9.0, 10.0, 20.0, 30.0, 47.0, 120.0, 159.0, 189.0, 159.0, 88.0, 69.0, 37.0, 24.0, 12.0, 14.0, 4.0, 4.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.949695587158203, -8.398055076599121, -7.8464155197143555, -7.294775009155273, -6.743135452270508, -6.191494941711426, -5.639854907989502, -5.088214874267578, -4.536574840545654, -3.9849348068237305, -3.4332947731018066, -2.8816545009613037, -2.33001446723938, -1.778374433517456, -1.2267341613769531, -0.6750941276550293, -0.12345409393310547, 0.42818599939346313, 0.9798260927200317, 1.5314662456512451, 2.083106279373169, 2.6347463130950928, 3.1863865852355957, 3.7380266189575195, 4.289666652679443, 4.841306686401367, 5.392946720123291, 5.944586753845215, 6.496227264404297, 7.0478668212890625, 7.5995073318481445, 8.151147842407227, 8.702787399291992, 9.254427909851074, 9.80606746673584, 10.357707977294922, 10.909347534179688, 11.46098804473877, 12.012628555297852, 12.564268112182617, 13.115907669067383, 13.667548179626465, 14.21918773651123, 14.770828247070312, 15.322467803955078, 15.87410831451416, 16.425748825073242, 16.977388381958008, 17.529029846191406, 18.080669403076172, 18.63231086730957, 19.183950424194336, 19.7355899810791, 20.287229537963867, 20.838871002197266, 21.39051055908203, 21.942150115966797, 22.493789672851562, 23.04543113708496, 23.597070693969727, 24.148710250854492, 24.700349807739258, 25.251991271972656, 25.803630828857422, 26.355270385742188]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 11.0, 15.0, 12.0, 18.0, 18.0, 15.0, 24.0, 17.0, 26.0, 25.0, 32.0, 36.0, 30.0, 44.0, 42.0, 37.0, 31.0, 39.0, 41.0, 41.0, 40.0, 46.0, 36.0, 22.0, 51.0, 39.0, 32.0, 30.0, 18.0, 15.0, 17.0, 9.0, 14.0, 8.0, 9.0, 11.0, 7.0, 11.0, 9.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.134509563446045, -6.869848728179932, -6.605187892913818, -6.340527057647705, -6.075866222381592, -5.8112053871154785, -5.546544075012207, -5.281883239746094, -5.0172224044799805, -4.752561569213867, -4.487900733947754, -4.223239898681641, -3.9585790634155273, -3.693918228149414, -3.4292571544647217, -3.1645963191986084, -2.899935722351074, -2.635274887084961, -2.3706140518188477, -2.1059532165527344, -1.8412922620773315, -1.5766314268112183, -1.3119704723358154, -1.0473096370697021, -0.7826488018035889, -0.5179879665374756, -0.25332707166671753, 0.011333823204040527, 0.2759946584701538, 0.5406554937362671, 0.8053164482116699, 1.0699772834777832, 1.3346376419067383, 1.5992984771728516, 1.8639593124389648, 2.128620147705078, 2.3932809829711914, 2.6579418182373047, 2.922602891921997, 3.1872637271881104, 3.4519245624542236, 3.716585397720337, 3.98124623298645, 4.245907306671143, 4.510568141937256, 4.775228977203369, 5.039889812469482, 5.304550647735596, 5.569211483001709, 5.833872318267822, 6.0985331535339355, 6.363193988800049, 6.627854824066162, 6.892515659332275, 7.157176971435547, 7.42183780670166, 7.686498641967773, 7.951159477233887, 8.2158203125, 8.480481147766113, 8.745141983032227, 9.00980281829834, 9.274463653564453, 9.539124488830566, 9.80378532409668]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 15.0, 22.0, 25.0, 48.0, 58.0, 89.0, 146.0, 175.0, 259.0, 465.0, 701.0, 1131.0, 1884.0, 3093.0, 5470.0, 9977.0, 19225.0, 39142.0, 87287.0, 203664.0, 328714.0, 189000.0, 80704.0, 36840.0, 17961.0, 9560.0, 5134.0, 2941.0, 1772.0, 1082.0, 674.0, 440.0, 275.0, 180.0, 125.0, 79.0, 58.0, 43.0, 30.0, 20.0, 13.0, 5.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.0859375, -7.84423828125, -7.6025390625, -7.36083984375, -7.119140625, -6.87744140625, -6.6357421875, -6.39404296875, -6.15234375, -5.91064453125, -5.6689453125, -5.42724609375, -5.185546875, -4.94384765625, -4.7021484375, -4.46044921875, -4.21875, -3.97705078125, -3.7353515625, -3.49365234375, -3.251953125, -3.01025390625, -2.7685546875, -2.52685546875, -2.28515625, -2.04345703125, -1.8017578125, -1.56005859375, -1.318359375, -1.07666015625, -0.8349609375, -0.59326171875, -0.3515625, -0.10986328125, 0.1318359375, 0.37353515625, 0.615234375, 0.85693359375, 1.0986328125, 1.34033203125, 1.58203125, 1.82373046875, 2.0654296875, 2.30712890625, 2.548828125, 2.79052734375, 3.0322265625, 3.27392578125, 3.515625, 3.75732421875, 3.9990234375, 4.24072265625, 4.482421875, 4.72412109375, 4.9658203125, 5.20751953125, 5.44921875, 5.69091796875, 5.9326171875, 6.17431640625, 6.416015625, 6.65771484375, 6.8994140625, 7.14111328125, 7.3828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 5.0, 3.0, 10.0, 16.0, 14.0, 22.0, 17.0, 32.0, 28.0, 32.0, 36.0, 49.0, 38.0, 60.0, 58.0, 63.0, 51.0, 44.0, 55.0, 56.0, 51.0, 46.0, 28.0, 35.0, 33.0, 19.0, 17.0, 18.0, 9.0, 5.0, 10.0, 5.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.82672119140625, -4.6807861328125, -4.53485107421875, -4.388916015625, -4.24298095703125, -4.0970458984375, -3.95111083984375, -3.80517578125, -3.65924072265625, -3.5133056640625, -3.36737060546875, -3.221435546875, -3.07550048828125, -2.9295654296875, -2.78363037109375, -2.6376953125, -2.49176025390625, -2.3458251953125, -2.19989013671875, -2.053955078125, -1.90802001953125, -1.7620849609375, -1.61614990234375, -1.47021484375, -1.32427978515625, -1.1783447265625, -1.03240966796875, -0.886474609375, -0.74053955078125, -0.5946044921875, -0.44866943359375, -0.302734375, -0.15679931640625, -0.0108642578125, 0.13507080078125, 0.281005859375, 0.42694091796875, 0.5728759765625, 0.71881103515625, 0.86474609375, 1.01068115234375, 1.1566162109375, 1.30255126953125, 1.448486328125, 1.59442138671875, 1.7403564453125, 1.88629150390625, 2.0322265625, 2.17816162109375, 2.3240966796875, 2.47003173828125, 2.615966796875, 2.76190185546875, 2.9078369140625, 3.05377197265625, 3.19970703125, 3.34564208984375, 3.4915771484375, 3.63751220703125, 3.783447265625, 3.92938232421875, 4.0753173828125, 4.22125244140625, 4.3671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 9.0, 9.0, 14.0, 21.0, 20.0, 55.0, 70.0, 116.0, 183.0, 333.0, 625.0, 1188.0, 2690.0, 6729.0, 17702.0, 56278.0, 227125.0, 530205.0, 143984.0, 38840.0, 12974.0, 5030.0, 2109.0, 998.0, 501.0, 263.0, 157.0, 93.0, 57.0, 47.0, 22.0, 20.0, 14.0, 16.0, 12.0, 11.0, 5.0, 6.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8984375, -12.4434814453125, -11.988525390625, -11.5335693359375, -11.07861328125, -10.6236572265625, -10.168701171875, -9.7137451171875, -9.2587890625, -8.8038330078125, -8.348876953125, -7.8939208984375, -7.43896484375, -6.9840087890625, -6.529052734375, -6.0740966796875, -5.619140625, -5.1641845703125, -4.709228515625, -4.2542724609375, -3.79931640625, -3.3443603515625, -2.889404296875, -2.4344482421875, -1.9794921875, -1.5245361328125, -1.069580078125, -0.6146240234375, -0.15966796875, 0.2952880859375, 0.750244140625, 1.2052001953125, 1.66015625, 2.1151123046875, 2.570068359375, 3.0250244140625, 3.47998046875, 3.9349365234375, 4.389892578125, 4.8448486328125, 5.2998046875, 5.7547607421875, 6.209716796875, 6.6646728515625, 7.11962890625, 7.5745849609375, 8.029541015625, 8.4844970703125, 8.939453125, 9.3944091796875, 9.849365234375, 10.3043212890625, 10.75927734375, 11.2142333984375, 11.669189453125, 12.1241455078125, 12.5791015625, 13.0340576171875, 13.489013671875, 13.9439697265625, 14.39892578125, 14.8538818359375, 15.308837890625, 15.7637939453125, 16.21875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 9.0, 9.0, 9.0, 16.0, 10.0, 13.0, 21.0, 21.0, 24.0, 21.0, 41.0, 43.0, 44.0, 38.0, 46.0, 45.0, 41.0, 46.0, 53.0, 53.0, 45.0, 45.0, 26.0, 46.0, 36.0, 25.0, 26.0, 28.0, 25.0, 18.0, 12.0, 12.0, 7.0, 9.0, 9.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.921875, -21.181396484375, -20.44091796875, -19.700439453125, -18.9599609375, -18.219482421875, -17.47900390625, -16.738525390625, -15.998046875, -15.257568359375, -14.51708984375, -13.776611328125, -13.0361328125, -12.295654296875, -11.55517578125, -10.814697265625, -10.07421875, -9.333740234375, -8.59326171875, -7.852783203125, -7.1123046875, -6.371826171875, -5.63134765625, -4.890869140625, -4.150390625, -3.409912109375, -2.66943359375, -1.928955078125, -1.1884765625, -0.447998046875, 0.29248046875, 1.032958984375, 1.7734375, 2.513916015625, 3.25439453125, 3.994873046875, 4.7353515625, 5.475830078125, 6.21630859375, 6.956787109375, 7.697265625, 8.437744140625, 9.17822265625, 9.918701171875, 10.6591796875, 11.399658203125, 12.14013671875, 12.880615234375, 13.62109375, 14.361572265625, 15.10205078125, 15.842529296875, 16.5830078125, 17.323486328125, 18.06396484375, 18.804443359375, 19.544921875, 20.285400390625, 21.02587890625, 21.766357421875, 22.5068359375, 23.247314453125, 23.98779296875, 24.728271484375, 25.46875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 11.0, 9.0, 10.0, 29.0, 30.0, 49.0, 71.0, 79.0, 131.0, 231.0, 437.0, 968.0, 2666.0, 10822.0, 443095.0, 573514.0, 11480.0, 2771.0, 1032.0, 430.0, 229.0, 150.0, 104.0, 64.0, 47.0, 27.0, 19.0, 14.0, 9.0, 8.0, 9.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.953125, -20.255126953125, -19.55712890625, -18.859130859375, -18.1611328125, -17.463134765625, -16.76513671875, -16.067138671875, -15.369140625, -14.671142578125, -13.97314453125, -13.275146484375, -12.5771484375, -11.879150390625, -11.18115234375, -10.483154296875, -9.78515625, -9.087158203125, -8.38916015625, -7.691162109375, -6.9931640625, -6.295166015625, -5.59716796875, -4.899169921875, -4.201171875, -3.503173828125, -2.80517578125, -2.107177734375, -1.4091796875, -0.711181640625, -0.01318359375, 0.684814453125, 1.3828125, 2.080810546875, 2.77880859375, 3.476806640625, 4.1748046875, 4.872802734375, 5.57080078125, 6.268798828125, 6.966796875, 7.664794921875, 8.36279296875, 9.060791015625, 9.7587890625, 10.456787109375, 11.15478515625, 11.852783203125, 12.55078125, 13.248779296875, 13.94677734375, 14.644775390625, 15.3427734375, 16.040771484375, 16.73876953125, 17.436767578125, 18.134765625, 18.832763671875, 19.53076171875, 20.228759765625, 20.9267578125, 21.624755859375, 22.32275390625, 23.020751953125, 23.71875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 11.0, 23.0, 42.0, 50.0, 71.0, 104.0, 138.0, 171.0, 133.0, 86.0, 48.0, 39.0, 22.0, 18.0, 6.0, 8.0, 6.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001434326171875, -0.0013899058103561401, -0.0013454854488372803, -0.0013010650873184204, -0.0012566447257995605, -0.0012122243642807007, -0.0011678040027618408, -0.001123383641242981, -0.001078963279724121, -0.0010345429182052612, -0.0009901225566864014, -0.0009457021951675415, -0.0009012818336486816, -0.0008568614721298218, -0.0008124411106109619, -0.000768020749092102, -0.0007236003875732422, -0.0006791800260543823, -0.0006347596645355225, -0.0005903393030166626, -0.0005459189414978027, -0.0005014985799789429, -0.000457078218460083, -0.00041265785694122314, -0.0003682374954223633, -0.0003238171339035034, -0.00027939677238464355, -0.0002349764108657837, -0.00019055604934692383, -0.00014613568782806396, -0.0001017153263092041, -5.729496479034424e-05, -1.2874603271484375e-05, 3.154575824737549e-05, 7.596611976623535e-05, 0.00012038648128509521, 0.00016480684280395508, 0.00020922720432281494, 0.0002536475658416748, 0.00029806792736053467, 0.00034248828887939453, 0.0003869086503982544, 0.00043132901191711426, 0.0004757493734359741, 0.000520169734954834, 0.0005645900964736938, 0.0006090104579925537, 0.0006534308195114136, 0.0006978511810302734, 0.0007422715425491333, 0.0007866919040679932, 0.000831112265586853, 0.0008755326271057129, 0.0009199529886245728, 0.0009643733501434326, 0.0010087937116622925, 0.0010532140731811523, 0.0010976344347000122, 0.001142054796218872, 0.001186475157737732, 0.0012308955192565918, 0.0012753158807754517, 0.0013197362422943115, 0.0013641566038131714, 0.0014085769653320312]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 9.0, 2.0, 11.0, 33.0, 59.0, 132.0, 347.0, 1165.0, 4748.0, 66296.0, 953504.0, 18437.0, 2638.0, 704.0, 251.0, 91.0, 56.0, 28.0, 16.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.125, -28.38427734375, -27.6435546875, -26.90283203125, -26.162109375, -25.42138671875, -24.6806640625, -23.93994140625, -23.19921875, -22.45849609375, -21.7177734375, -20.97705078125, -20.236328125, -19.49560546875, -18.7548828125, -18.01416015625, -17.2734375, -16.53271484375, -15.7919921875, -15.05126953125, -14.310546875, -13.56982421875, -12.8291015625, -12.08837890625, -11.34765625, -10.60693359375, -9.8662109375, -9.12548828125, -8.384765625, -7.64404296875, -6.9033203125, -6.16259765625, -5.421875, -4.68115234375, -3.9404296875, -3.19970703125, -2.458984375, -1.71826171875, -0.9775390625, -0.23681640625, 0.50390625, 1.24462890625, 1.9853515625, 2.72607421875, 3.466796875, 4.20751953125, 4.9482421875, 5.68896484375, 6.4296875, 7.17041015625, 7.9111328125, 8.65185546875, 9.392578125, 10.13330078125, 10.8740234375, 11.61474609375, 12.35546875, 13.09619140625, 13.8369140625, 14.57763671875, 15.318359375, 16.05908203125, 16.7998046875, 17.54052734375, 18.28125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 10.0, 11.0, 9.0, 31.0, 76.0, 169.0, 241.0, 215.0, 101.0, 45.0, 26.0, 22.0, 7.0, 7.0, 4.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.75, -29.000244140625, -28.25048828125, -27.500732421875, -26.7509765625, -26.001220703125, -25.25146484375, -24.501708984375, -23.751953125, -23.002197265625, -22.25244140625, -21.502685546875, -20.7529296875, -20.003173828125, -19.25341796875, -18.503662109375, -17.75390625, -17.004150390625, -16.25439453125, -15.504638671875, -14.7548828125, -14.005126953125, -13.25537109375, -12.505615234375, -11.755859375, -11.006103515625, -10.25634765625, -9.506591796875, -8.7568359375, -8.007080078125, -7.25732421875, -6.507568359375, -5.7578125, -5.008056640625, -4.25830078125, -3.508544921875, -2.7587890625, -2.009033203125, -1.25927734375, -0.509521484375, 0.240234375, 0.989990234375, 1.73974609375, 2.489501953125, 3.2392578125, 3.989013671875, 4.73876953125, 5.488525390625, 6.23828125, 6.988037109375, 7.73779296875, 8.487548828125, 9.2373046875, 9.987060546875, 10.73681640625, 11.486572265625, 12.236328125, 12.986083984375, 13.73583984375, 14.485595703125, 15.2353515625, 15.985107421875, 16.73486328125, 17.484619140625, 18.234375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 6.0, 5.0, 4.0, 7.0, 12.0, 17.0, 18.0, 17.0, 27.0, 29.0, 29.0, 40.0, 55.0, 59.0, 62.0, 75.0, 76.0, 78.0, 68.0, 68.0, 72.0, 57.0, 38.0, 18.0, 17.0, 12.0, 13.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.45630645751953, -80.62721252441406, -77.7981185913086, -74.9690170288086, -72.13992309570312, -69.31082916259766, -66.48173522949219, -63.65263748168945, -60.82353973388672, -57.99444580078125, -55.165348052978516, -52.33625411987305, -49.50715637207031, -46.678062438964844, -43.848968505859375, -41.01987075805664, -38.19077682495117, -35.3616828918457, -32.53258514404297, -29.7034912109375, -26.874393463134766, -24.045299530029297, -21.216203689575195, -18.387107849121094, -15.558012008666992, -12.72891616821289, -9.899820327758789, -7.070725440979004, -4.241629600524902, -1.4125337600708008, 1.4165611267089844, 4.245656967163086, 7.0747528076171875, 9.903848648071289, 12.73294448852539, 15.562039375305176, 18.391136169433594, 21.220230102539062, 24.049325942993164, 26.878421783447266, 29.707517623901367, 32.53661346435547, 35.36570739746094, 38.19480514526367, 41.02389907836914, 43.852996826171875, 46.682090759277344, 49.51118469238281, 52.34028244018555, 55.169376373291016, 57.99847412109375, 60.82756805419922, 63.65666580200195, 66.48576354980469, 69.31485748291016, 72.14395141601562, 74.9730453491211, 77.80213928222656, 80.63123321533203, 83.46033477783203, 86.2894287109375, 89.11852264404297, 91.94761657714844, 94.77671813964844, 97.6058120727539]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 10.0, 11.0, 14.0, 15.0, 14.0, 20.0, 19.0, 24.0, 30.0, 34.0, 39.0, 45.0, 51.0, 35.0, 52.0, 53.0, 57.0, 50.0, 58.0, 48.0, 42.0, 36.0, 34.0, 34.0, 28.0, 20.0, 20.0, 14.0, 19.0, 11.0, 15.0, 11.0, 6.0, 4.0, 6.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-125.03569030761719, -121.04708099365234, -117.0584716796875, -113.06986236572266, -109.08125305175781, -105.0926513671875, -101.10403442382812, -97.11543273925781, -93.12682342529297, -89.13821411132812, -85.14960479736328, -81.16099548339844, -77.1723861694336, -73.18377685546875, -69.19517517089844, -65.2065658569336, -61.217952728271484, -57.22934341430664, -53.2407341003418, -49.25212860107422, -45.263519287109375, -41.27490997314453, -37.28630065917969, -33.297691345214844, -29.309083938598633, -25.32047462463379, -21.331867218017578, -17.343257904052734, -13.354649543762207, -9.36604118347168, -5.377431869506836, -1.388824462890625, 2.5997848510742188, 6.588393211364746, 10.577001571655273, 14.565610885620117, 18.554218292236328, 22.542827606201172, 26.531436920166016, 30.520044326782227, 34.50865173339844, 38.49726104736328, 42.485870361328125, 46.47447967529297, 50.46308517456055, 54.45169448852539, 58.440303802490234, 62.42890930175781, 66.41752624511719, 70.40613555908203, 74.39474487304688, 78.38335418701172, 82.37196350097656, 86.36056518554688, 90.34918212890625, 94.33778381347656, 98.3263931274414, 102.31500244140625, 106.3036117553711, 110.29222106933594, 114.28083038330078, 118.26943969726562, 122.25804138183594, 126.24665069580078, 130.23526000976562]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 6.0, 11.0, 16.0, 10.0, 15.0, 18.0, 24.0, 41.0, 58.0, 62.0, 100.0, 143.0, 218.0, 406.0, 719.0, 1451.0, 3551.0, 13580.0, 4117241.0, 46084.0, 6091.0, 2078.0, 1009.0, 512.0, 292.0, 155.0, 123.0, 73.0, 40.0, 47.0, 19.0, 20.0, 16.0, 13.0, 11.0, 6.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.625, -23.916015625, -23.20703125, -22.498046875, -21.7890625, -21.080078125, -20.37109375, -19.662109375, -18.953125, -18.244140625, -17.53515625, -16.826171875, -16.1171875, -15.408203125, -14.69921875, -13.990234375, -13.28125, -12.572265625, -11.86328125, -11.154296875, -10.4453125, -9.736328125, -9.02734375, -8.318359375, -7.609375, -6.900390625, -6.19140625, -5.482421875, -4.7734375, -4.064453125, -3.35546875, -2.646484375, -1.9375, -1.228515625, -0.51953125, 0.189453125, 0.8984375, 1.607421875, 2.31640625, 3.025390625, 3.734375, 4.443359375, 5.15234375, 5.861328125, 6.5703125, 7.279296875, 7.98828125, 8.697265625, 9.40625, 10.115234375, 10.82421875, 11.533203125, 12.2421875, 12.951171875, 13.66015625, 14.369140625, 15.078125, 15.787109375, 16.49609375, 17.205078125, 17.9140625, 18.623046875, 19.33203125, 20.041015625, 20.75]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 2.0, 5.0, 8.0, 7.0, 10.0, 8.0, 7.0, 14.0, 12.0, 18.0, 16.0, 39.0, 42.0, 50.0, 56.0, 61.0, 59.0, 69.0, 73.0, 51.0, 78.0, 57.0, 50.0, 40.0, 26.0, 32.0, 26.0, 19.0, 11.0, 16.0, 15.0, 9.0, 6.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.05078125, -6.84320068359375, -6.6356201171875, -6.42803955078125, -6.220458984375, -6.01287841796875, -5.8052978515625, -5.59771728515625, -5.39013671875, -5.18255615234375, -4.9749755859375, -4.76739501953125, -4.559814453125, -4.35223388671875, -4.1446533203125, -3.93707275390625, -3.7294921875, -3.52191162109375, -3.3143310546875, -3.10675048828125, -2.899169921875, -2.69158935546875, -2.4840087890625, -2.27642822265625, -2.06884765625, -1.86126708984375, -1.6536865234375, -1.44610595703125, -1.238525390625, -1.03094482421875, -0.8233642578125, -0.61578369140625, -0.408203125, -0.20062255859375, 0.0069580078125, 0.21453857421875, 0.422119140625, 0.62969970703125, 0.8372802734375, 1.04486083984375, 1.25244140625, 1.46002197265625, 1.6676025390625, 1.87518310546875, 2.082763671875, 2.29034423828125, 2.4979248046875, 2.70550537109375, 2.9130859375, 3.12066650390625, 3.3282470703125, 3.53582763671875, 3.743408203125, 3.95098876953125, 4.1585693359375, 4.36614990234375, 4.57373046875, 4.78131103515625, 4.9888916015625, 5.19647216796875, 5.404052734375, 5.61163330078125, 5.8192138671875, 6.02679443359375, 6.234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 4.0, 4.0, 7.0, 16.0, 18.0, 15.0, 26.0, 35.0, 48.0, 44.0, 74.0, 103.0, 129.0, 180.0, 295.0, 504.0, 796.0, 1649.0, 3733.0, 10902.0, 68640.0, 4073094.0, 22208.0, 6302.0, 2494.0, 1190.0, 596.0, 362.0, 226.0, 166.0, 112.0, 88.0, 49.0, 41.0, 35.0, 33.0, 12.0, 17.0, 15.0, 3.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-41.875, -40.65234375, -39.4296875, -38.20703125, -36.984375, -35.76171875, -34.5390625, -33.31640625, -32.09375, -30.87109375, -29.6484375, -28.42578125, -27.203125, -25.98046875, -24.7578125, -23.53515625, -22.3125, -21.08984375, -19.8671875, -18.64453125, -17.421875, -16.19921875, -14.9765625, -13.75390625, -12.53125, -11.30859375, -10.0859375, -8.86328125, -7.640625, -6.41796875, -5.1953125, -3.97265625, -2.75, -1.52734375, -0.3046875, 0.91796875, 2.140625, 3.36328125, 4.5859375, 5.80859375, 7.03125, 8.25390625, 9.4765625, 10.69921875, 11.921875, 13.14453125, 14.3671875, 15.58984375, 16.8125, 18.03515625, 19.2578125, 20.48046875, 21.703125, 22.92578125, 24.1484375, 25.37109375, 26.59375, 27.81640625, 29.0390625, 30.26171875, 31.484375, 32.70703125, 33.9296875, 35.15234375, 36.375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 13.0, 16.0, 48.0, 3675.0, 215.0, 42.0, 15.0, 15.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9140625, -10.535888671875, -10.15771484375, -9.779541015625, -9.4013671875, -9.023193359375, -8.64501953125, -8.266845703125, -7.888671875, -7.510498046875, -7.13232421875, -6.754150390625, -6.3759765625, -5.997802734375, -5.61962890625, -5.241455078125, -4.86328125, -4.485107421875, -4.10693359375, -3.728759765625, -3.3505859375, -2.972412109375, -2.59423828125, -2.216064453125, -1.837890625, -1.459716796875, -1.08154296875, -0.703369140625, -0.3251953125, 0.052978515625, 0.43115234375, 0.809326171875, 1.1875, 1.565673828125, 1.94384765625, 2.322021484375, 2.7001953125, 3.078369140625, 3.45654296875, 3.834716796875, 4.212890625, 4.591064453125, 4.96923828125, 5.347412109375, 5.7255859375, 6.103759765625, 6.48193359375, 6.860107421875, 7.23828125, 7.616455078125, 7.99462890625, 8.372802734375, 8.7509765625, 9.129150390625, 9.50732421875, 9.885498046875, 10.263671875, 10.641845703125, 11.02001953125, 11.398193359375, 11.7763671875, 12.154541015625, 12.53271484375, 12.910888671875, 13.2890625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 22.0, 38.0, 90.0, 175.0, 212.0, 229.0, 123.0, 52.0, 30.0, 19.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.99620056152344, -31.984651565551758, -29.973102569580078, -27.961551666259766, -25.950002670288086, -23.938453674316406, -21.926902770996094, -19.915353775024414, -17.903804779052734, -15.892255783081055, -13.880705833435059, -11.869155883789062, -9.857606887817383, -7.846057891845703, -5.834507942199707, -3.822957992553711, -1.8114089965820312, 0.20014047622680664, 2.2116899490356445, 4.223239421844482, 6.23478889465332, 8.246337890625, 10.257887840270996, 12.269437789916992, 14.280986785888672, 16.29253578186035, 18.30408477783203, 20.315635681152344, 22.327184677124023, 24.338733673095703, 26.350284576416016, 28.361833572387695, 30.373374938964844, 32.384925842285156, 34.3964729309082, 36.408023834228516, 38.41957092285156, 40.431121826171875, 42.44267272949219, 44.4542236328125, 46.46577072143555, 48.47732162475586, 50.488868713378906, 52.50041961669922, 54.51197052001953, 56.52351760864258, 58.53506851196289, 60.54661560058594, 62.55816650390625, 64.56971740722656, 66.58126831054688, 68.59281158447266, 70.60436248779297, 72.61591339111328, 74.6274642944336, 76.6390151977539, 78.65055847167969, 80.662109375, 82.67366027832031, 84.6852035522461, 86.6967544555664, 88.70830535888672, 90.71985626220703, 92.73140716552734, 94.74295806884766]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 10.0, 3.0, 4.0, 11.0, 13.0, 6.0, 11.0, 10.0, 14.0, 13.0, 14.0, 26.0, 23.0, 19.0, 36.0, 36.0, 34.0, 38.0, 42.0, 37.0, 33.0, 39.0, 37.0, 37.0, 38.0, 38.0, 47.0, 29.0, 33.0, 30.0, 40.0, 26.0, 23.0, 33.0, 26.0, 10.0, 17.0, 10.0, 9.0, 6.0, 9.0, 4.0, 2.0, 4.0, 4.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-16.866580963134766, -16.35438346862793, -15.842187881469727, -15.329991340637207, -14.817794799804688, -14.305597305297852, -13.793400764465332, -13.281204223632812, -12.769007682800293, -12.256811141967773, -11.744614601135254, -11.232418060302734, -10.720220565795898, -10.208024978637695, -9.69582748413086, -9.18363094329834, -8.67143440246582, -8.1592378616333, -7.647041320800781, -7.1348443031311035, -6.622647762298584, -6.1104512214660645, -5.598254203796387, -5.086057662963867, -4.573861122131348, -4.061664581298828, -3.5494678020477295, -3.037271022796631, -2.5250744819641113, -2.012877941131592, -1.5006811618804932, -0.9884843826293945, -0.4762859344482422, 0.035910725593566895, 0.548107385635376, 1.060304045677185, 1.5725007057189941, 2.0846972465515137, 2.5968940258026123, 3.109090805053711, 3.6212873458862305, 4.13348388671875, 4.6456804275512695, 5.157877445220947, 5.670073986053467, 6.182270526885986, 6.694467544555664, 7.206664085388184, 7.718860626220703, 8.231057167053223, 8.743253707885742, 9.255450248718262, 9.767646789550781, 10.279844284057617, 10.792040824890137, 11.304237365722656, 11.816433906555176, 12.328630447387695, 12.840826988220215, 13.353023529052734, 13.86522102355957, 14.377416610717773, 14.88961410522461, 15.401810646057129, 15.914007186889648]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 7.0, 9.0, 11.0, 12.0, 26.0, 26.0, 41.0, 49.0, 90.0, 109.0, 143.0, 213.0, 329.0, 465.0, 714.0, 1165.0, 1664.0, 2776.0, 4196.0, 6819.0, 11845.0, 20923.0, 39342.0, 77646.0, 163801.0, 294256.0, 210714.0, 99714.0, 48969.0, 25634.0, 14294.0, 8386.0, 5122.0, 3181.0, 1945.0, 1304.0, 832.0, 522.0, 399.0, 254.0, 193.0, 126.0, 95.0, 62.0, 34.0, 25.0, 17.0, 15.0, 14.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-8.8359375, -8.5478515625, -8.259765625, -7.9716796875, -7.68359375, -7.3955078125, -7.107421875, -6.8193359375, -6.53125, -6.2431640625, -5.955078125, -5.6669921875, -5.37890625, -5.0908203125, -4.802734375, -4.5146484375, -4.2265625, -3.9384765625, -3.650390625, -3.3623046875, -3.07421875, -2.7861328125, -2.498046875, -2.2099609375, -1.921875, -1.6337890625, -1.345703125, -1.0576171875, -0.76953125, -0.4814453125, -0.193359375, 0.0947265625, 0.3828125, 0.6708984375, 0.958984375, 1.2470703125, 1.53515625, 1.8232421875, 2.111328125, 2.3994140625, 2.6875, 2.9755859375, 3.263671875, 3.5517578125, 3.83984375, 4.1279296875, 4.416015625, 4.7041015625, 4.9921875, 5.2802734375, 5.568359375, 5.8564453125, 6.14453125, 6.4326171875, 6.720703125, 7.0087890625, 7.296875, 7.5849609375, 7.873046875, 8.1611328125, 8.44921875, 8.7373046875, 9.025390625, 9.3134765625, 9.6015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 8.0, 9.0, 12.0, 9.0, 9.0, 6.0, 17.0, 18.0, 23.0, 25.0, 29.0, 33.0, 41.0, 53.0, 46.0, 49.0, 57.0, 79.0, 75.0, 58.0, 55.0, 51.0, 44.0, 35.0, 34.0, 28.0, 20.0, 13.0, 12.0, 18.0, 9.0, 5.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59765625, -7.368896484375, -7.14013671875, -6.911376953125, -6.6826171875, -6.453857421875, -6.22509765625, -5.996337890625, -5.767578125, -5.538818359375, -5.31005859375, -5.081298828125, -4.8525390625, -4.623779296875, -4.39501953125, -4.166259765625, -3.9375, -3.708740234375, -3.47998046875, -3.251220703125, -3.0224609375, -2.793701171875, -2.56494140625, -2.336181640625, -2.107421875, -1.878662109375, -1.64990234375, -1.421142578125, -1.1923828125, -0.963623046875, -0.73486328125, -0.506103515625, -0.27734375, -0.048583984375, 0.18017578125, 0.408935546875, 0.6376953125, 0.866455078125, 1.09521484375, 1.323974609375, 1.552734375, 1.781494140625, 2.01025390625, 2.239013671875, 2.4677734375, 2.696533203125, 2.92529296875, 3.154052734375, 3.3828125, 3.611572265625, 3.84033203125, 4.069091796875, 4.2978515625, 4.526611328125, 4.75537109375, 4.984130859375, 5.212890625, 5.441650390625, 5.67041015625, 5.899169921875, 6.1279296875, 6.356689453125, 6.58544921875, 6.814208984375, 7.04296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 1.0, 3.0, 1.0, 9.0, 5.0, 7.0, 13.0, 26.0, 37.0, 57.0, 113.0, 195.0, 429.0, 1093.0, 3118.0, 10049.0, 42323.0, 301268.0, 587701.0, 78612.0, 16162.0, 4613.0, 1571.0, 558.0, 259.0, 112.0, 78.0, 44.0, 32.0, 16.0, 12.0, 10.0, 7.0, 6.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.25, -30.27880859375, -29.3076171875, -28.33642578125, -27.365234375, -26.39404296875, -25.4228515625, -24.45166015625, -23.48046875, -22.50927734375, -21.5380859375, -20.56689453125, -19.595703125, -18.62451171875, -17.6533203125, -16.68212890625, -15.7109375, -14.73974609375, -13.7685546875, -12.79736328125, -11.826171875, -10.85498046875, -9.8837890625, -8.91259765625, -7.94140625, -6.97021484375, -5.9990234375, -5.02783203125, -4.056640625, -3.08544921875, -2.1142578125, -1.14306640625, -0.171875, 0.79931640625, 1.7705078125, 2.74169921875, 3.712890625, 4.68408203125, 5.6552734375, 6.62646484375, 7.59765625, 8.56884765625, 9.5400390625, 10.51123046875, 11.482421875, 12.45361328125, 13.4248046875, 14.39599609375, 15.3671875, 16.33837890625, 17.3095703125, 18.28076171875, 19.251953125, 20.22314453125, 21.1943359375, 22.16552734375, 23.13671875, 24.10791015625, 25.0791015625, 26.05029296875, 27.021484375, 27.99267578125, 28.9638671875, 29.93505859375, 30.90625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 11.0, 12.0, 10.0, 9.0, 10.0, 16.0, 19.0, 20.0, 31.0, 23.0, 37.0, 35.0, 41.0, 33.0, 44.0, 44.0, 51.0, 50.0, 47.0, 40.0, 53.0, 43.0, 37.0, 37.0, 27.0, 31.0, 27.0, 23.0, 23.0, 23.0, 12.0, 7.0, 7.0, 9.0, 5.0, 9.0, 7.0, 7.0, 1.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.453125, -29.368408203125, -28.28369140625, -27.198974609375, -26.1142578125, -25.029541015625, -23.94482421875, -22.860107421875, -21.775390625, -20.690673828125, -19.60595703125, -18.521240234375, -17.4365234375, -16.351806640625, -15.26708984375, -14.182373046875, -13.09765625, -12.012939453125, -10.92822265625, -9.843505859375, -8.7587890625, -7.674072265625, -6.58935546875, -5.504638671875, -4.419921875, -3.335205078125, -2.25048828125, -1.165771484375, -0.0810546875, 1.003662109375, 2.08837890625, 3.173095703125, 4.2578125, 5.342529296875, 6.42724609375, 7.511962890625, 8.5966796875, 9.681396484375, 10.76611328125, 11.850830078125, 12.935546875, 14.020263671875, 15.10498046875, 16.189697265625, 17.2744140625, 18.359130859375, 19.44384765625, 20.528564453125, 21.61328125, 22.697998046875, 23.78271484375, 24.867431640625, 25.9521484375, 27.036865234375, 28.12158203125, 29.206298828125, 30.291015625, 31.375732421875, 32.46044921875, 33.545166015625, 34.6298828125, 35.714599609375, 36.79931640625, 37.884033203125, 38.96875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 1.0, 1.0, 5.0, 4.0, 2.0, 6.0, 8.0, 3.0, 14.0, 15.0, 29.0, 46.0, 74.0, 143.0, 303.0, 686.0, 2000.0, 8082.0, 50265.0, 690262.0, 266121.0, 23326.0, 4680.0, 1424.0, 503.0, 236.0, 110.0, 77.0, 46.0, 30.0, 13.0, 9.0, 14.0, 3.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.9375, -19.310791015625, -18.68408203125, -18.057373046875, -17.4306640625, -16.803955078125, -16.17724609375, -15.550537109375, -14.923828125, -14.297119140625, -13.67041015625, -13.043701171875, -12.4169921875, -11.790283203125, -11.16357421875, -10.536865234375, -9.91015625, -9.283447265625, -8.65673828125, -8.030029296875, -7.4033203125, -6.776611328125, -6.14990234375, -5.523193359375, -4.896484375, -4.269775390625, -3.64306640625, -3.016357421875, -2.3896484375, -1.762939453125, -1.13623046875, -0.509521484375, 0.1171875, 0.743896484375, 1.37060546875, 1.997314453125, 2.6240234375, 3.250732421875, 3.87744140625, 4.504150390625, 5.130859375, 5.757568359375, 6.38427734375, 7.010986328125, 7.6376953125, 8.264404296875, 8.89111328125, 9.517822265625, 10.14453125, 10.771240234375, 11.39794921875, 12.024658203125, 12.6513671875, 13.278076171875, 13.90478515625, 14.531494140625, 15.158203125, 15.784912109375, 16.41162109375, 17.038330078125, 17.6650390625, 18.291748046875, 18.91845703125, 19.545166015625, 20.171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 8.0, 13.0, 13.0, 24.0, 40.0, 37.0, 52.0, 88.0, 95.0, 98.0, 122.0, 101.0, 82.0, 47.0, 43.0, 24.0, 27.0, 20.0, 13.0, 8.0, 10.0, 2.0, 9.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018930435180664062, -0.0018276721239089966, -0.001762300729751587, -0.0016969293355941772, -0.0016315579414367676, -0.001566186547279358, -0.0015008151531219482, -0.0014354437589645386, -0.001370072364807129, -0.0013047009706497192, -0.0012393295764923096, -0.0011739581823349, -0.0011085867881774902, -0.0010432153940200806, -0.000977843999862671, -0.0009124726057052612, -0.0008471012115478516, -0.0007817298173904419, -0.0007163584232330322, -0.0006509870290756226, -0.0005856156349182129, -0.0005202442407608032, -0.00045487284660339355, -0.0003895014524459839, -0.0003241300582885742, -0.00025875866413116455, -0.00019338726997375488, -0.00012801587581634521, -6.264448165893555e-05, 2.726912498474121e-06, 6.809830665588379e-05, 0.00013346970081329346, 0.00019884109497070312, 0.0002642124891281128, 0.00032958388328552246, 0.00039495527744293213, 0.0004603266716003418, 0.0005256980657577515, 0.0005910694599151611, 0.0006564408540725708, 0.0007218122482299805, 0.0007871836423873901, 0.0008525550365447998, 0.0009179264307022095, 0.0009832978248596191, 0.0010486692190170288, 0.0011140406131744385, 0.0011794120073318481, 0.0012447834014892578, 0.0013101547956466675, 0.0013755261898040771, 0.0014408975839614868, 0.0015062689781188965, 0.0015716403722763062, 0.0016370117664337158, 0.0017023831605911255, 0.0017677545547485352, 0.0018331259489059448, 0.0018984973430633545, 0.001963868737220764, 0.002029240131378174, 0.0020946115255355835, 0.002159982919692993, 0.002225354313850403, 0.0022907257080078125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 7.0, 15.0, 24.0, 28.0, 70.0, 101.0, 219.0, 426.0, 1152.0, 4120.0, 28619.0, 657305.0, 334131.0, 17485.0, 3063.0, 943.0, 399.0, 197.0, 92.0, 66.0, 31.0, 11.0, 15.0, 14.0, 4.0, 0.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.234375, -20.47314453125, -19.7119140625, -18.95068359375, -18.189453125, -17.42822265625, -16.6669921875, -15.90576171875, -15.14453125, -14.38330078125, -13.6220703125, -12.86083984375, -12.099609375, -11.33837890625, -10.5771484375, -9.81591796875, -9.0546875, -8.29345703125, -7.5322265625, -6.77099609375, -6.009765625, -5.24853515625, -4.4873046875, -3.72607421875, -2.96484375, -2.20361328125, -1.4423828125, -0.68115234375, 0.080078125, 0.84130859375, 1.6025390625, 2.36376953125, 3.125, 3.88623046875, 4.6474609375, 5.40869140625, 6.169921875, 6.93115234375, 7.6923828125, 8.45361328125, 9.21484375, 9.97607421875, 10.7373046875, 11.49853515625, 12.259765625, 13.02099609375, 13.7822265625, 14.54345703125, 15.3046875, 16.06591796875, 16.8271484375, 17.58837890625, 18.349609375, 19.11083984375, 19.8720703125, 20.63330078125, 21.39453125, 22.15576171875, 22.9169921875, 23.67822265625, 24.439453125, 25.20068359375, 25.9619140625, 26.72314453125, 27.484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 3.0, 16.0, 13.0, 16.0, 22.0, 21.0, 33.0, 35.0, 53.0, 60.0, 80.0, 92.0, 95.0, 93.0, 73.0, 62.0, 48.0, 32.0, 31.0, 27.0, 21.0, 14.0, 21.0, 11.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.171875, -15.6868896484375, -15.201904296875, -14.7169189453125, -14.23193359375, -13.7469482421875, -13.261962890625, -12.7769775390625, -12.2919921875, -11.8070068359375, -11.322021484375, -10.8370361328125, -10.35205078125, -9.8670654296875, -9.382080078125, -8.8970947265625, -8.412109375, -7.9271240234375, -7.442138671875, -6.9571533203125, -6.47216796875, -5.9871826171875, -5.502197265625, -5.0172119140625, -4.5322265625, -4.0472412109375, -3.562255859375, -3.0772705078125, -2.59228515625, -2.1072998046875, -1.622314453125, -1.1373291015625, -0.65234375, -0.1673583984375, 0.317626953125, 0.8026123046875, 1.28759765625, 1.7725830078125, 2.257568359375, 2.7425537109375, 3.2275390625, 3.7125244140625, 4.197509765625, 4.6824951171875, 5.16748046875, 5.6524658203125, 6.137451171875, 6.6224365234375, 7.107421875, 7.5924072265625, 8.077392578125, 8.5623779296875, 9.04736328125, 9.5323486328125, 10.017333984375, 10.5023193359375, 10.9873046875, 11.4722900390625, 11.957275390625, 12.4422607421875, 12.92724609375, 13.4122314453125, 13.897216796875, 14.3822021484375, 14.8671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 24.0, 39.0, 122.0, 229.0, 280.0, 174.0, 82.0, 29.0, 16.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.04656982421875, -185.9830322265625, -171.91949462890625, -157.85595703125, -143.79241943359375, -129.7288818359375, -115.66535186767578, -101.60181427001953, -87.53827667236328, -73.47473907470703, -59.41120147705078, -45.3476676940918, -31.284130096435547, -17.220596313476562, -3.1570587158203125, 10.906478881835938, 24.970016479492188, 39.03355407714844, 53.09709167480469, 67.16062927246094, 81.22416687011719, 95.2876968383789, 109.35123443603516, 123.4147720336914, 137.47830200195312, 151.54183959960938, 165.60537719726562, 179.66891479492188, 193.73245239257812, 207.79598999023438, 221.85952758789062, 235.92306518554688, 249.98660278320312, 264.0501403808594, 278.1136779785156, 292.1772155761719, 306.2407531738281, 320.3042907714844, 334.3678283691406, 348.4313659667969, 362.4949035644531, 376.5584411621094, 390.6219787597656, 404.6855163574219, 418.7490539550781, 432.8125915527344, 446.8761291503906, 460.9396667480469, 475.003173828125, 489.06671142578125, 503.1302490234375, 517.1937866210938, 531.25732421875, 545.3208618164062, 559.3843994140625, 573.4479370117188, 587.511474609375, 601.5750122070312, 615.6385498046875, 629.7020874023438, 643.765625, 657.8291625976562, 671.8927001953125, 685.9562377929688, 700.019775390625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 5.0, 20.0, 16.0, 21.0, 27.0, 30.0, 33.0, 32.0, 46.0, 48.0, 46.0, 59.0, 60.0, 60.0, 69.0, 60.0, 62.0, 48.0, 34.0, 34.0, 40.0, 26.0, 34.0, 20.0, 16.0, 8.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.64389038085938, -216.002197265625, -209.36050415039062, -202.71881103515625, -196.07711791992188, -189.4354248046875, -182.79373168945312, -176.15203857421875, -169.51034545898438, -162.86865234375, -156.22695922851562, -149.58526611328125, -142.94357299804688, -136.3018798828125, -129.66018676757812, -123.01849365234375, -116.37680053710938, -109.735107421875, -103.09341430664062, -96.45172119140625, -89.81002807617188, -83.1683349609375, -76.52664184570312, -69.88494873046875, -63.243255615234375, -56.6015625, -49.959869384765625, -43.31817626953125, -36.676483154296875, -30.0347900390625, -23.393096923828125, -16.75140380859375, -10.109710693359375, -3.468017578125, 3.173675537109375, 9.81536865234375, 16.457061767578125, 23.0987548828125, 29.740447998046875, 36.38214111328125, 43.023834228515625, 49.66552734375, 56.307220458984375, 62.94891357421875, 69.59060668945312, 76.2322998046875, 82.87399291992188, 89.51568603515625, 96.15737915039062, 102.799072265625, 109.44076538085938, 116.08245849609375, 122.72415161132812, 129.3658447265625, 136.00753784179688, 142.64923095703125, 149.29092407226562, 155.9326171875, 162.57431030273438, 169.21600341796875, 175.85769653320312, 182.4993896484375, 189.14108276367188, 195.78277587890625, 202.42446899414062]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 9.0, 16.0, 12.0, 41.0, 66.0, 90.0, 138.0, 220.0, 369.0, 702.0, 1120.0, 2193.0, 5651.0, 3882806.0, 290332.0, 5584.0, 2164.0, 1151.0, 637.0, 362.0, 225.0, 152.0, 80.0, 42.0, 41.0, 20.0, 22.0, 6.0, 7.0, 4.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -35.057373046875, -34.08349609375, -33.109619140625, -32.1357421875, -31.161865234375, -30.18798828125, -29.214111328125, -28.240234375, -27.266357421875, -26.29248046875, -25.318603515625, -24.3447265625, -23.370849609375, -22.39697265625, -21.423095703125, -20.44921875, -19.475341796875, -18.50146484375, -17.527587890625, -16.5537109375, -15.579833984375, -14.60595703125, -13.632080078125, -12.658203125, -11.684326171875, -10.71044921875, -9.736572265625, -8.7626953125, -7.788818359375, -6.81494140625, -5.841064453125, -4.8671875, -3.893310546875, -2.91943359375, -1.945556640625, -0.9716796875, 0.002197265625, 0.97607421875, 1.949951171875, 2.923828125, 3.897705078125, 4.87158203125, 5.845458984375, 6.8193359375, 7.793212890625, 8.76708984375, 9.740966796875, 10.71484375, 11.688720703125, 12.66259765625, 13.636474609375, 14.6103515625, 15.584228515625, 16.55810546875, 17.531982421875, 18.505859375, 19.479736328125, 20.45361328125, 21.427490234375, 22.4013671875, 23.375244140625, 24.34912109375, 25.322998046875, 26.296875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 1.0, 5.0, 7.0, 7.0, 8.0, 12.0, 20.0, 16.0, 24.0, 27.0, 49.0, 52.0, 61.0, 76.0, 78.0, 100.0, 89.0, 80.0, 61.0, 59.0, 45.0, 22.0, 31.0, 10.0, 10.0, 16.0, 8.0, 4.0, 9.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.53125, -13.146728515625, -12.76220703125, -12.377685546875, -11.9931640625, -11.608642578125, -11.22412109375, -10.839599609375, -10.455078125, -10.070556640625, -9.68603515625, -9.301513671875, -8.9169921875, -8.532470703125, -8.14794921875, -7.763427734375, -7.37890625, -6.994384765625, -6.60986328125, -6.225341796875, -5.8408203125, -5.456298828125, -5.07177734375, -4.687255859375, -4.302734375, -3.918212890625, -3.53369140625, -3.149169921875, -2.7646484375, -2.380126953125, -1.99560546875, -1.611083984375, -1.2265625, -0.842041015625, -0.45751953125, -0.072998046875, 0.3115234375, 0.696044921875, 1.08056640625, 1.465087890625, 1.849609375, 2.234130859375, 2.61865234375, 3.003173828125, 3.3876953125, 3.772216796875, 4.15673828125, 4.541259765625, 4.92578125, 5.310302734375, 5.69482421875, 6.079345703125, 6.4638671875, 6.848388671875, 7.23291015625, 7.617431640625, 8.001953125, 8.386474609375, 8.77099609375, 9.155517578125, 9.5400390625, 9.924560546875, 10.30908203125, 10.693603515625, 11.078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 5.0, 9.0, 12.0, 22.0, 34.0, 35.0, 47.0, 88.0, 117.0, 134.0, 220.0, 267.0, 431.0, 722.0, 1113.0, 2289.0, 5795.0, 44245.0, 4122898.0, 8961.0, 2898.0, 1426.0, 811.0, 527.0, 318.0, 250.0, 165.0, 114.0, 81.0, 72.0, 43.0, 35.0, 28.0, 16.0, 12.0, 13.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.6875, -54.6005859375, -52.513671875, -50.4267578125, -48.33984375, -46.2529296875, -44.166015625, -42.0791015625, -39.9921875, -37.9052734375, -35.818359375, -33.7314453125, -31.64453125, -29.5576171875, -27.470703125, -25.3837890625, -23.296875, -21.2099609375, -19.123046875, -17.0361328125, -14.94921875, -12.8623046875, -10.775390625, -8.6884765625, -6.6015625, -4.5146484375, -2.427734375, -0.3408203125, 1.74609375, 3.8330078125, 5.919921875, 8.0068359375, 10.09375, 12.1806640625, 14.267578125, 16.3544921875, 18.44140625, 20.5283203125, 22.615234375, 24.7021484375, 26.7890625, 28.8759765625, 30.962890625, 33.0498046875, 35.13671875, 37.2236328125, 39.310546875, 41.3974609375, 43.484375, 45.5712890625, 47.658203125, 49.7451171875, 51.83203125, 53.9189453125, 56.005859375, 58.0927734375, 60.1796875, 62.2666015625, 64.353515625, 66.4404296875, 68.52734375, 70.6142578125, 72.701171875, 74.7880859375, 76.875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 19.0, 70.0, 3922.0, 23.0, 12.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.234375, -17.652099609375, -17.06982421875, -16.487548828125, -15.9052734375, -15.322998046875, -14.74072265625, -14.158447265625, -13.576171875, -12.993896484375, -12.41162109375, -11.829345703125, -11.2470703125, -10.664794921875, -10.08251953125, -9.500244140625, -8.91796875, -8.335693359375, -7.75341796875, -7.171142578125, -6.5888671875, -6.006591796875, -5.42431640625, -4.842041015625, -4.259765625, -3.677490234375, -3.09521484375, -2.512939453125, -1.9306640625, -1.348388671875, -0.76611328125, -0.183837890625, 0.3984375, 0.980712890625, 1.56298828125, 2.145263671875, 2.7275390625, 3.309814453125, 3.89208984375, 4.474365234375, 5.056640625, 5.638916015625, 6.22119140625, 6.803466796875, 7.3857421875, 7.968017578125, 8.55029296875, 9.132568359375, 9.71484375, 10.297119140625, 10.87939453125, 11.461669921875, 12.0439453125, 12.626220703125, 13.20849609375, 13.790771484375, 14.373046875, 14.955322265625, 15.53759765625, 16.119873046875, 16.7021484375, 17.284423828125, 17.86669921875, 18.448974609375, 19.03125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 16.0, 12.0, 23.0, 29.0, 35.0, 49.0, 77.0, 84.0, 113.0, 108.0, 96.0, 77.0, 65.0, 65.0, 34.0, 25.0, 22.0, 13.0, 13.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0], "bins": [-39.454681396484375, -38.56031799316406, -37.66595458984375, -36.77159118652344, -35.877227783203125, -34.98286437988281, -34.0885009765625, -33.19413757324219, -32.299774169921875, -31.405410766601562, -30.51104736328125, -29.616683959960938, -28.722320556640625, -27.827957153320312, -26.93359375, -26.039230346679688, -25.144865036010742, -24.25050163269043, -23.356138229370117, -22.461774826049805, -21.567411422729492, -20.67304801940918, -19.778682708740234, -18.884319305419922, -17.98995590209961, -17.095592498779297, -16.201229095458984, -15.306865692138672, -14.41250228881836, -13.518138885498047, -12.623774528503418, -11.729411125183105, -10.83504867553711, -9.940685272216797, -9.046321868896484, -8.151958465576172, -7.257594585418701, -6.363231182098389, -5.468867301940918, -4.5745038986206055, -3.680140495300293, -2.7857770919799805, -1.8914134502410889, -0.9970498085021973, -0.10268640518188477, 0.7916769981384277, 1.6860408782958984, 2.580404281616211, 3.4747676849365234, 4.369131088256836, 5.263494491577148, 6.157858371734619, 7.052221775054932, 7.946585178375244, 8.840949058532715, 9.735312461853027, 10.62967586517334, 11.524039268493652, 12.418402671813965, 13.312767028808594, 14.207130432128906, 15.101493835449219, 15.995857238769531, 16.890220642089844, 17.784584045410156]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 6.0, 9.0, 9.0, 9.0, 17.0, 13.0, 19.0, 22.0, 27.0, 36.0, 18.0, 36.0, 36.0, 33.0, 34.0, 39.0, 37.0, 43.0, 43.0, 49.0, 46.0, 43.0, 45.0, 42.0, 43.0, 26.0, 38.0, 30.0, 29.0, 19.0, 24.0, 13.0, 12.0, 16.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.786033630371094, -20.14051055908203, -19.49498748779297, -18.849464416503906, -18.203941345214844, -17.55841827392578, -16.91289520263672, -16.267372131347656, -15.621849060058594, -14.976325988769531, -14.330802917480469, -13.685279846191406, -13.039756774902344, -12.394233703613281, -11.748710632324219, -11.103187561035156, -10.457664489746094, -9.812141418457031, -9.166618347167969, -8.521095275878906, -7.875572204589844, -7.230049133300781, -6.584526062011719, -5.939002990722656, -5.293479919433594, -4.647956848144531, -4.002433776855469, -3.3569107055664062, -2.7113876342773438, -2.0658645629882812, -1.4203414916992188, -0.7748184204101562, -0.12929534912109375, 0.5162277221679688, 1.1617507934570312, 1.8072738647460938, 2.4527969360351562, 3.0983200073242188, 3.7438430786132812, 4.389366149902344, 5.034889221191406, 5.680412292480469, 6.325935363769531, 6.971458435058594, 7.616981506347656, 8.262504577636719, 8.908027648925781, 9.553550720214844, 10.199073791503906, 10.844596862792969, 11.490119934082031, 12.135643005371094, 12.781166076660156, 13.426689147949219, 14.072212219238281, 14.717735290527344, 15.363258361816406, 16.00878143310547, 16.65430450439453, 17.299827575683594, 17.945350646972656, 18.59087371826172, 19.23639678955078, 19.881919860839844, 20.527442932128906]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 5.0, 8.0, 12.0, 15.0, 22.0, 23.0, 52.0, 77.0, 101.0, 165.0, 220.0, 391.0, 592.0, 931.0, 1620.0, 2744.0, 5010.0, 8999.0, 17765.0, 36449.0, 81646.0, 207099.0, 371666.0, 174836.0, 70687.0, 32415.0, 16013.0, 8095.0, 4494.0, 2396.0, 1472.0, 924.0, 567.0, 332.0, 236.0, 159.0, 104.0, 61.0, 45.0, 37.0, 14.0, 21.0, 4.0, 10.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-15.359375, -14.9130859375, -14.466796875, -14.0205078125, -13.57421875, -13.1279296875, -12.681640625, -12.2353515625, -11.7890625, -11.3427734375, -10.896484375, -10.4501953125, -10.00390625, -9.5576171875, -9.111328125, -8.6650390625, -8.21875, -7.7724609375, -7.326171875, -6.8798828125, -6.43359375, -5.9873046875, -5.541015625, -5.0947265625, -4.6484375, -4.2021484375, -3.755859375, -3.3095703125, -2.86328125, -2.4169921875, -1.970703125, -1.5244140625, -1.078125, -0.6318359375, -0.185546875, 0.2607421875, 0.70703125, 1.1533203125, 1.599609375, 2.0458984375, 2.4921875, 2.9384765625, 3.384765625, 3.8310546875, 4.27734375, 4.7236328125, 5.169921875, 5.6162109375, 6.0625, 6.5087890625, 6.955078125, 7.4013671875, 7.84765625, 8.2939453125, 8.740234375, 9.1865234375, 9.6328125, 10.0791015625, 10.525390625, 10.9716796875, 11.41796875, 11.8642578125, 12.310546875, 12.7568359375, 13.203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 3.0, 5.0, 3.0, 11.0, 6.0, 10.0, 9.0, 14.0, 12.0, 20.0, 25.0, 35.0, 37.0, 41.0, 53.0, 51.0, 64.0, 70.0, 73.0, 67.0, 62.0, 47.0, 55.0, 41.0, 31.0, 33.0, 30.0, 21.0, 12.0, 9.0, 5.0, 9.0, 7.0, 10.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.859375, -10.53076171875, -10.2021484375, -9.87353515625, -9.544921875, -9.21630859375, -8.8876953125, -8.55908203125, -8.23046875, -7.90185546875, -7.5732421875, -7.24462890625, -6.916015625, -6.58740234375, -6.2587890625, -5.93017578125, -5.6015625, -5.27294921875, -4.9443359375, -4.61572265625, -4.287109375, -3.95849609375, -3.6298828125, -3.30126953125, -2.97265625, -2.64404296875, -2.3154296875, -1.98681640625, -1.658203125, -1.32958984375, -1.0009765625, -0.67236328125, -0.34375, -0.01513671875, 0.3134765625, 0.64208984375, 0.970703125, 1.29931640625, 1.6279296875, 1.95654296875, 2.28515625, 2.61376953125, 2.9423828125, 3.27099609375, 3.599609375, 3.92822265625, 4.2568359375, 4.58544921875, 4.9140625, 5.24267578125, 5.5712890625, 5.89990234375, 6.228515625, 6.55712890625, 6.8857421875, 7.21435546875, 7.54296875, 7.87158203125, 8.2001953125, 8.52880859375, 8.857421875, 9.18603515625, 9.5146484375, 9.84326171875, 10.171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 6.0, 17.0, 17.0, 26.0, 45.0, 50.0, 103.0, 143.0, 212.0, 381.0, 677.0, 1574.0, 3808.0, 11522.0, 45600.0, 273010.0, 586220.0, 94334.0, 20344.0, 6031.0, 2175.0, 887.0, 532.0, 279.0, 178.0, 91.0, 88.0, 56.0, 31.0, 30.0, 10.0, 14.0, 16.0, 8.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-31.28125, -30.3671875, -29.453125, -28.5390625, -27.625, -26.7109375, -25.796875, -24.8828125, -23.96875, -23.0546875, -22.140625, -21.2265625, -20.3125, -19.3984375, -18.484375, -17.5703125, -16.65625, -15.7421875, -14.828125, -13.9140625, -13.0, -12.0859375, -11.171875, -10.2578125, -9.34375, -8.4296875, -7.515625, -6.6015625, -5.6875, -4.7734375, -3.859375, -2.9453125, -2.03125, -1.1171875, -0.203125, 0.7109375, 1.625, 2.5390625, 3.453125, 4.3671875, 5.28125, 6.1953125, 7.109375, 8.0234375, 8.9375, 9.8515625, 10.765625, 11.6796875, 12.59375, 13.5078125, 14.421875, 15.3359375, 16.25, 17.1640625, 18.078125, 18.9921875, 19.90625, 20.8203125, 21.734375, 22.6484375, 23.5625, 24.4765625, 25.390625, 26.3046875, 27.21875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 13.0, 13.0, 15.0, 13.0, 23.0, 36.0, 37.0, 43.0, 52.0, 54.0, 55.0, 56.0, 64.0, 81.0, 57.0, 57.0, 63.0, 57.0, 40.0, 38.0, 24.0, 31.0, 15.0, 15.0, 16.0, 9.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-71.6875, -69.7666015625, -67.845703125, -65.9248046875, -64.00390625, -62.0830078125, -60.162109375, -58.2412109375, -56.3203125, -54.3994140625, -52.478515625, -50.5576171875, -48.63671875, -46.7158203125, -44.794921875, -42.8740234375, -40.953125, -39.0322265625, -37.111328125, -35.1904296875, -33.26953125, -31.3486328125, -29.427734375, -27.5068359375, -25.5859375, -23.6650390625, -21.744140625, -19.8232421875, -17.90234375, -15.9814453125, -14.060546875, -12.1396484375, -10.21875, -8.2978515625, -6.376953125, -4.4560546875, -2.53515625, -0.6142578125, 1.306640625, 3.2275390625, 5.1484375, 7.0693359375, 8.990234375, 10.9111328125, 12.83203125, 14.7529296875, 16.673828125, 18.5947265625, 20.515625, 22.4365234375, 24.357421875, 26.2783203125, 28.19921875, 30.1201171875, 32.041015625, 33.9619140625, 35.8828125, 37.8037109375, 39.724609375, 41.6455078125, 43.56640625, 45.4873046875, 47.408203125, 49.3291015625, 51.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 11.0, 14.0, 15.0, 28.0, 57.0, 113.0, 219.0, 524.0, 1613.0, 8297.0, 227297.0, 793024.0, 13724.0, 2367.0, 702.0, 262.0, 127.0, 67.0, 37.0, 21.0, 13.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.03125, -37.7353515625, -36.439453125, -35.1435546875, -33.84765625, -32.5517578125, -31.255859375, -29.9599609375, -28.6640625, -27.3681640625, -26.072265625, -24.7763671875, -23.48046875, -22.1845703125, -20.888671875, -19.5927734375, -18.296875, -17.0009765625, -15.705078125, -14.4091796875, -13.11328125, -11.8173828125, -10.521484375, -9.2255859375, -7.9296875, -6.6337890625, -5.337890625, -4.0419921875, -2.74609375, -1.4501953125, -0.154296875, 1.1416015625, 2.4375, 3.7333984375, 5.029296875, 6.3251953125, 7.62109375, 8.9169921875, 10.212890625, 11.5087890625, 12.8046875, 14.1005859375, 15.396484375, 16.6923828125, 17.98828125, 19.2841796875, 20.580078125, 21.8759765625, 23.171875, 24.4677734375, 25.763671875, 27.0595703125, 28.35546875, 29.6513671875, 30.947265625, 32.2431640625, 33.5390625, 34.8349609375, 36.130859375, 37.4267578125, 38.72265625, 40.0185546875, 41.314453125, 42.6103515625, 43.90625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 7.0, 16.0, 46.0, 34.0, 64.0, 91.0, 145.0, 160.0, 134.0, 89.0, 61.0, 37.0, 26.0, 19.0, 14.0, 8.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002323150634765625, -0.0022316575050354004, -0.0021401643753051758, -0.002048671245574951, -0.0019571781158447266, -0.001865684986114502, -0.0017741918563842773, -0.0016826987266540527, -0.0015912055969238281, -0.0014997124671936035, -0.001408219337463379, -0.0013167262077331543, -0.0012252330780029297, -0.001133739948272705, -0.0010422468185424805, -0.0009507536888122559, -0.0008592605590820312, -0.0007677674293518066, -0.000676274299621582, -0.0005847811698913574, -0.0004932880401611328, -0.0004017949104309082, -0.0003103017807006836, -0.00021880865097045898, -0.00012731552124023438, -3.5822391510009766e-05, 5.5670738220214844e-05, 0.00014716386795043945, 0.00023865699768066406, 0.00033015012741088867, 0.0004216432571411133, 0.0005131363868713379, 0.0006046295166015625, 0.0006961226463317871, 0.0007876157760620117, 0.0008791089057922363, 0.0009706020355224609, 0.0010620951652526855, 0.0011535882949829102, 0.0012450814247131348, 0.0013365745544433594, 0.001428067684173584, 0.0015195608139038086, 0.0016110539436340332, 0.0017025470733642578, 0.0017940402030944824, 0.001885533332824707, 0.0019770264625549316, 0.0020685195922851562, 0.002160012722015381, 0.0022515058517456055, 0.00234299898147583, 0.0024344921112060547, 0.0025259852409362793, 0.002617478370666504, 0.0027089715003967285, 0.002800464630126953, 0.0028919577598571777, 0.0029834508895874023, 0.003074944019317627, 0.0031664371490478516, 0.003257930278778076, 0.0033494234085083008, 0.0034409165382385254, 0.00353240966796875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 4.0, 8.0, 8.0, 12.0, 24.0, 30.0, 53.0, 85.0, 180.0, 416.0, 1028.0, 3049.0, 15412.0, 514999.0, 492964.0, 15229.0, 3199.0, 1024.0, 401.0, 189.0, 107.0, 54.0, 33.0, 18.0, 9.0, 6.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.453125, -30.368408203125, -29.28369140625, -28.198974609375, -27.1142578125, -26.029541015625, -24.94482421875, -23.860107421875, -22.775390625, -21.690673828125, -20.60595703125, -19.521240234375, -18.4365234375, -17.351806640625, -16.26708984375, -15.182373046875, -14.09765625, -13.012939453125, -11.92822265625, -10.843505859375, -9.7587890625, -8.674072265625, -7.58935546875, -6.504638671875, -5.419921875, -4.335205078125, -3.25048828125, -2.165771484375, -1.0810546875, 0.003662109375, 1.08837890625, 2.173095703125, 3.2578125, 4.342529296875, 5.42724609375, 6.511962890625, 7.5966796875, 8.681396484375, 9.76611328125, 10.850830078125, 11.935546875, 13.020263671875, 14.10498046875, 15.189697265625, 16.2744140625, 17.359130859375, 18.44384765625, 19.528564453125, 20.61328125, 21.697998046875, 22.78271484375, 23.867431640625, 24.9521484375, 26.036865234375, 27.12158203125, 28.206298828125, 29.291015625, 30.375732421875, 31.46044921875, 32.545166015625, 33.6298828125, 34.714599609375, 35.79931640625, 36.884033203125, 37.96875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 16.0, 19.0, 34.0, 137.0, 305.0, 239.0, 115.0, 52.0, 22.0, 11.0, 7.0, 7.0, 4.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.375, -45.47265625, -43.5703125, -41.66796875, -39.765625, -37.86328125, -35.9609375, -34.05859375, -32.15625, -30.25390625, -28.3515625, -26.44921875, -24.546875, -22.64453125, -20.7421875, -18.83984375, -16.9375, -15.03515625, -13.1328125, -11.23046875, -9.328125, -7.42578125, -5.5234375, -3.62109375, -1.71875, 0.18359375, 2.0859375, 3.98828125, 5.890625, 7.79296875, 9.6953125, 11.59765625, 13.5, 15.40234375, 17.3046875, 19.20703125, 21.109375, 23.01171875, 24.9140625, 26.81640625, 28.71875, 30.62109375, 32.5234375, 34.42578125, 36.328125, 38.23046875, 40.1328125, 42.03515625, 43.9375, 45.83984375, 47.7421875, 49.64453125, 51.546875, 53.44921875, 55.3515625, 57.25390625, 59.15625, 61.05859375, 62.9609375, 64.86328125, 66.765625, 68.66796875, 70.5703125, 72.47265625, 74.375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 13.0, 24.0, 58.0, 119.0, 206.0, 229.0, 203.0, 95.0, 37.0, 7.0, 7.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-579.4825439453125, -564.4634399414062, -549.4443359375, -534.42529296875, -519.4061889648438, -504.3870849609375, -489.3680114746094, -474.3489074707031, -459.329833984375, -444.31072998046875, -429.2916564941406, -414.2725524902344, -399.25347900390625, -384.234375, -369.2153015136719, -354.1961975097656, -339.1771240234375, -324.15802001953125, -309.1389465332031, -294.1198425292969, -279.10076904296875, -264.0816650390625, -249.06259155273438, -234.04348754882812, -219.02438354492188, -204.0052947998047, -188.9862060546875, -173.9671173095703, -158.94802856445312, -143.92892456054688, -128.90985107421875, -113.89075469970703, -98.87167358398438, -83.85258483886719, -68.83349609375, -53.81440353393555, -38.79531478881836, -23.776222229003906, -8.757133483886719, 6.261955261230469, 21.281044006347656, 36.300132751464844, 51.31922149658203, 66.33831787109375, 81.35740661621094, 96.37649536132812, 111.39558410644531, 126.4146728515625, 141.4337615966797, 156.45285034179688, 171.47193908691406, 186.49102783203125, 201.51011657714844, 216.52920532226562, 231.54830932617188, 246.5673828125, 261.58648681640625, 276.6055908203125, 291.6246643066406, 306.6437683105469, 321.662841796875, 336.68194580078125, 351.7010192871094, 366.7201232910156, 381.73919677734375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 1.0, 6.0, 4.0, 8.0, 11.0, 9.0, 10.0, 18.0, 21.0, 27.0, 29.0, 31.0, 52.0, 33.0, 41.0, 41.0, 51.0, 57.0, 52.0, 59.0, 54.0, 63.0, 46.0, 44.0, 32.0, 27.0, 30.0, 25.0, 15.0, 25.0, 16.0, 13.0, 9.0, 12.0, 4.0, 7.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.02581787109375, -233.4842529296875, -225.9427032470703, -218.40113830566406, -210.85958862304688, -203.31802368164062, -195.77645874023438, -188.23489379882812, -180.69334411621094, -173.1517791748047, -165.6102294921875, -158.06866455078125, -150.527099609375, -142.9855499267578, -135.44398498535156, -127.90242767333984, -120.36087036132812, -112.8193130493164, -105.27775573730469, -97.73619079589844, -90.19463348388672, -82.653076171875, -75.11151123046875, -67.56995391845703, -60.02839660644531, -52.486839294433594, -44.94527816772461, -37.403717041015625, -29.862159729003906, -22.320602416992188, -14.779041290283203, -7.237480163574219, 0.3040924072265625, 7.845651626586914, 15.387210845947266, 22.928770065307617, 30.47032928466797, 38.01188659667969, 45.55344772338867, 53.095008850097656, 60.636566162109375, 68.1781234741211, 75.71968078613281, 83.26124572753906, 90.80280303955078, 98.3443603515625, 105.88592529296875, 113.42748260498047, 120.96903991699219, 128.51060485839844, 136.05215454101562, 143.59371948242188, 151.13528442382812, 158.6768341064453, 166.21839904785156, 173.75994873046875, 181.301513671875, 188.84307861328125, 196.38462829589844, 203.9261932373047, 211.46774291992188, 219.00930786132812, 226.55087280273438, 234.09243774414062, 241.6339874267578]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 8.0, 16.0, 11.0, 14.0, 32.0, 44.0, 56.0, 124.0, 186.0, 380.0, 643.0, 1279.0, 2511.0, 5872.0, 27310.0, 4126907.0, 19157.0, 4988.0, 2186.0, 1106.0, 590.0, 351.0, 188.0, 118.0, 66.0, 41.0, 27.0, 17.0, 13.0, 9.0, 8.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.3125, -36.0859375, -34.859375, -33.6328125, -32.40625, -31.1796875, -29.953125, -28.7265625, -27.5, -26.2734375, -25.046875, -23.8203125, -22.59375, -21.3671875, -20.140625, -18.9140625, -17.6875, -16.4609375, -15.234375, -14.0078125, -12.78125, -11.5546875, -10.328125, -9.1015625, -7.875, -6.6484375, -5.421875, -4.1953125, -2.96875, -1.7421875, -0.515625, 0.7109375, 1.9375, 3.1640625, 4.390625, 5.6171875, 6.84375, 8.0703125, 9.296875, 10.5234375, 11.75, 12.9765625, 14.203125, 15.4296875, 16.65625, 17.8828125, 19.109375, 20.3359375, 21.5625, 22.7890625, 24.015625, 25.2421875, 26.46875, 27.6953125, 28.921875, 30.1484375, 31.375, 32.6015625, 33.828125, 35.0546875, 36.28125, 37.5078125, 38.734375, 39.9609375, 41.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 8.0, 7.0, 15.0, 23.0, 34.0, 46.0, 52.0, 71.0, 99.0, 94.0, 120.0, 100.0, 77.0, 68.0, 67.0, 33.0, 28.0, 15.0, 11.0, 5.0, 2.0, 7.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.592529296875, -15.06005859375, -14.527587890625, -13.9951171875, -13.462646484375, -12.93017578125, -12.397705078125, -11.865234375, -11.332763671875, -10.80029296875, -10.267822265625, -9.7353515625, -9.202880859375, -8.67041015625, -8.137939453125, -7.60546875, -7.072998046875, -6.54052734375, -6.008056640625, -5.4755859375, -4.943115234375, -4.41064453125, -3.878173828125, -3.345703125, -2.813232421875, -2.28076171875, -1.748291015625, -1.2158203125, -0.683349609375, -0.15087890625, 0.381591796875, 0.9140625, 1.446533203125, 1.97900390625, 2.511474609375, 3.0439453125, 3.576416015625, 4.10888671875, 4.641357421875, 5.173828125, 5.706298828125, 6.23876953125, 6.771240234375, 7.3037109375, 7.836181640625, 8.36865234375, 8.901123046875, 9.43359375, 9.966064453125, 10.49853515625, 11.031005859375, 11.5634765625, 12.095947265625, 12.62841796875, 13.160888671875, 13.693359375, 14.225830078125, 14.75830078125, 15.290771484375, 15.8232421875, 16.355712890625, 16.88818359375, 17.420654296875, 17.953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 6.0, 5.0, 7.0, 8.0, 10.0, 20.0, 15.0, 37.0, 36.0, 51.0, 75.0, 110.0, 156.0, 287.0, 428.0, 749.0, 1324.0, 2737.0, 6459.0, 29194.0, 4099626.0, 38885.0, 7607.0, 2934.0, 1402.0, 765.0, 464.0, 292.0, 183.0, 107.0, 73.0, 58.0, 34.0, 28.0, 29.0, 21.0, 14.0, 14.0, 5.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.125, -47.6162109375, -46.107421875, -44.5986328125, -43.08984375, -41.5810546875, -40.072265625, -38.5634765625, -37.0546875, -35.5458984375, -34.037109375, -32.5283203125, -31.01953125, -29.5107421875, -28.001953125, -26.4931640625, -24.984375, -23.4755859375, -21.966796875, -20.4580078125, -18.94921875, -17.4404296875, -15.931640625, -14.4228515625, -12.9140625, -11.4052734375, -9.896484375, -8.3876953125, -6.87890625, -5.3701171875, -3.861328125, -2.3525390625, -0.84375, 0.6650390625, 2.173828125, 3.6826171875, 5.19140625, 6.7001953125, 8.208984375, 9.7177734375, 11.2265625, 12.7353515625, 14.244140625, 15.7529296875, 17.26171875, 18.7705078125, 20.279296875, 21.7880859375, 23.296875, 24.8056640625, 26.314453125, 27.8232421875, 29.33203125, 30.8408203125, 32.349609375, 33.8583984375, 35.3671875, 36.8759765625, 38.384765625, 39.8935546875, 41.40234375, 42.9111328125, 44.419921875, 45.9287109375, 47.4375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 19.0, 29.0, 97.0, 3794.0, 80.0, 19.0, 14.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6875, -14.671875, -13.65625, -12.640625, -11.625, -10.609375, -9.59375, -8.578125, -7.5625, -6.546875, -5.53125, -4.515625, -3.5, -2.484375, -1.46875, -0.453125, 0.5625, 1.578125, 2.59375, 3.609375, 4.625, 5.640625, 6.65625, 7.671875, 8.6875, 9.703125, 10.71875, 11.734375, 12.75, 13.765625, 14.78125, 15.796875, 16.8125, 17.828125, 18.84375, 19.859375, 20.875, 21.890625, 22.90625, 23.921875, 24.9375, 25.953125, 26.96875, 27.984375, 29.0, 30.015625, 31.03125, 32.046875, 33.0625, 34.078125, 35.09375, 36.109375, 37.125, 38.140625, 39.15625, 40.171875, 41.1875, 42.203125, 43.21875, 44.234375, 45.25, 46.265625, 47.28125, 48.296875, 49.3125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 31.0, 64.0, 151.0, 236.0, 229.0, 146.0, 79.0, 36.0, 15.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-202.22216796875, -198.413330078125, -194.6044921875, -190.795654296875, -186.98683166503906, -183.17799377441406, -179.36915588378906, -175.56031799316406, -171.75148010253906, -167.94264221191406, -164.13380432128906, -160.32498168945312, -156.51614379882812, -152.70730590820312, -148.89846801757812, -145.08963012695312, -141.28079223632812, -137.47195434570312, -133.66311645507812, -129.85427856445312, -126.04544830322266, -122.23661804199219, -118.42778015136719, -114.61894226074219, -110.81011962890625, -107.00128173828125, -103.19245147705078, -99.38361358642578, -95.57477569580078, -91.76594543457031, -87.95710754394531, -84.14826965332031, -80.33943939208984, -76.53060150146484, -72.72177124023438, -68.91293334960938, -65.10409545898438, -61.29526138305664, -57.486427307128906, -53.677589416503906, -49.86875534057617, -46.05992126464844, -42.25108337402344, -38.4422492980957, -34.63341522216797, -30.82457733154297, -27.015743255615234, -23.206907272338867, -19.3980712890625, -15.589235305786133, -11.780400276184082, -7.971565246582031, -4.162729263305664, -0.3538932800292969, 3.4549407958984375, 7.263776779174805, 11.072612762451172, 14.881448745727539, 18.690284729003906, 22.49911880493164, 26.307954788208008, 30.116790771484375, 33.92562484741211, 37.734458923339844, 41.543296813964844]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 7.0, 12.0, 16.0, 36.0, 43.0, 65.0, 81.0, 101.0, 115.0, 94.0, 94.0, 98.0, 72.0, 52.0, 40.0, 27.0, 19.0, 8.0, 8.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.82682800292969, -100.86724090576172, -97.90765380859375, -94.94806671142578, -91.98847961425781, -89.02888488769531, -86.06929779052734, -83.10971069335938, -80.1501235961914, -77.19053649902344, -74.23094940185547, -71.2713623046875, -68.311767578125, -65.35218048095703, -62.39259338378906, -59.433006286621094, -56.473419189453125, -53.513832092285156, -50.55424499511719, -47.59465408325195, -44.635066986083984, -41.675479888916016, -38.71588897705078, -35.75630187988281, -32.796714782714844, -29.837127685546875, -26.877538681030273, -23.917949676513672, -20.958362579345703, -17.998775482177734, -15.039186477661133, -12.079597473144531, -9.120010375976562, -6.160422325134277, -3.200834274291992, -0.24124622344970703, 2.718341827392578, 5.677929878234863, 8.637517929077148, 11.59710693359375, 14.556694030761719, 17.516281127929688, 20.47587013244629, 23.43545913696289, 26.39504623413086, 29.354633331298828, 32.31422424316406, 35.27381134033203, 38.2333984375, 41.19298553466797, 44.15257263183594, 47.11216354370117, 50.07175064086914, 53.03133773803711, 55.990928649902344, 58.95051574707031, 61.91010284423828, 64.86968994140625, 67.82927703857422, 70.78886413574219, 73.74845886230469, 76.70804595947266, 79.66763305664062, 82.6272201538086, 85.58680725097656]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 6.0, 7.0, 11.0, 15.0, 20.0, 31.0, 56.0, 78.0, 161.0, 281.0, 515.0, 1151.0, 2982.0, 9292.0, 37717.0, 222848.0, 616707.0, 122647.0, 23621.0, 6230.0, 2276.0, 887.0, 445.0, 241.0, 119.0, 77.0, 50.0, 26.0, 18.0, 14.0, 13.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.78125, -25.7646484375, -24.748046875, -23.7314453125, -22.71484375, -21.6982421875, -20.681640625, -19.6650390625, -18.6484375, -17.6318359375, -16.615234375, -15.5986328125, -14.58203125, -13.5654296875, -12.548828125, -11.5322265625, -10.515625, -9.4990234375, -8.482421875, -7.4658203125, -6.44921875, -5.4326171875, -4.416015625, -3.3994140625, -2.3828125, -1.3662109375, -0.349609375, 0.6669921875, 1.68359375, 2.7001953125, 3.716796875, 4.7333984375, 5.75, 6.7666015625, 7.783203125, 8.7998046875, 9.81640625, 10.8330078125, 11.849609375, 12.8662109375, 13.8828125, 14.8994140625, 15.916015625, 16.9326171875, 17.94921875, 18.9658203125, 19.982421875, 20.9990234375, 22.015625, 23.0322265625, 24.048828125, 25.0654296875, 26.08203125, 27.0986328125, 28.115234375, 29.1318359375, 30.1484375, 31.1650390625, 32.181640625, 33.1982421875, 34.21484375, 35.2314453125, 36.248046875, 37.2646484375, 38.28125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 2.0, 7.0, 8.0, 10.0, 18.0, 23.0, 37.0, 49.0, 69.0, 86.0, 82.0, 102.0, 83.0, 102.0, 77.0, 66.0, 39.0, 36.0, 30.0, 22.0, 15.0, 10.0, 8.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.296875, -12.7666015625, -12.236328125, -11.7060546875, -11.17578125, -10.6455078125, -10.115234375, -9.5849609375, -9.0546875, -8.5244140625, -7.994140625, -7.4638671875, -6.93359375, -6.4033203125, -5.873046875, -5.3427734375, -4.8125, -4.2822265625, -3.751953125, -3.2216796875, -2.69140625, -2.1611328125, -1.630859375, -1.1005859375, -0.5703125, -0.0400390625, 0.490234375, 1.0205078125, 1.55078125, 2.0810546875, 2.611328125, 3.1416015625, 3.671875, 4.2021484375, 4.732421875, 5.2626953125, 5.79296875, 6.3232421875, 6.853515625, 7.3837890625, 7.9140625, 8.4443359375, 8.974609375, 9.5048828125, 10.03515625, 10.5654296875, 11.095703125, 11.6259765625, 12.15625, 12.6865234375, 13.216796875, 13.7470703125, 14.27734375, 14.8076171875, 15.337890625, 15.8681640625, 16.3984375, 16.9287109375, 17.458984375, 17.9892578125, 18.51953125, 19.0498046875, 19.580078125, 20.1103515625, 20.640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 8.0, 10.0, 9.0, 19.0, 22.0, 27.0, 38.0, 50.0, 65.0, 101.0, 138.0, 255.0, 416.0, 777.0, 1693.0, 4119.0, 12894.0, 56723.0, 415092.0, 470827.0, 63277.0, 13972.0, 4322.0, 1671.0, 780.0, 428.0, 270.0, 166.0, 116.0, 70.0, 48.0, 35.0, 32.0, 17.0, 13.0, 9.0, 7.0, 11.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.59375, -33.5771484375, -32.560546875, -31.5439453125, -30.52734375, -29.5107421875, -28.494140625, -27.4775390625, -26.4609375, -25.4443359375, -24.427734375, -23.4111328125, -22.39453125, -21.3779296875, -20.361328125, -19.3447265625, -18.328125, -17.3115234375, -16.294921875, -15.2783203125, -14.26171875, -13.2451171875, -12.228515625, -11.2119140625, -10.1953125, -9.1787109375, -8.162109375, -7.1455078125, -6.12890625, -5.1123046875, -4.095703125, -3.0791015625, -2.0625, -1.0458984375, -0.029296875, 0.9873046875, 2.00390625, 3.0205078125, 4.037109375, 5.0537109375, 6.0703125, 7.0869140625, 8.103515625, 9.1201171875, 10.13671875, 11.1533203125, 12.169921875, 13.1865234375, 14.203125, 15.2197265625, 16.236328125, 17.2529296875, 18.26953125, 19.2861328125, 20.302734375, 21.3193359375, 22.3359375, 23.3525390625, 24.369140625, 25.3857421875, 26.40234375, 27.4189453125, 28.435546875, 29.4521484375, 30.46875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 8.0, 7.0, 11.0, 14.0, 24.0, 32.0, 29.0, 44.0, 67.0, 58.0, 74.0, 64.0, 75.0, 80.0, 61.0, 75.0, 66.0, 56.0, 45.0, 28.0, 32.0, 14.0, 14.0, 8.0, 8.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.28125, -49.99365234375, -47.7060546875, -45.41845703125, -43.130859375, -40.84326171875, -38.5556640625, -36.26806640625, -33.98046875, -31.69287109375, -29.4052734375, -27.11767578125, -24.830078125, -22.54248046875, -20.2548828125, -17.96728515625, -15.6796875, -13.39208984375, -11.1044921875, -8.81689453125, -6.529296875, -4.24169921875, -1.9541015625, 0.33349609375, 2.62109375, 4.90869140625, 7.1962890625, 9.48388671875, 11.771484375, 14.05908203125, 16.3466796875, 18.63427734375, 20.921875, 23.20947265625, 25.4970703125, 27.78466796875, 30.072265625, 32.35986328125, 34.6474609375, 36.93505859375, 39.22265625, 41.51025390625, 43.7978515625, 46.08544921875, 48.373046875, 50.66064453125, 52.9482421875, 55.23583984375, 57.5234375, 59.81103515625, 62.0986328125, 64.38623046875, 66.673828125, 68.96142578125, 71.2490234375, 73.53662109375, 75.82421875, 78.11181640625, 80.3994140625, 82.68701171875, 84.974609375, 87.26220703125, 89.5498046875, 91.83740234375, 94.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 8.0, 4.0, 7.0, 12.0, 15.0, 14.0, 22.0, 35.0, 62.0, 77.0, 125.0, 206.0, 367.0, 690.0, 1391.0, 3073.0, 9729.0, 44687.0, 425964.0, 495219.0, 49945.0, 10284.0, 3394.0, 1459.0, 724.0, 387.0, 218.0, 145.0, 87.0, 64.0, 43.0, 29.0, 10.0, 17.0, 12.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.40625, -10.021240234375, -9.63623046875, -9.251220703125, -8.8662109375, -8.481201171875, -8.09619140625, -7.711181640625, -7.326171875, -6.941162109375, -6.55615234375, -6.171142578125, -5.7861328125, -5.401123046875, -5.01611328125, -4.631103515625, -4.24609375, -3.861083984375, -3.47607421875, -3.091064453125, -2.7060546875, -2.321044921875, -1.93603515625, -1.551025390625, -1.166015625, -0.781005859375, -0.39599609375, -0.010986328125, 0.3740234375, 0.759033203125, 1.14404296875, 1.529052734375, 1.9140625, 2.299072265625, 2.68408203125, 3.069091796875, 3.4541015625, 3.839111328125, 4.22412109375, 4.609130859375, 4.994140625, 5.379150390625, 5.76416015625, 6.149169921875, 6.5341796875, 6.919189453125, 7.30419921875, 7.689208984375, 8.07421875, 8.459228515625, 8.84423828125, 9.229248046875, 9.6142578125, 9.999267578125, 10.38427734375, 10.769287109375, 11.154296875, 11.539306640625, 11.92431640625, 12.309326171875, 12.6943359375, 13.079345703125, 13.46435546875, 13.849365234375, 14.234375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 9.0, 18.0, 22.0, 51.0, 92.0, 164.0, 236.0, 176.0, 104.0, 54.0, 24.0, 21.0, 7.0, 8.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004306793212890625, -0.004178524017333984, -0.004050254821777344, -0.003921985626220703, -0.0037937164306640625, -0.003665447235107422, -0.0035371780395507812, -0.0034089088439941406, -0.0032806396484375, -0.0031523704528808594, -0.0030241012573242188, -0.002895832061767578, -0.0027675628662109375, -0.002639293670654297, -0.0025110244750976562, -0.0023827552795410156, -0.002254486083984375, -0.0021262168884277344, -0.0019979476928710938, -0.0018696784973144531, -0.0017414093017578125, -0.0016131401062011719, -0.0014848709106445312, -0.0013566017150878906, -0.00122833251953125, -0.0011000633239746094, -0.0009717941284179688, -0.0008435249328613281, -0.0007152557373046875, -0.0005869865417480469, -0.00045871734619140625, -0.0003304481506347656, -0.000202178955078125, -7.390975952148438e-05, 5.435943603515625e-05, 0.00018262863159179688, 0.0003108978271484375, 0.0004391670227050781, 0.0005674362182617188, 0.0006957054138183594, 0.000823974609375, 0.0009522438049316406, 0.0010805130004882812, 0.0012087821960449219, 0.0013370513916015625, 0.0014653205871582031, 0.0015935897827148438, 0.0017218589782714844, 0.001850128173828125, 0.0019783973693847656, 0.0021066665649414062, 0.002234935760498047, 0.0023632049560546875, 0.002491474151611328, 0.0026197433471679688, 0.0027480125427246094, 0.00287628173828125, 0.0030045509338378906, 0.0031328201293945312, 0.003261089324951172, 0.0033893585205078125, 0.003517627716064453, 0.0036458969116210938, 0.0037741661071777344, 0.003902435302734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 12.0, 18.0, 20.0, 61.0, 113.0, 222.0, 564.0, 1609.0, 6429.0, 66657.0, 885227.0, 77860.0, 6982.0, 1712.0, 597.0, 232.0, 102.0, 77.0, 28.0, 13.0, 6.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.046875, -26.362548828125, -25.67822265625, -24.993896484375, -24.3095703125, -23.625244140625, -22.94091796875, -22.256591796875, -21.572265625, -20.887939453125, -20.20361328125, -19.519287109375, -18.8349609375, -18.150634765625, -17.46630859375, -16.781982421875, -16.09765625, -15.413330078125, -14.72900390625, -14.044677734375, -13.3603515625, -12.676025390625, -11.99169921875, -11.307373046875, -10.623046875, -9.938720703125, -9.25439453125, -8.570068359375, -7.8857421875, -7.201416015625, -6.51708984375, -5.832763671875, -5.1484375, -4.464111328125, -3.77978515625, -3.095458984375, -2.4111328125, -1.726806640625, -1.04248046875, -0.358154296875, 0.326171875, 1.010498046875, 1.69482421875, 2.379150390625, 3.0634765625, 3.747802734375, 4.43212890625, 5.116455078125, 5.80078125, 6.485107421875, 7.16943359375, 7.853759765625, 8.5380859375, 9.222412109375, 9.90673828125, 10.591064453125, 11.275390625, 11.959716796875, 12.64404296875, 13.328369140625, 14.0126953125, 14.697021484375, 15.38134765625, 16.065673828125, 16.75]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 13.0, 16.0, 32.0, 51.0, 79.0, 133.0, 184.0, 199.0, 129.0, 78.0, 31.0, 13.0, 10.0, 12.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.03125, -33.10693359375, -32.1826171875, -31.25830078125, -30.333984375, -29.40966796875, -28.4853515625, -27.56103515625, -26.63671875, -25.71240234375, -24.7880859375, -23.86376953125, -22.939453125, -22.01513671875, -21.0908203125, -20.16650390625, -19.2421875, -18.31787109375, -17.3935546875, -16.46923828125, -15.544921875, -14.62060546875, -13.6962890625, -12.77197265625, -11.84765625, -10.92333984375, -9.9990234375, -9.07470703125, -8.150390625, -7.22607421875, -6.3017578125, -5.37744140625, -4.453125, -3.52880859375, -2.6044921875, -1.68017578125, -0.755859375, 0.16845703125, 1.0927734375, 2.01708984375, 2.94140625, 3.86572265625, 4.7900390625, 5.71435546875, 6.638671875, 7.56298828125, 8.4873046875, 9.41162109375, 10.3359375, 11.26025390625, 12.1845703125, 13.10888671875, 14.033203125, 14.95751953125, 15.8818359375, 16.80615234375, 17.73046875, 18.65478515625, 19.5791015625, 20.50341796875, 21.427734375, 22.35205078125, 23.2763671875, 24.20068359375, 25.125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 25.0, 51.0, 124.0, 216.0, 236.0, 157.0, 105.0, 35.0, 20.0, 10.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-697.2694091796875, -683.71484375, -670.1603393554688, -656.6057739257812, -643.05126953125, -629.4967041015625, -615.9421997070312, -602.3876342773438, -588.8331298828125, -575.278564453125, -561.7240600585938, -548.1694946289062, -534.614990234375, -521.0604248046875, -507.5058898925781, -493.95135498046875, -480.39678955078125, -466.8422546386719, -453.2877197265625, -439.7331848144531, -426.17864990234375, -412.62408447265625, -399.0695495605469, -385.5150146484375, -371.9604797363281, -358.40594482421875, -344.8514099121094, -331.296875, -317.7423095703125, -304.18780517578125, -290.63323974609375, -277.0787048339844, -263.524169921875, -249.96963500976562, -236.41510009765625, -222.8605499267578, -209.30601501464844, -195.75148010253906, -182.19692993164062, -168.64239501953125, -155.0878448486328, -141.53330993652344, -127.97876739501953, -114.42422485351562, -100.86968994140625, -87.31515502929688, -73.76061248779297, -60.20606994628906, -46.65153503417969, -33.09699630737305, -19.542457580566406, -5.987918853759766, 7.566619873046875, 21.12115478515625, 34.675697326660156, 48.23023986816406, 61.78477478027344, 75.33930969238281, 88.89385223388672, 102.44839477539062, 116.0029296875, 129.55746459960938, 143.11199951171875, 156.6665496826172, 170.22108459472656]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 6.0, 10.0, 14.0, 15.0, 11.0, 11.0, 23.0, 15.0, 23.0, 29.0, 26.0, 39.0, 37.0, 44.0, 54.0, 54.0, 46.0, 63.0, 57.0, 47.0, 42.0, 44.0, 37.0, 38.0, 40.0, 36.0, 13.0, 21.0, 20.0, 12.0, 10.0, 7.0, 14.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-226.46847534179688, -218.4244842529297, -210.3804931640625, -202.33648681640625, -194.29249572753906, -186.24850463867188, -178.20449829101562, -170.16050720214844, -162.11651611328125, -154.07252502441406, -146.02853393554688, -137.98452758789062, -129.94053649902344, -121.89654541015625, -113.85254669189453, -105.80854797363281, -97.76455688476562, -89.72056579589844, -81.67656707763672, -73.632568359375, -65.58857727050781, -57.54458236694336, -49.500587463378906, -41.45659255981445, -33.41259765625, -25.368602752685547, -17.324607849121094, -9.28061294555664, -1.2366180419921875, 6.807376861572266, 14.851371765136719, 22.895366668701172, 30.9393310546875, 38.98332595825195, 47.027320861816406, 55.07131576538086, 63.11531066894531, 71.1593017578125, 79.20330047607422, 87.24729919433594, 95.29129028320312, 103.33528137207031, 111.37928009033203, 119.42327880859375, 127.46726989746094, 135.51126098632812, 143.55526733398438, 151.59925842285156, 159.64324951171875, 167.68724060058594, 175.73123168945312, 183.77523803710938, 191.81922912597656, 199.86322021484375, 207.9072265625, 215.9512176513672, 223.99520874023438, 232.03919982910156, 240.08319091796875, 248.127197265625, 256.17120361328125, 264.2151794433594, 272.2591857910156, 280.30316162109375, 288.34716796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 4.0, 11.0, 12.0, 18.0, 32.0, 46.0, 81.0, 103.0, 198.0, 331.0, 564.0, 1157.0, 2544.0, 6870.0, 26586.0, 225210.0, 3821028.0, 84412.0, 15760.0, 4999.0, 2002.0, 945.0, 508.0, 290.0, 180.0, 130.0, 80.0, 51.0, 37.0, 20.0, 21.0, 11.0, 6.0, 9.0, 4.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.4375, -27.3974609375, -26.357421875, -25.3173828125, -24.27734375, -23.2373046875, -22.197265625, -21.1572265625, -20.1171875, -19.0771484375, -18.037109375, -16.9970703125, -15.95703125, -14.9169921875, -13.876953125, -12.8369140625, -11.796875, -10.7568359375, -9.716796875, -8.6767578125, -7.63671875, -6.5966796875, -5.556640625, -4.5166015625, -3.4765625, -2.4365234375, -1.396484375, -0.3564453125, 0.68359375, 1.7236328125, 2.763671875, 3.8037109375, 4.84375, 5.8837890625, 6.923828125, 7.9638671875, 9.00390625, 10.0439453125, 11.083984375, 12.1240234375, 13.1640625, 14.2041015625, 15.244140625, 16.2841796875, 17.32421875, 18.3642578125, 19.404296875, 20.4443359375, 21.484375, 22.5244140625, 23.564453125, 24.6044921875, 25.64453125, 26.6845703125, 27.724609375, 28.7646484375, 29.8046875, 30.8447265625, 31.884765625, 32.9248046875, 33.96484375, 35.0048828125, 36.044921875, 37.0849609375, 38.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 5.0, 10.0, 12.0, 13.0, 29.0, 45.0, 56.0, 65.0, 89.0, 91.0, 122.0, 104.0, 93.0, 83.0, 60.0, 27.0, 27.0, 24.0, 16.0, 9.0, 9.0, 7.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.81103515625, -10.2626953125, -9.71435546875, -9.166015625, -8.61767578125, -8.0693359375, -7.52099609375, -6.97265625, -6.42431640625, -5.8759765625, -5.32763671875, -4.779296875, -4.23095703125, -3.6826171875, -3.13427734375, -2.5859375, -2.03759765625, -1.4892578125, -0.94091796875, -0.392578125, 0.15576171875, 0.7041015625, 1.25244140625, 1.80078125, 2.34912109375, 2.8974609375, 3.44580078125, 3.994140625, 4.54248046875, 5.0908203125, 5.63916015625, 6.1875, 6.73583984375, 7.2841796875, 7.83251953125, 8.380859375, 8.92919921875, 9.4775390625, 10.02587890625, 10.57421875, 11.12255859375, 11.6708984375, 12.21923828125, 12.767578125, 13.31591796875, 13.8642578125, 14.41259765625, 14.9609375, 15.50927734375, 16.0576171875, 16.60595703125, 17.154296875, 17.70263671875, 18.2509765625, 18.79931640625, 19.34765625, 19.89599609375, 20.4443359375, 20.99267578125, 21.541015625, 22.08935546875, 22.6376953125, 23.18603515625, 23.734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 8.0, 7.0, 12.0, 7.0, 17.0, 25.0, 44.0, 66.0, 162.0, 269.0, 646.0, 1540.0, 5126.0, 23214.0, 275530.0, 3807018.0, 65493.0, 10536.0, 2677.0, 979.0, 414.0, 190.0, 111.0, 61.0, 38.0, 18.0, 17.0, 17.0, 7.0, 9.0, 5.0, 5.0, 0.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.8125, -34.49853515625, -33.1845703125, -31.87060546875, -30.556640625, -29.24267578125, -27.9287109375, -26.61474609375, -25.30078125, -23.98681640625, -22.6728515625, -21.35888671875, -20.044921875, -18.73095703125, -17.4169921875, -16.10302734375, -14.7890625, -13.47509765625, -12.1611328125, -10.84716796875, -9.533203125, -8.21923828125, -6.9052734375, -5.59130859375, -4.27734375, -2.96337890625, -1.6494140625, -0.33544921875, 0.978515625, 2.29248046875, 3.6064453125, 4.92041015625, 6.234375, 7.54833984375, 8.8623046875, 10.17626953125, 11.490234375, 12.80419921875, 14.1181640625, 15.43212890625, 16.74609375, 18.06005859375, 19.3740234375, 20.68798828125, 22.001953125, 23.31591796875, 24.6298828125, 25.94384765625, 27.2578125, 28.57177734375, 29.8857421875, 31.19970703125, 32.513671875, 33.82763671875, 35.1416015625, 36.45556640625, 37.76953125, 39.08349609375, 40.3974609375, 41.71142578125, 43.025390625, 44.33935546875, 45.6533203125, 46.96728515625, 48.28125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 5.0, 13.0, 8.0, 17.0, 22.0, 27.0, 64.0, 126.0, 429.0, 1942.0, 984.0, 198.0, 96.0, 42.0, 27.0, 25.0, 19.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.25, -43.8671875, -42.484375, -41.1015625, -39.71875, -38.3359375, -36.953125, -35.5703125, -34.1875, -32.8046875, -31.421875, -30.0390625, -28.65625, -27.2734375, -25.890625, -24.5078125, -23.125, -21.7421875, -20.359375, -18.9765625, -17.59375, -16.2109375, -14.828125, -13.4453125, -12.0625, -10.6796875, -9.296875, -7.9140625, -6.53125, -5.1484375, -3.765625, -2.3828125, -1.0, 0.3828125, 1.765625, 3.1484375, 4.53125, 5.9140625, 7.296875, 8.6796875, 10.0625, 11.4453125, 12.828125, 14.2109375, 15.59375, 16.9765625, 18.359375, 19.7421875, 21.125, 22.5078125, 23.890625, 25.2734375, 26.65625, 28.0390625, 29.421875, 30.8046875, 32.1875, 33.5703125, 34.953125, 36.3359375, 37.71875, 39.1015625, 40.484375, 41.8671875, 43.25]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 24.0, 44.0, 128.0, 196.0, 233.0, 171.0, 91.0, 40.0, 17.0, 17.0, 10.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.45570373535156, -206.09664916992188, -196.73757934570312, -187.37852478027344, -178.0194549560547, -168.660400390625, -159.30133056640625, -149.94227600097656, -140.58322143554688, -131.2241668701172, -121.86509704589844, -112.50604248046875, -103.14697265625, -93.78791809082031, -84.4288558959961, -75.06979370117188, -65.71072387695312, -56.351661682128906, -46.99259948730469, -37.633541107177734, -28.274478912353516, -18.915416717529297, -9.556358337402344, -0.197296142578125, 9.161766052246094, 18.520828247070312, 27.8798885345459, 37.238948822021484, 46.5980110168457, 55.95707321166992, 65.31613159179688, 74.6751937866211, 84.03427124023438, 93.3933334350586, 102.75239562988281, 112.1114501953125, 121.47052001953125, 130.82957458496094, 140.18862915039062, 149.54769897460938, 158.90676879882812, 168.2658233642578, 177.62489318847656, 186.98394775390625, 196.343017578125, 205.7020721435547, 215.06112670898438, 224.42019653320312, 233.7792510986328, 243.1383056640625, 252.49737548828125, 261.8564453125, 271.2154846191406, 280.5745544433594, 289.9336242675781, 299.29266357421875, 308.6517333984375, 318.01080322265625, 327.3698425292969, 336.7289123535156, 346.0879821777344, 355.4470520019531, 364.80609130859375, 374.1651611328125, 383.52423095703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 8.0, 12.0, 15.0, 24.0, 35.0, 46.0, 60.0, 70.0, 90.0, 88.0, 93.0, 77.0, 81.0, 79.0, 73.0, 45.0, 32.0, 29.0, 20.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-301.7612609863281, -294.685302734375, -287.609375, -280.5334167480469, -273.45745849609375, -266.38153076171875, -259.3055725097656, -252.22962951660156, -245.1536865234375, -238.07774353027344, -231.0017852783203, -223.92584228515625, -216.8498992919922, -209.77395629882812, -202.697998046875, -195.62205505371094, -188.54611206054688, -181.4701690673828, -174.3942108154297, -167.31826782226562, -160.24232482910156, -153.1663818359375, -146.09042358398438, -139.0144805908203, -131.9385223388672, -124.8625717163086, -117.78662872314453, -110.71067810058594, -103.63473510742188, -96.55878448486328, -89.48283386230469, -82.40689086914062, -75.33094787597656, -68.25499725341797, -61.179054260253906, -54.10310363769531, -47.02716064453125, -39.951210021972656, -32.87526321411133, -25.79931640625, -18.723369598388672, -11.647422790527344, -4.571475028991699, 2.5044727325439453, 9.580419540405273, 16.656368255615234, 23.732315063476562, 30.80826187133789, 37.88420867919922, 44.96015548706055, 52.036102294921875, 59.11205291748047, 66.18799591064453, 73.26394653320312, 80.33988952636719, 87.41584014892578, 94.49179077148438, 101.56774139404297, 108.64368438720703, 115.71963500976562, 122.79557800292969, 129.87152099609375, 136.94747924804688, 144.02342224121094, 151.099365234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 12.0, 11.0, 11.0, 31.0, 53.0, 73.0, 99.0, 191.0, 322.0, 698.0, 1700.0, 4233.0, 13103.0, 50450.0, 233099.0, 549162.0, 146898.0, 33460.0, 9290.0, 3020.0, 1274.0, 618.0, 287.0, 172.0, 87.0, 69.0, 50.0, 23.0, 20.0, 12.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.03125, -31.125244140625, -30.21923828125, -29.313232421875, -28.4072265625, -27.501220703125, -26.59521484375, -25.689208984375, -24.783203125, -23.877197265625, -22.97119140625, -22.065185546875, -21.1591796875, -20.253173828125, -19.34716796875, -18.441162109375, -17.53515625, -16.629150390625, -15.72314453125, -14.817138671875, -13.9111328125, -13.005126953125, -12.09912109375, -11.193115234375, -10.287109375, -9.381103515625, -8.47509765625, -7.569091796875, -6.6630859375, -5.757080078125, -4.85107421875, -3.945068359375, -3.0390625, -2.133056640625, -1.22705078125, -0.321044921875, 0.5849609375, 1.490966796875, 2.39697265625, 3.302978515625, 4.208984375, 5.114990234375, 6.02099609375, 6.927001953125, 7.8330078125, 8.739013671875, 9.64501953125, 10.551025390625, 11.45703125, 12.363037109375, 13.26904296875, 14.175048828125, 15.0810546875, 15.987060546875, 16.89306640625, 17.799072265625, 18.705078125, 19.611083984375, 20.51708984375, 21.423095703125, 22.3291015625, 23.235107421875, 24.14111328125, 25.047119140625, 25.953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 16.0, 14.0, 26.0, 36.0, 39.0, 34.0, 62.0, 67.0, 58.0, 72.0, 96.0, 71.0, 61.0, 63.0, 63.0, 43.0, 35.0, 31.0, 26.0, 20.0, 20.0, 15.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.546875, -12.1385498046875, -11.730224609375, -11.3218994140625, -10.91357421875, -10.5052490234375, -10.096923828125, -9.6885986328125, -9.2802734375, -8.8719482421875, -8.463623046875, -8.0552978515625, -7.64697265625, -7.2386474609375, -6.830322265625, -6.4219970703125, -6.013671875, -5.6053466796875, -5.197021484375, -4.7886962890625, -4.38037109375, -3.9720458984375, -3.563720703125, -3.1553955078125, -2.7470703125, -2.3387451171875, -1.930419921875, -1.5220947265625, -1.11376953125, -0.7054443359375, -0.297119140625, 0.1112060546875, 0.51953125, 0.9278564453125, 1.336181640625, 1.7445068359375, 2.15283203125, 2.5611572265625, 2.969482421875, 3.3778076171875, 3.7861328125, 4.1944580078125, 4.602783203125, 5.0111083984375, 5.41943359375, 5.8277587890625, 6.236083984375, 6.6444091796875, 7.052734375, 7.4610595703125, 7.869384765625, 8.2777099609375, 8.68603515625, 9.0943603515625, 9.502685546875, 9.9110107421875, 10.3193359375, 10.7276611328125, 11.135986328125, 11.5443115234375, 11.95263671875, 12.3609619140625, 12.769287109375, 13.1776123046875, 13.5859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 12.0, 18.0, 31.0, 45.0, 119.0, 195.0, 515.0, 1397.0, 5763.0, 78193.0, 903071.0, 52336.0, 4774.0, 1173.0, 467.0, 207.0, 91.0, 47.0, 39.0, 16.0, 13.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.625, -84.583984375, -82.54296875, -80.501953125, -78.4609375, -76.419921875, -74.37890625, -72.337890625, -70.296875, -68.255859375, -66.21484375, -64.173828125, -62.1328125, -60.091796875, -58.05078125, -56.009765625, -53.96875, -51.927734375, -49.88671875, -47.845703125, -45.8046875, -43.763671875, -41.72265625, -39.681640625, -37.640625, -35.599609375, -33.55859375, -31.517578125, -29.4765625, -27.435546875, -25.39453125, -23.353515625, -21.3125, -19.271484375, -17.23046875, -15.189453125, -13.1484375, -11.107421875, -9.06640625, -7.025390625, -4.984375, -2.943359375, -0.90234375, 1.138671875, 3.1796875, 5.220703125, 7.26171875, 9.302734375, 11.34375, 13.384765625, 15.42578125, 17.466796875, 19.5078125, 21.548828125, 23.58984375, 25.630859375, 27.671875, 29.712890625, 31.75390625, 33.794921875, 35.8359375, 37.876953125, 39.91796875, 41.958984375, 44.0]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 10.0, 16.0, 11.0, 17.0, 23.0, 21.0, 46.0, 48.0, 57.0, 69.0, 71.0, 81.0, 91.0, 74.0, 63.0, 60.0, 51.0, 43.0, 30.0, 38.0, 28.0, 22.0, 10.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-94.5, -92.36767578125, -90.2353515625, -88.10302734375, -85.970703125, -83.83837890625, -81.7060546875, -79.57373046875, -77.44140625, -75.30908203125, -73.1767578125, -71.04443359375, -68.912109375, -66.77978515625, -64.6474609375, -62.51513671875, -60.3828125, -58.25048828125, -56.1181640625, -53.98583984375, -51.853515625, -49.72119140625, -47.5888671875, -45.45654296875, -43.32421875, -41.19189453125, -39.0595703125, -36.92724609375, -34.794921875, -32.66259765625, -30.5302734375, -28.39794921875, -26.265625, -24.13330078125, -22.0009765625, -19.86865234375, -17.736328125, -15.60400390625, -13.4716796875, -11.33935546875, -9.20703125, -7.07470703125, -4.9423828125, -2.81005859375, -0.677734375, 1.45458984375, 3.5869140625, 5.71923828125, 7.8515625, 9.98388671875, 12.1162109375, 14.24853515625, 16.380859375, 18.51318359375, 20.6455078125, 22.77783203125, 24.91015625, 27.04248046875, 29.1748046875, 31.30712890625, 33.439453125, 35.57177734375, 37.7041015625, 39.83642578125, 41.96875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 9.0, 16.0, 13.0, 35.0, 50.0, 139.0, 269.0, 785.0, 3850.0, 1000927.0, 39567.0, 1966.0, 535.0, 173.0, 88.0, 46.0, 25.0, 20.0, 12.0, 7.0, 11.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-125.125, -121.5302734375, -117.935546875, -114.3408203125, -110.74609375, -107.1513671875, -103.556640625, -99.9619140625, -96.3671875, -92.7724609375, -89.177734375, -85.5830078125, -81.98828125, -78.3935546875, -74.798828125, -71.2041015625, -67.609375, -64.0146484375, -60.419921875, -56.8251953125, -53.23046875, -49.6357421875, -46.041015625, -42.4462890625, -38.8515625, -35.2568359375, -31.662109375, -28.0673828125, -24.47265625, -20.8779296875, -17.283203125, -13.6884765625, -10.09375, -6.4990234375, -2.904296875, 0.6904296875, 4.28515625, 7.8798828125, 11.474609375, 15.0693359375, 18.6640625, 22.2587890625, 25.853515625, 29.4482421875, 33.04296875, 36.6376953125, 40.232421875, 43.8271484375, 47.421875, 51.0166015625, 54.611328125, 58.2060546875, 61.80078125, 65.3955078125, 68.990234375, 72.5849609375, 76.1796875, 79.7744140625, 83.369140625, 86.9638671875, 90.55859375, 94.1533203125, 97.748046875, 101.3427734375, 104.9375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 13.0, 30.0, 60.0, 214.0, 346.0, 206.0, 90.0, 17.0, 15.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0098114013671875, -0.009535074234008789, -0.009258747100830078, -0.008982419967651367, -0.008706092834472656, -0.008429765701293945, -0.008153438568115234, -0.007877111434936523, -0.0076007843017578125, -0.0073244571685791016, -0.007048130035400391, -0.00677180290222168, -0.006495475769042969, -0.006219148635864258, -0.005942821502685547, -0.005666494369506836, -0.005390167236328125, -0.005113840103149414, -0.004837512969970703, -0.004561185836791992, -0.004284858703613281, -0.00400853157043457, -0.0037322044372558594, -0.0034558773040771484, -0.0031795501708984375, -0.0029032230377197266, -0.0026268959045410156, -0.0023505687713623047, -0.0020742416381835938, -0.0017979145050048828, -0.0015215873718261719, -0.001245260238647461, -0.00096893310546875, -0.0006926059722900391, -0.0004162788391113281, -0.0001399517059326172, 0.00013637542724609375, 0.0004127025604248047, 0.0006890296936035156, 0.0009653568267822266, 0.0012416839599609375, 0.0015180110931396484, 0.0017943382263183594, 0.0020706653594970703, 0.0023469924926757812, 0.002623319625854492, 0.002899646759033203, 0.003175973892211914, 0.003452301025390625, 0.003728628158569336, 0.004004955291748047, 0.004281282424926758, 0.004557609558105469, 0.00483393669128418, 0.005110263824462891, 0.0053865909576416016, 0.0056629180908203125, 0.0059392452239990234, 0.006215572357177734, 0.006491899490356445, 0.006768226623535156, 0.007044553756713867, 0.007320880889892578, 0.007597208023071289, 0.00787353515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 17.0, 25.0, 25.0, 37.0, 48.0, 77.0, 139.0, 182.0, 321.0, 550.0, 1063.0, 2353.0, 6225.0, 27936.0, 704024.0, 278660.0, 18179.0, 4720.0, 1806.0, 826.0, 482.0, 281.0, 162.0, 104.0, 78.0, 44.0, 41.0, 39.0, 13.0, 18.0, 15.0, 7.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-27.390625, -26.531494140625, -25.67236328125, -24.813232421875, -23.9541015625, -23.094970703125, -22.23583984375, -21.376708984375, -20.517578125, -19.658447265625, -18.79931640625, -17.940185546875, -17.0810546875, -16.221923828125, -15.36279296875, -14.503662109375, -13.64453125, -12.785400390625, -11.92626953125, -11.067138671875, -10.2080078125, -9.348876953125, -8.48974609375, -7.630615234375, -6.771484375, -5.912353515625, -5.05322265625, -4.194091796875, -3.3349609375, -2.475830078125, -1.61669921875, -0.757568359375, 0.1015625, 0.960693359375, 1.81982421875, 2.678955078125, 3.5380859375, 4.397216796875, 5.25634765625, 6.115478515625, 6.974609375, 7.833740234375, 8.69287109375, 9.552001953125, 10.4111328125, 11.270263671875, 12.12939453125, 12.988525390625, 13.84765625, 14.706787109375, 15.56591796875, 16.425048828125, 17.2841796875, 18.143310546875, 19.00244140625, 19.861572265625, 20.720703125, 21.579833984375, 22.43896484375, 23.298095703125, 24.1572265625, 25.016357421875, 25.87548828125, 26.734619140625, 27.59375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 1.0, 4.0, 15.0, 24.0, 63.0, 126.0, 301.0, 244.0, 117.0, 44.0, 13.0, 6.0, 6.0, 3.0, 5.0, 3.0, 7.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.75, -63.68359375, -61.6171875, -59.55078125, -57.484375, -55.41796875, -53.3515625, -51.28515625, -49.21875, -47.15234375, -45.0859375, -43.01953125, -40.953125, -38.88671875, -36.8203125, -34.75390625, -32.6875, -30.62109375, -28.5546875, -26.48828125, -24.421875, -22.35546875, -20.2890625, -18.22265625, -16.15625, -14.08984375, -12.0234375, -9.95703125, -7.890625, -5.82421875, -3.7578125, -1.69140625, 0.375, 2.44140625, 4.5078125, 6.57421875, 8.640625, 10.70703125, 12.7734375, 14.83984375, 16.90625, 18.97265625, 21.0390625, 23.10546875, 25.171875, 27.23828125, 29.3046875, 31.37109375, 33.4375, 35.50390625, 37.5703125, 39.63671875, 41.703125, 43.76953125, 45.8359375, 47.90234375, 49.96875, 52.03515625, 54.1015625, 56.16796875, 58.234375, 60.30078125, 62.3671875, 64.43359375, 66.5]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 20.0, 53.0, 150.0, 302.0, 312.0, 96.0, 27.0, 18.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-429.8560791015625, -404.48046875, -379.1048278808594, -353.7292175292969, -328.3536071777344, -302.97796630859375, -277.60235595703125, -252.22674560546875, -226.8511199951172, -201.47549438476562, -176.09988403320312, -150.72425842285156, -125.34864044189453, -99.9730224609375, -74.59739685058594, -49.22178649902344, -23.846160888671875, 1.529458999633789, 26.905078887939453, 52.28070068359375, 77.65631866455078, 103.03193664550781, 128.40756225585938, 153.78317260742188, 179.15879821777344, 204.534423828125, 229.9100341796875, 255.28565979003906, 280.6612854003906, 306.0368957519531, 331.41253662109375, 356.78814697265625, 382.16375732421875, 407.53936767578125, 432.9150085449219, 458.2906188964844, 483.6662292480469, 509.0418701171875, 534.41748046875, 559.7930908203125, 585.168701171875, 610.5443115234375, 635.919921875, 661.2955322265625, 686.6712036132812, 712.0468139648438, 737.4224243164062, 762.7980346679688, 788.1737060546875, 813.54931640625, 838.9249267578125, 864.300537109375, 889.6762084960938, 915.0518188476562, 940.4274291992188, 965.8030395507812, 991.1786499023438, 1016.5542602539062, 1041.929931640625, 1067.3055419921875, 1092.68115234375, 1118.0567626953125, 1143.432373046875, 1168.8079833984375, 1194.18359375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 9.0, 6.0, 11.0, 17.0, 22.0, 29.0, 41.0, 41.0, 51.0, 77.0, 94.0, 102.0, 97.0, 85.0, 65.0, 58.0, 42.0, 40.0, 32.0, 27.0, 23.0, 10.0, 11.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-552.1994018554688, -538.7743530273438, -525.349365234375, -511.92431640625, -498.4992980957031, -485.07427978515625, -471.64923095703125, -458.2242126464844, -444.7991943359375, -431.3741760253906, -417.9491271972656, -404.52410888671875, -391.0990905761719, -377.674072265625, -364.2490234375, -350.8240051269531, -337.3989562988281, -323.97393798828125, -310.54888916015625, -297.1238708496094, -283.6988525390625, -270.2738037109375, -256.8487854003906, -243.42376708984375, -229.9987335205078, -216.57369995117188, -203.148681640625, -189.72364807128906, -176.29861450195312, -162.87359619140625, -149.4485626220703, -136.02352905273438, -122.59848022460938, -109.17345428466797, -95.74842834472656, -82.32339477539062, -68.89836883544922, -55.47334289550781, -42.048309326171875, -28.62328338623047, -15.198257446289062, -1.7732295989990234, 11.651798248291016, 25.076828002929688, 38.501853942871094, 51.9268798828125, 65.35191345214844, 78.77693939208984, 92.20196533203125, 105.62699127197266, 119.05201721191406, 132.47705078125, 145.90206909179688, 159.3271026611328, 172.75213623046875, 186.17715454101562, 199.60218811035156, 213.0272216796875, 226.45223999023438, 239.8772735595703, 253.30230712890625, 266.7273254394531, 280.15234375, 293.577392578125, 307.0024108886719]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 0.0, 6.0, 8.0, 8.0, 6.0, 11.0, 22.0, 17.0, 22.0, 53.0, 53.0, 94.0, 155.0, 327.0, 779.0, 2909.0, 44656.0, 4120401.0, 21032.0, 2687.0, 604.0, 200.0, 107.0, 50.0, 28.0, 18.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.0625, -117.013671875, -113.96484375, -110.916015625, -107.8671875, -104.818359375, -101.76953125, -98.720703125, -95.671875, -92.623046875, -89.57421875, -86.525390625, -83.4765625, -80.427734375, -77.37890625, -74.330078125, -71.28125, -68.232421875, -65.18359375, -62.134765625, -59.0859375, -56.037109375, -52.98828125, -49.939453125, -46.890625, -43.841796875, -40.79296875, -37.744140625, -34.6953125, -31.646484375, -28.59765625, -25.548828125, -22.5, -19.451171875, -16.40234375, -13.353515625, -10.3046875, -7.255859375, -4.20703125, -1.158203125, 1.890625, 4.939453125, 7.98828125, 11.037109375, 14.0859375, 17.134765625, 20.18359375, 23.232421875, 26.28125, 29.330078125, 32.37890625, 35.427734375, 38.4765625, 41.525390625, 44.57421875, 47.623046875, 50.671875, 53.720703125, 56.76953125, 59.818359375, 62.8671875, 65.916015625, 68.96484375, 72.013671875, 75.0625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 8.0, 10.0, 20.0, 53.0, 134.0, 220.0, 258.0, 158.0, 88.0, 37.0, 16.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-75.875, -74.297607421875, -72.72021484375, -71.142822265625, -69.5654296875, -67.988037109375, -66.41064453125, -64.833251953125, -63.255859375, -61.678466796875, -60.10107421875, -58.523681640625, -56.9462890625, -55.368896484375, -53.79150390625, -52.214111328125, -50.63671875, -49.059326171875, -47.48193359375, -45.904541015625, -44.3271484375, -42.749755859375, -41.17236328125, -39.594970703125, -38.017578125, -36.440185546875, -34.86279296875, -33.285400390625, -31.7080078125, -30.130615234375, -28.55322265625, -26.975830078125, -25.3984375, -23.821044921875, -22.24365234375, -20.666259765625, -19.0888671875, -17.511474609375, -15.93408203125, -14.356689453125, -12.779296875, -11.201904296875, -9.62451171875, -8.047119140625, -6.4697265625, -4.892333984375, -3.31494140625, -1.737548828125, -0.16015625, 1.417236328125, 2.99462890625, 4.572021484375, 6.1494140625, 7.726806640625, 9.30419921875, 10.881591796875, 12.458984375, 14.036376953125, 15.61376953125, 17.191162109375, 18.7685546875, 20.345947265625, 21.92333984375, 23.500732421875, 25.078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 9.0, 11.0, 20.0, 19.0, 19.0, 23.0, 42.0, 68.0, 51.0, 89.0, 116.0, 173.0, 223.0, 381.0, 650.0, 1213.0, 2792.0, 8757.0, 49893.0, 3806017.0, 296503.0, 18957.0, 4524.0, 1717.0, 738.0, 404.0, 222.0, 152.0, 116.0, 89.0, 67.0, 47.0, 34.0, 33.0, 23.0, 17.0, 13.0, 8.0, 12.0, 9.0, 10.0, 5.0, 3.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.96875, -56.98779296875, -55.0068359375, -53.02587890625, -51.044921875, -49.06396484375, -47.0830078125, -45.10205078125, -43.12109375, -41.14013671875, -39.1591796875, -37.17822265625, -35.197265625, -33.21630859375, -31.2353515625, -29.25439453125, -27.2734375, -25.29248046875, -23.3115234375, -21.33056640625, -19.349609375, -17.36865234375, -15.3876953125, -13.40673828125, -11.42578125, -9.44482421875, -7.4638671875, -5.48291015625, -3.501953125, -1.52099609375, 0.4599609375, 2.44091796875, 4.421875, 6.40283203125, 8.3837890625, 10.36474609375, 12.345703125, 14.32666015625, 16.3076171875, 18.28857421875, 20.26953125, 22.25048828125, 24.2314453125, 26.21240234375, 28.193359375, 30.17431640625, 32.1552734375, 34.13623046875, 36.1171875, 38.09814453125, 40.0791015625, 42.06005859375, 44.041015625, 46.02197265625, 48.0029296875, 49.98388671875, 51.96484375, 53.94580078125, 55.9267578125, 57.90771484375, 59.888671875, 61.86962890625, 63.8505859375, 65.83154296875, 67.8125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 22.0, 23.0, 73.0, 247.0, 2557.0, 960.0, 102.0, 39.0, 21.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.875, -118.2666015625, -114.658203125, -111.0498046875, -107.44140625, -103.8330078125, -100.224609375, -96.6162109375, -93.0078125, -89.3994140625, -85.791015625, -82.1826171875, -78.57421875, -74.9658203125, -71.357421875, -67.7490234375, -64.140625, -60.5322265625, -56.923828125, -53.3154296875, -49.70703125, -46.0986328125, -42.490234375, -38.8818359375, -35.2734375, -31.6650390625, -28.056640625, -24.4482421875, -20.83984375, -17.2314453125, -13.623046875, -10.0146484375, -6.40625, -2.7978515625, 0.810546875, 4.4189453125, 8.02734375, 11.6357421875, 15.244140625, 18.8525390625, 22.4609375, 26.0693359375, 29.677734375, 33.2861328125, 36.89453125, 40.5029296875, 44.111328125, 47.7197265625, 51.328125, 54.9365234375, 58.544921875, 62.1533203125, 65.76171875, 69.3701171875, 72.978515625, 76.5869140625, 80.1953125, 83.8037109375, 87.412109375, 91.0205078125, 94.62890625, 98.2373046875, 101.845703125, 105.4541015625, 109.0625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 12.0, 20.0, 24.0, 45.0, 79.0, 203.0, 313.0, 190.0, 72.0, 19.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-742.1420288085938, -724.8027954101562, -707.4635620117188, -690.1243286132812, -672.7850952148438, -655.4458618164062, -638.1066284179688, -620.7674560546875, -603.42822265625, -586.0889892578125, -568.749755859375, -551.4105224609375, -534.0712890625, -516.7320556640625, -499.3928527832031, -482.0536193847656, -464.71435546875, -447.3751220703125, -430.035888671875, -412.6966552734375, -395.357421875, -378.0181884765625, -360.6789855957031, -343.3397521972656, -326.0005187988281, -308.6612854003906, -291.3220520019531, -273.9828186035156, -256.64361572265625, -239.3043670654297, -221.96514892578125, -204.62591552734375, -187.28662109375, -169.9473876953125, -152.608154296875, -135.26893615722656, -117.92970275878906, -100.59046936035156, -83.2512435913086, -65.91201782226562, -48.572784423828125, -31.23355484008789, -13.894325256347656, 3.444904327392578, 20.784133911132812, 38.12336730957031, 55.46259307861328, 72.80181884765625, 90.14105224609375, 107.48028564453125, 124.81951141357422, 142.1587371826172, 159.4979705810547, 176.8372039794922, 194.17642211914062, 211.51565551757812, 228.85488891601562, 246.19412231445312, 263.5333557128906, 280.8725891113281, 298.2117919921875, 315.551025390625, 332.8902587890625, 350.2294921875, 367.5687255859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 4.0, 11.0, 7.0, 16.0, 25.0, 12.0, 23.0, 34.0, 33.0, 40.0, 49.0, 59.0, 64.0, 61.0, 75.0, 84.0, 63.0, 66.0, 61.0, 45.0, 37.0, 29.0, 27.0, 20.0, 16.0, 12.0, 13.0, 8.0, 4.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.80238342285156, -167.9599609375, -158.11753845214844, -148.27511596679688, -138.4326934814453, -128.59027099609375, -118.74784851074219, -108.90542602539062, -99.06300354003906, -89.2205810546875, -79.37815856933594, -69.53573608398438, -59.69331359863281, -49.85089111328125, -40.00846862792969, -30.166046142578125, -20.323623657226562, -10.481201171875, -0.6387786865234375, 9.203643798828125, 19.046066284179688, 28.88848876953125, 38.73091125488281, 48.573333740234375, 58.41575622558594, 68.2581787109375, 78.10060119628906, 87.94302368164062, 97.78544616699219, 107.62786865234375, 117.47029113769531, 127.31271362304688, 137.1551513671875, 146.99757385253906, 156.83999633789062, 166.6824188232422, 176.52484130859375, 186.3672637939453, 196.20968627929688, 206.05210876464844, 215.89453125, 225.73695373535156, 235.57937622070312, 245.4217987060547, 255.26422119140625, 265.10662841796875, 274.9490661621094, 284.79150390625, 294.6339111328125, 304.476318359375, 314.3187561035156, 324.16119384765625, 334.00360107421875, 343.84600830078125, 353.6884460449219, 363.5308837890625, 373.373291015625, 383.2156982421875, 393.0581359863281, 402.90057373046875, 412.74298095703125, 422.58538818359375, 432.4278259277344, 442.270263671875, 452.1126708984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 0.0, 6.0, 10.0, 8.0, 18.0, 19.0, 25.0, 41.0, 44.0, 67.0, 105.0, 174.0, 289.0, 357.0, 635.0, 972.0, 1568.0, 2656.0, 4922.0, 9049.0, 18785.0, 43719.0, 115733.0, 339874.0, 320889.0, 108959.0, 41386.0, 18071.0, 8724.0, 4694.0, 2621.0, 1523.0, 925.0, 591.0, 386.0, 237.0, 166.0, 100.0, 74.0, 40.0, 34.0, 11.0, 12.0, 12.0, 5.0, 9.0, 8.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.828125, -24.051513671875, -23.27490234375, -22.498291015625, -21.7216796875, -20.945068359375, -20.16845703125, -19.391845703125, -18.615234375, -17.838623046875, -17.06201171875, -16.285400390625, -15.5087890625, -14.732177734375, -13.95556640625, -13.178955078125, -12.40234375, -11.625732421875, -10.84912109375, -10.072509765625, -9.2958984375, -8.519287109375, -7.74267578125, -6.966064453125, -6.189453125, -5.412841796875, -4.63623046875, -3.859619140625, -3.0830078125, -2.306396484375, -1.52978515625, -0.753173828125, 0.0234375, 0.800048828125, 1.57666015625, 2.353271484375, 3.1298828125, 3.906494140625, 4.68310546875, 5.459716796875, 6.236328125, 7.012939453125, 7.78955078125, 8.566162109375, 9.3427734375, 10.119384765625, 10.89599609375, 11.672607421875, 12.44921875, 13.225830078125, 14.00244140625, 14.779052734375, 15.5556640625, 16.332275390625, 17.10888671875, 17.885498046875, 18.662109375, 19.438720703125, 20.21533203125, 20.991943359375, 21.7685546875, 22.545166015625, 23.32177734375, 24.098388671875, 24.875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 7.0, 7.0, 7.0, 13.0, 27.0, 24.0, 35.0, 39.0, 39.0, 44.0, 68.0, 75.0, 87.0, 80.0, 76.0, 67.0, 54.0, 52.0, 43.0, 34.0, 35.0, 13.0, 22.0, 15.0, 12.0, 7.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.126220703125, -17.48681640625, -16.847412109375, -16.2080078125, -15.568603515625, -14.92919921875, -14.289794921875, -13.650390625, -13.010986328125, -12.37158203125, -11.732177734375, -11.0927734375, -10.453369140625, -9.81396484375, -9.174560546875, -8.53515625, -7.895751953125, -7.25634765625, -6.616943359375, -5.9775390625, -5.338134765625, -4.69873046875, -4.059326171875, -3.419921875, -2.780517578125, -2.14111328125, -1.501708984375, -0.8623046875, -0.222900390625, 0.41650390625, 1.055908203125, 1.6953125, 2.334716796875, 2.97412109375, 3.613525390625, 4.2529296875, 4.892333984375, 5.53173828125, 6.171142578125, 6.810546875, 7.449951171875, 8.08935546875, 8.728759765625, 9.3681640625, 10.007568359375, 10.64697265625, 11.286376953125, 11.92578125, 12.565185546875, 13.20458984375, 13.843994140625, 14.4833984375, 15.122802734375, 15.76220703125, 16.401611328125, 17.041015625, 17.680419921875, 18.31982421875, 18.959228515625, 19.5986328125, 20.238037109375, 20.87744140625, 21.516845703125, 22.15625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 10.0, 20.0, 20.0, 31.0, 38.0, 76.0, 112.0, 226.0, 457.0, 1014.0, 2616.0, 9089.0, 49956.0, 678207.0, 270132.0, 27127.0, 5826.0, 1942.0, 783.0, 368.0, 208.0, 113.0, 66.0, 47.0, 26.0, 14.0, 5.0, 6.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-86.1875, -83.84814453125, -81.5087890625, -79.16943359375, -76.830078125, -74.49072265625, -72.1513671875, -69.81201171875, -67.47265625, -65.13330078125, -62.7939453125, -60.45458984375, -58.115234375, -55.77587890625, -53.4365234375, -51.09716796875, -48.7578125, -46.41845703125, -44.0791015625, -41.73974609375, -39.400390625, -37.06103515625, -34.7216796875, -32.38232421875, -30.04296875, -27.70361328125, -25.3642578125, -23.02490234375, -20.685546875, -18.34619140625, -16.0068359375, -13.66748046875, -11.328125, -8.98876953125, -6.6494140625, -4.31005859375, -1.970703125, 0.36865234375, 2.7080078125, 5.04736328125, 7.38671875, 9.72607421875, 12.0654296875, 14.40478515625, 16.744140625, 19.08349609375, 21.4228515625, 23.76220703125, 26.1015625, 28.44091796875, 30.7802734375, 33.11962890625, 35.458984375, 37.79833984375, 40.1376953125, 42.47705078125, 44.81640625, 47.15576171875, 49.4951171875, 51.83447265625, 54.173828125, 56.51318359375, 58.8525390625, 61.19189453125, 63.53125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 3.0, 3.0, 6.0, 10.0, 15.0, 16.0, 29.0, 24.0, 33.0, 30.0, 33.0, 42.0, 57.0, 64.0, 69.0, 70.0, 67.0, 62.0, 70.0, 40.0, 39.0, 47.0, 40.0, 36.0, 17.0, 20.0, 7.0, 9.0, 13.0, 8.0, 5.0, 2.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-88.625, -85.8310546875, -83.037109375, -80.2431640625, -77.44921875, -74.6552734375, -71.861328125, -69.0673828125, -66.2734375, -63.4794921875, -60.685546875, -57.8916015625, -55.09765625, -52.3037109375, -49.509765625, -46.7158203125, -43.921875, -41.1279296875, -38.333984375, -35.5400390625, -32.74609375, -29.9521484375, -27.158203125, -24.3642578125, -21.5703125, -18.7763671875, -15.982421875, -13.1884765625, -10.39453125, -7.6005859375, -4.806640625, -2.0126953125, 0.78125, 3.5751953125, 6.369140625, 9.1630859375, 11.95703125, 14.7509765625, 17.544921875, 20.3388671875, 23.1328125, 25.9267578125, 28.720703125, 31.5146484375, 34.30859375, 37.1025390625, 39.896484375, 42.6904296875, 45.484375, 48.2783203125, 51.072265625, 53.8662109375, 56.66015625, 59.4541015625, 62.248046875, 65.0419921875, 67.8359375, 70.6298828125, 73.423828125, 76.2177734375, 79.01171875, 81.8056640625, 84.599609375, 87.3935546875, 90.1875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 13.0, 13.0, 21.0, 24.0, 57.0, 79.0, 122.0, 271.0, 506.0, 1470.0, 5854.0, 51788.0, 928237.0, 51814.0, 5656.0, 1540.0, 518.0, 246.0, 137.0, 59.0, 37.0, 28.0, 22.0, 16.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.8125, -42.21923828125, -40.6259765625, -39.03271484375, -37.439453125, -35.84619140625, -34.2529296875, -32.65966796875, -31.06640625, -29.47314453125, -27.8798828125, -26.28662109375, -24.693359375, -23.10009765625, -21.5068359375, -19.91357421875, -18.3203125, -16.72705078125, -15.1337890625, -13.54052734375, -11.947265625, -10.35400390625, -8.7607421875, -7.16748046875, -5.57421875, -3.98095703125, -2.3876953125, -0.79443359375, 0.798828125, 2.39208984375, 3.9853515625, 5.57861328125, 7.171875, 8.76513671875, 10.3583984375, 11.95166015625, 13.544921875, 15.13818359375, 16.7314453125, 18.32470703125, 19.91796875, 21.51123046875, 23.1044921875, 24.69775390625, 26.291015625, 27.88427734375, 29.4775390625, 31.07080078125, 32.6640625, 34.25732421875, 35.8505859375, 37.44384765625, 39.037109375, 40.63037109375, 42.2236328125, 43.81689453125, 45.41015625, 47.00341796875, 48.5966796875, 50.18994140625, 51.783203125, 53.37646484375, 54.9697265625, 56.56298828125, 58.15625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 8.0, 5.0, 15.0, 43.0, 68.0, 224.0, 371.0, 153.0, 46.0, 24.0, 16.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0147247314453125, -0.014283418655395508, -0.013842105865478516, -0.013400793075561523, -0.012959480285644531, -0.012518167495727539, -0.012076854705810547, -0.011635541915893555, -0.011194229125976562, -0.01075291633605957, -0.010311603546142578, -0.009870290756225586, -0.009428977966308594, -0.008987665176391602, -0.00854635238647461, -0.008105039596557617, -0.007663726806640625, -0.007222414016723633, -0.006781101226806641, -0.0063397884368896484, -0.005898475646972656, -0.005457162857055664, -0.005015850067138672, -0.00457453727722168, -0.0041332244873046875, -0.0036919116973876953, -0.003250598907470703, -0.002809286117553711, -0.0023679733276367188, -0.0019266605377197266, -0.0014853477478027344, -0.0010440349578857422, -0.00060272216796875, -0.0001614093780517578, 0.0002799034118652344, 0.0007212162017822266, 0.0011625289916992188, 0.001603841781616211, 0.002045154571533203, 0.0024864673614501953, 0.0029277801513671875, 0.0033690929412841797, 0.003810405731201172, 0.004251718521118164, 0.004693031311035156, 0.0051343441009521484, 0.005575656890869141, 0.006016969680786133, 0.006458282470703125, 0.006899595260620117, 0.007340908050537109, 0.0077822208404541016, 0.008223533630371094, 0.008664846420288086, 0.009106159210205078, 0.00954747200012207, 0.009988784790039062, 0.010430097579956055, 0.010871410369873047, 0.011312723159790039, 0.011754035949707031, 0.012195348739624023, 0.012636661529541016, 0.013077974319458008, 0.013519287109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 6.0, 11.0, 13.0, 18.0, 23.0, 48.0, 61.0, 128.0, 292.0, 636.0, 1708.0, 4995.0, 22256.0, 291933.0, 680699.0, 35202.0, 6850.0, 2139.0, 812.0, 305.0, 175.0, 95.0, 44.0, 21.0, 28.0, 13.0, 11.0, 10.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.28125, -34.304443359375, -33.32763671875, -32.350830078125, -31.3740234375, -30.397216796875, -29.42041015625, -28.443603515625, -27.466796875, -26.489990234375, -25.51318359375, -24.536376953125, -23.5595703125, -22.582763671875, -21.60595703125, -20.629150390625, -19.65234375, -18.675537109375, -17.69873046875, -16.721923828125, -15.7451171875, -14.768310546875, -13.79150390625, -12.814697265625, -11.837890625, -10.861083984375, -9.88427734375, -8.907470703125, -7.9306640625, -6.953857421875, -5.97705078125, -5.000244140625, -4.0234375, -3.046630859375, -2.06982421875, -1.093017578125, -0.1162109375, 0.860595703125, 1.83740234375, 2.814208984375, 3.791015625, 4.767822265625, 5.74462890625, 6.721435546875, 7.6982421875, 8.675048828125, 9.65185546875, 10.628662109375, 11.60546875, 12.582275390625, 13.55908203125, 14.535888671875, 15.5126953125, 16.489501953125, 17.46630859375, 18.443115234375, 19.419921875, 20.396728515625, 21.37353515625, 22.350341796875, 23.3271484375, 24.303955078125, 25.28076171875, 26.257568359375, 27.234375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 10.0, 10.0, 12.0, 11.0, 12.0, 19.0, 24.0, 60.0, 45.0, 81.0, 69.0, 97.0, 105.0, 92.0, 88.0, 48.0, 62.0, 32.0, 24.0, 22.0, 14.0, 16.0, 14.0, 4.0, 4.0, 9.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.1875, -23.363037109375, -22.53857421875, -21.714111328125, -20.8896484375, -20.065185546875, -19.24072265625, -18.416259765625, -17.591796875, -16.767333984375, -15.94287109375, -15.118408203125, -14.2939453125, -13.469482421875, -12.64501953125, -11.820556640625, -10.99609375, -10.171630859375, -9.34716796875, -8.522705078125, -7.6982421875, -6.873779296875, -6.04931640625, -5.224853515625, -4.400390625, -3.575927734375, -2.75146484375, -1.927001953125, -1.1025390625, -0.278076171875, 0.54638671875, 1.370849609375, 2.1953125, 3.019775390625, 3.84423828125, 4.668701171875, 5.4931640625, 6.317626953125, 7.14208984375, 7.966552734375, 8.791015625, 9.615478515625, 10.43994140625, 11.264404296875, 12.0888671875, 12.913330078125, 13.73779296875, 14.562255859375, 15.38671875, 16.211181640625, 17.03564453125, 17.860107421875, 18.6845703125, 19.509033203125, 20.33349609375, 21.157958984375, 21.982421875, 22.806884765625, 23.63134765625, 24.455810546875, 25.2802734375, 26.104736328125, 26.92919921875, 27.753662109375, 28.578125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 9.0, 23.0, 40.0, 65.0, 140.0, 174.0, 237.0, 148.0, 64.0, 35.0, 21.0, 11.0, 4.0, 3.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-530.8134155273438, -514.8673095703125, -498.9211730957031, -482.97503662109375, -467.0289306640625, -451.08282470703125, -435.1366882324219, -419.1905517578125, -403.24444580078125, -387.29833984375, -371.3522033691406, -355.40606689453125, -339.4599609375, -323.51385498046875, -307.5677185058594, -291.62158203125, -275.67547607421875, -259.7293701171875, -243.78323364257812, -227.8371124267578, -211.8909912109375, -195.9448699951172, -179.99874877929688, -164.05262756347656, -148.10650634765625, -132.16038513183594, -116.21426391601562, -100.26814270019531, -84.322021484375, -68.37590026855469, -52.429779052734375, -36.48365783691406, -20.537567138671875, -4.5914459228515625, 11.35467529296875, 27.300796508789062, 43.246917724609375, 59.19303894042969, 75.13916015625, 91.08528137207031, 107.03140258789062, 122.97752380371094, 138.92364501953125, 154.86976623535156, 170.81588745117188, 186.7620086669922, 202.7081298828125, 218.6542510986328, 234.60037231445312, 250.54649353027344, 266.49261474609375, 282.438720703125, 298.3848571777344, 314.33099365234375, 330.277099609375, 346.22320556640625, 362.1693420410156, 378.115478515625, 394.06158447265625, 410.0076904296875, 425.9538269042969, 441.89996337890625, 457.8460693359375, 473.79217529296875, 489.7383117675781]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 10.0, 10.0, 15.0, 19.0, 21.0, 27.0, 32.0, 34.0, 36.0, 60.0, 55.0, 59.0, 66.0, 70.0, 60.0, 67.0, 51.0, 55.0, 51.0, 30.0, 30.0, 32.0, 27.0, 23.0, 13.0, 7.0, 9.0, 10.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-404.99822998046875, -393.9899597167969, -382.981689453125, -371.97344970703125, -360.9651794433594, -349.9569091796875, -338.94866943359375, -327.9403991699219, -316.93212890625, -305.9238586425781, -294.91558837890625, -283.9073486328125, -272.8990783691406, -261.89080810546875, -250.88255310058594, -239.87429809570312, -228.86602783203125, -217.85775756835938, -206.84950256347656, -195.84124755859375, -184.83297729492188, -173.82470703125, -162.8164520263672, -151.80819702148438, -140.7999267578125, -129.79165649414062, -118.78340148925781, -107.77513885498047, -96.76687622070312, -85.75861358642578, -74.75035095214844, -63.742088317871094, -52.733795166015625, -41.72553253173828, -30.717269897460938, -19.709007263183594, -8.70074462890625, 2.3075180053710938, 13.315780639648438, 24.32404327392578, 35.332305908203125, 46.34056854248047, 57.34883117675781, 68.35709381103516, 79.3653564453125, 90.37361907958984, 101.38188171386719, 112.39014434814453, 123.39840698242188, 134.40667724609375, 145.41493225097656, 156.42318725585938, 167.43145751953125, 178.43972778320312, 189.44798278808594, 200.45623779296875, 211.46450805664062, 222.4727783203125, 233.4810333251953, 244.48928833007812, 255.49755859375, 266.5058288574219, 277.51409912109375, 288.5223388671875, 299.5306091308594]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 3.0, 10.0, 10.0, 18.0, 25.0, 46.0, 67.0, 120.0, 227.0, 540.0, 1410.0, 4529.0, 19364.0, 229810.0, 3726078.0, 185563.0, 18524.0, 5014.0, 1662.0, 656.0, 293.0, 140.0, 75.0, 44.0, 16.0, 9.0, 13.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.75, -48.550537109375, -47.35107421875, -46.151611328125, -44.9521484375, -43.752685546875, -42.55322265625, -41.353759765625, -40.154296875, -38.954833984375, -37.75537109375, -36.555908203125, -35.3564453125, -34.156982421875, -32.95751953125, -31.758056640625, -30.55859375, -29.359130859375, -28.15966796875, -26.960205078125, -25.7607421875, -24.561279296875, -23.36181640625, -22.162353515625, -20.962890625, -19.763427734375, -18.56396484375, -17.364501953125, -16.1650390625, -14.965576171875, -13.76611328125, -12.566650390625, -11.3671875, -10.167724609375, -8.96826171875, -7.768798828125, -6.5693359375, -5.369873046875, -4.17041015625, -2.970947265625, -1.771484375, -0.572021484375, 0.62744140625, 1.826904296875, 3.0263671875, 4.225830078125, 5.42529296875, 6.624755859375, 7.82421875, 9.023681640625, 10.22314453125, 11.422607421875, 12.6220703125, 13.821533203125, 15.02099609375, 16.220458984375, 17.419921875, 18.619384765625, 19.81884765625, 21.018310546875, 22.2177734375, 23.417236328125, 24.61669921875, 25.816162109375, 27.015625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 8.0, 23.0, 31.0, 30.0, 66.0, 67.0, 93.0, 101.0, 114.0, 99.0, 93.0, 78.0, 53.0, 39.0, 37.0, 22.0, 16.0, 12.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-37.59375, -36.750732421875, -35.90771484375, -35.064697265625, -34.2216796875, -33.378662109375, -32.53564453125, -31.692626953125, -30.849609375, -30.006591796875, -29.16357421875, -28.320556640625, -27.4775390625, -26.634521484375, -25.79150390625, -24.948486328125, -24.10546875, -23.262451171875, -22.41943359375, -21.576416015625, -20.7333984375, -19.890380859375, -19.04736328125, -18.204345703125, -17.361328125, -16.518310546875, -15.67529296875, -14.832275390625, -13.9892578125, -13.146240234375, -12.30322265625, -11.460205078125, -10.6171875, -9.774169921875, -8.93115234375, -8.088134765625, -7.2451171875, -6.402099609375, -5.55908203125, -4.716064453125, -3.873046875, -3.030029296875, -2.18701171875, -1.343994140625, -0.5009765625, 0.342041015625, 1.18505859375, 2.028076171875, 2.87109375, 3.714111328125, 4.55712890625, 5.400146484375, 6.2431640625, 7.086181640625, 7.92919921875, 8.772216796875, 9.615234375, 10.458251953125, 11.30126953125, 12.144287109375, 12.9873046875, 13.830322265625, 14.67333984375, 15.516357421875, 16.359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 7.0, 11.0, 19.0, 36.0, 36.0, 47.0, 96.0, 155.0, 300.0, 561.0, 1099.0, 2587.0, 7215.0, 25789.0, 165073.0, 3639098.0, 300603.0, 36984.0, 8996.0, 3160.0, 1176.0, 561.0, 250.0, 156.0, 95.0, 56.0, 34.0, 32.0, 12.0, 9.0, 8.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.15625, -43.7275390625, -42.298828125, -40.8701171875, -39.44140625, -38.0126953125, -36.583984375, -35.1552734375, -33.7265625, -32.2978515625, -30.869140625, -29.4404296875, -28.01171875, -26.5830078125, -25.154296875, -23.7255859375, -22.296875, -20.8681640625, -19.439453125, -18.0107421875, -16.58203125, -15.1533203125, -13.724609375, -12.2958984375, -10.8671875, -9.4384765625, -8.009765625, -6.5810546875, -5.15234375, -3.7236328125, -2.294921875, -0.8662109375, 0.5625, 1.9912109375, 3.419921875, 4.8486328125, 6.27734375, 7.7060546875, 9.134765625, 10.5634765625, 11.9921875, 13.4208984375, 14.849609375, 16.2783203125, 17.70703125, 19.1357421875, 20.564453125, 21.9931640625, 23.421875, 24.8505859375, 26.279296875, 27.7080078125, 29.13671875, 30.5654296875, 31.994140625, 33.4228515625, 34.8515625, 36.2802734375, 37.708984375, 39.1376953125, 40.56640625, 41.9951171875, 43.423828125, 44.8525390625, 46.28125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 9.0, 2.0, 10.0, 5.0, 9.0, 9.0, 11.0, 12.0, 24.0, 38.0, 50.0, 75.0, 133.0, 323.0, 804.0, 1214.0, 662.0, 266.0, 131.0, 84.0, 61.0, 37.0, 37.0, 24.0, 11.0, 7.0, 5.0, 5.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-60.125, -58.521484375, -56.91796875, -55.314453125, -53.7109375, -52.107421875, -50.50390625, -48.900390625, -47.296875, -45.693359375, -44.08984375, -42.486328125, -40.8828125, -39.279296875, -37.67578125, -36.072265625, -34.46875, -32.865234375, -31.26171875, -29.658203125, -28.0546875, -26.451171875, -24.84765625, -23.244140625, -21.640625, -20.037109375, -18.43359375, -16.830078125, -15.2265625, -13.623046875, -12.01953125, -10.416015625, -8.8125, -7.208984375, -5.60546875, -4.001953125, -2.3984375, -0.794921875, 0.80859375, 2.412109375, 4.015625, 5.619140625, 7.22265625, 8.826171875, 10.4296875, 12.033203125, 13.63671875, 15.240234375, 16.84375, 18.447265625, 20.05078125, 21.654296875, 23.2578125, 24.861328125, 26.46484375, 28.068359375, 29.671875, 31.275390625, 32.87890625, 34.482421875, 36.0859375, 37.689453125, 39.29296875, 40.896484375, 42.5]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 11.0, 16.0, 139.0, 604.0, 193.0, 27.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1625.5699462890625, -1580.9776611328125, -1536.3853759765625, -1491.7930908203125, -1447.2008056640625, -1402.608642578125, -1358.016357421875, -1313.424072265625, -1268.831787109375, -1224.239501953125, -1179.647216796875, -1135.054931640625, -1090.462646484375, -1045.870361328125, -1001.2781372070312, -956.6859130859375, -912.0935668945312, -867.5012817382812, -822.9089965820312, -778.3167724609375, -733.7244873046875, -689.1322021484375, -644.5399169921875, -599.9476318359375, -555.3553466796875, -510.7630615234375, -466.1708068847656, -421.5785217285156, -376.98626708984375, -332.39398193359375, -287.80169677734375, -243.20944213867188, -198.6171875, -154.02491760253906, -109.4326400756836, -64.84036254882812, -20.248092651367188, 24.34417724609375, 68.93646240234375, 113.52871704101562, 158.12100219726562, 202.71327209472656, 247.3055419921875, 291.8978271484375, 336.4901123046875, 381.0823669433594, 425.6746520996094, 470.26690673828125, 514.8591918945312, 559.4514770507812, 604.0437622070312, 648.635986328125, 693.228271484375, 737.820556640625, 782.412841796875, 827.005126953125, 871.597412109375, 916.189697265625, 960.781982421875, 1005.374267578125, 1049.966552734375, 1094.558837890625, 1139.151123046875, 1183.7432861328125, 1228.3355712890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 3.0, 12.0, 7.0, 9.0, 14.0, 15.0, 19.0, 14.0, 30.0, 32.0, 29.0, 35.0, 46.0, 45.0, 41.0, 47.0, 48.0, 58.0, 61.0, 53.0, 51.0, 52.0, 48.0, 35.0, 35.0, 26.0, 19.0, 9.0, 21.0, 16.0, 11.0, 18.0, 5.0, 11.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-202.57273864746094, -195.14317321777344, -187.71360778808594, -180.28404235839844, -172.85447692871094, -165.42491149902344, -157.995361328125, -150.5657958984375, -143.13623046875, -135.7066650390625, -128.277099609375, -120.8475341796875, -113.41796875, -105.9884033203125, -98.55884552001953, -91.12928009033203, -83.69970703125, -76.2701416015625, -68.840576171875, -61.411014556884766, -53.981449127197266, -46.551883697509766, -39.12232208251953, -31.69275665283203, -24.26319122314453, -16.83362579345703, -9.404062271118164, -1.9744987487792969, 5.455066680908203, 12.884632110595703, 20.314193725585938, 27.743759155273438, 35.17333984375, 42.6029052734375, 50.032470703125, 57.462032318115234, 64.8916015625, 72.3211669921875, 79.75072479248047, 87.18029022216797, 94.60985565185547, 102.03942108154297, 109.46898651123047, 116.89854431152344, 124.32810974121094, 131.75767517089844, 139.18724060058594, 146.61680603027344, 154.04637145996094, 161.47593688964844, 168.90550231933594, 176.33506774902344, 183.76463317871094, 191.19419860839844, 198.62374877929688, 206.05331420898438, 213.48287963867188, 220.91244506835938, 228.34201049804688, 235.77157592773438, 243.20114135742188, 250.63070678710938, 258.0602722167969, 265.4898376464844, 272.9194030761719]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 13.0, 15.0, 32.0, 55.0, 83.0, 127.0, 215.0, 365.0, 746.0, 1385.0, 2675.0, 5443.0, 11762.0, 26176.0, 60221.0, 140933.0, 313815.0, 273999.0, 117952.0, 50632.0, 22280.0, 9946.0, 4713.0, 2290.0, 1147.0, 630.0, 365.0, 208.0, 134.0, 86.0, 39.0, 28.0, 12.0, 8.0, 6.0, 8.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -15.8564453125, -15.244140625, -14.6318359375, -14.01953125, -13.4072265625, -12.794921875, -12.1826171875, -11.5703125, -10.9580078125, -10.345703125, -9.7333984375, -9.12109375, -8.5087890625, -7.896484375, -7.2841796875, -6.671875, -6.0595703125, -5.447265625, -4.8349609375, -4.22265625, -3.6103515625, -2.998046875, -2.3857421875, -1.7734375, -1.1611328125, -0.548828125, 0.0634765625, 0.67578125, 1.2880859375, 1.900390625, 2.5126953125, 3.125, 3.7373046875, 4.349609375, 4.9619140625, 5.57421875, 6.1865234375, 6.798828125, 7.4111328125, 8.0234375, 8.6357421875, 9.248046875, 9.8603515625, 10.47265625, 11.0849609375, 11.697265625, 12.3095703125, 12.921875, 13.5341796875, 14.146484375, 14.7587890625, 15.37109375, 15.9833984375, 16.595703125, 17.2080078125, 17.8203125, 18.4326171875, 19.044921875, 19.6572265625, 20.26953125, 20.8818359375, 21.494140625, 22.1064453125, 22.71875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 5.0, 7.0, 15.0, 23.0, 15.0, 27.0, 27.0, 42.0, 42.0, 63.0, 48.0, 82.0, 73.0, 62.0, 65.0, 65.0, 55.0, 57.0, 41.0, 38.0, 23.0, 25.0, 25.0, 13.0, 13.0, 7.0, 9.0, 8.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.8255615234375, -17.322998046875, -16.8204345703125, -16.31787109375, -15.8153076171875, -15.312744140625, -14.8101806640625, -14.3076171875, -13.8050537109375, -13.302490234375, -12.7999267578125, -12.29736328125, -11.7947998046875, -11.292236328125, -10.7896728515625, -10.287109375, -9.7845458984375, -9.281982421875, -8.7794189453125, -8.27685546875, -7.7742919921875, -7.271728515625, -6.7691650390625, -6.2666015625, -5.7640380859375, -5.261474609375, -4.7589111328125, -4.25634765625, -3.7537841796875, -3.251220703125, -2.7486572265625, -2.24609375, -1.7435302734375, -1.240966796875, -0.7384033203125, -0.23583984375, 0.2667236328125, 0.769287109375, 1.2718505859375, 1.7744140625, 2.2769775390625, 2.779541015625, 3.2821044921875, 3.78466796875, 4.2872314453125, 4.789794921875, 5.2923583984375, 5.794921875, 6.2974853515625, 6.800048828125, 7.3026123046875, 7.80517578125, 8.3077392578125, 8.810302734375, 9.3128662109375, 9.8154296875, 10.3179931640625, 10.820556640625, 11.3231201171875, 11.82568359375, 12.3282470703125, 12.830810546875, 13.3333740234375, 13.8359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 13.0, 17.0, 29.0, 34.0, 47.0, 73.0, 110.0, 162.0, 249.0, 358.0, 560.0, 917.0, 1768.0, 4595.0, 17443.0, 116646.0, 720047.0, 153658.0, 21912.0, 5233.0, 2057.0, 960.0, 564.0, 338.0, 237.0, 162.0, 97.0, 76.0, 50.0, 32.0, 31.0, 22.0, 15.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.72705078125, -41.3291015625, -39.93115234375, -38.533203125, -37.13525390625, -35.7373046875, -34.33935546875, -32.94140625, -31.54345703125, -30.1455078125, -28.74755859375, -27.349609375, -25.95166015625, -24.5537109375, -23.15576171875, -21.7578125, -20.35986328125, -18.9619140625, -17.56396484375, -16.166015625, -14.76806640625, -13.3701171875, -11.97216796875, -10.57421875, -9.17626953125, -7.7783203125, -6.38037109375, -4.982421875, -3.58447265625, -2.1865234375, -0.78857421875, 0.609375, 2.00732421875, 3.4052734375, 4.80322265625, 6.201171875, 7.59912109375, 8.9970703125, 10.39501953125, 11.79296875, 13.19091796875, 14.5888671875, 15.98681640625, 17.384765625, 18.78271484375, 20.1806640625, 21.57861328125, 22.9765625, 24.37451171875, 25.7724609375, 27.17041015625, 28.568359375, 29.96630859375, 31.3642578125, 32.76220703125, 34.16015625, 35.55810546875, 36.9560546875, 38.35400390625, 39.751953125, 41.14990234375, 42.5478515625, 43.94580078125, 45.34375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 9.0, 13.0, 17.0, 19.0, 22.0, 20.0, 33.0, 33.0, 38.0, 29.0, 51.0, 41.0, 56.0, 52.0, 54.0, 68.0, 53.0, 63.0, 40.0, 43.0, 41.0, 36.0, 33.0, 31.0, 30.0, 11.0, 10.0, 7.0, 9.0, 8.0, 5.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.09375, -55.2451171875, -53.396484375, -51.5478515625, -49.69921875, -47.8505859375, -46.001953125, -44.1533203125, -42.3046875, -40.4560546875, -38.607421875, -36.7587890625, -34.91015625, -33.0615234375, -31.212890625, -29.3642578125, -27.515625, -25.6669921875, -23.818359375, -21.9697265625, -20.12109375, -18.2724609375, -16.423828125, -14.5751953125, -12.7265625, -10.8779296875, -9.029296875, -7.1806640625, -5.33203125, -3.4833984375, -1.634765625, 0.2138671875, 2.0625, 3.9111328125, 5.759765625, 7.6083984375, 9.45703125, 11.3056640625, 13.154296875, 15.0029296875, 16.8515625, 18.7001953125, 20.548828125, 22.3974609375, 24.24609375, 26.0947265625, 27.943359375, 29.7919921875, 31.640625, 33.4892578125, 35.337890625, 37.1865234375, 39.03515625, 40.8837890625, 42.732421875, 44.5810546875, 46.4296875, 48.2783203125, 50.126953125, 51.9755859375, 53.82421875, 55.6728515625, 57.521484375, 59.3701171875, 61.21875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 12.0, 13.0, 24.0, 23.0, 52.0, 72.0, 115.0, 236.0, 410.0, 1018.0, 2941.0, 12710.0, 96739.0, 768951.0, 142769.0, 16672.0, 3597.0, 1135.0, 479.0, 214.0, 124.0, 76.0, 50.0, 30.0, 28.0, 11.0, 12.0, 9.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.3671875, -12.915283203125, -12.46337890625, -12.011474609375, -11.5595703125, -11.107666015625, -10.65576171875, -10.203857421875, -9.751953125, -9.300048828125, -8.84814453125, -8.396240234375, -7.9443359375, -7.492431640625, -7.04052734375, -6.588623046875, -6.13671875, -5.684814453125, -5.23291015625, -4.781005859375, -4.3291015625, -3.877197265625, -3.42529296875, -2.973388671875, -2.521484375, -2.069580078125, -1.61767578125, -1.165771484375, -0.7138671875, -0.261962890625, 0.18994140625, 0.641845703125, 1.09375, 1.545654296875, 1.99755859375, 2.449462890625, 2.9013671875, 3.353271484375, 3.80517578125, 4.257080078125, 4.708984375, 5.160888671875, 5.61279296875, 6.064697265625, 6.5166015625, 6.968505859375, 7.42041015625, 7.872314453125, 8.32421875, 8.776123046875, 9.22802734375, 9.679931640625, 10.1318359375, 10.583740234375, 11.03564453125, 11.487548828125, 11.939453125, 12.391357421875, 12.84326171875, 13.295166015625, 13.7470703125, 14.198974609375, 14.65087890625, 15.102783203125, 15.5546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 5.0, 12.0, 13.0, 21.0, 24.0, 27.0, 26.0, 49.0, 46.0, 60.0, 80.0, 92.0, 91.0, 92.0, 67.0, 61.0, 57.0, 34.0, 41.0, 25.0, 14.0, 14.0, 11.0, 9.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027484893798828125, -0.0026638805866241455, -0.0025792717933654785, -0.0024946630001068115, -0.0024100542068481445, -0.0023254454135894775, -0.0022408366203308105, -0.0021562278270721436, -0.0020716190338134766, -0.0019870102405548096, -0.0019024014472961426, -0.0018177926540374756, -0.0017331838607788086, -0.0016485750675201416, -0.0015639662742614746, -0.0014793574810028076, -0.0013947486877441406, -0.0013101398944854736, -0.0012255311012268066, -0.0011409223079681396, -0.0010563135147094727, -0.0009717047214508057, -0.0008870959281921387, -0.0008024871349334717, -0.0007178783416748047, -0.0006332695484161377, -0.0005486607551574707, -0.0004640519618988037, -0.0003794431686401367, -0.0002948343753814697, -0.00021022558212280273, -0.00012561678886413574, -4.100799560546875e-05, 4.360079765319824e-05, 0.00012820959091186523, 0.00021281838417053223, 0.0002974271774291992, 0.0003820359706878662, 0.0004666447639465332, 0.0005512535572052002, 0.0006358623504638672, 0.0007204711437225342, 0.0008050799369812012, 0.0008896887302398682, 0.0009742975234985352, 0.0010589063167572021, 0.0011435151100158691, 0.0012281239032745361, 0.0013127326965332031, 0.0013973414897918701, 0.0014819502830505371, 0.001566559076309204, 0.001651167869567871, 0.001735776662826538, 0.001820385456085205, 0.001904994249343872, 0.001989603042602539, 0.002074211835861206, 0.002158820629119873, 0.00224342942237854, 0.002328038215637207, 0.002412647008895874, 0.002497255802154541, 0.002581864595413208, 0.002666473388671875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 13.0, 8.0, 7.0, 14.0, 25.0, 35.0, 40.0, 62.0, 95.0, 159.0, 254.0, 391.0, 719.0, 1534.0, 3662.0, 11903.0, 61821.0, 597656.0, 314662.0, 40650.0, 8950.0, 3015.0, 1249.0, 640.0, 349.0, 206.0, 139.0, 83.0, 63.0, 43.0, 28.0, 11.0, 20.0, 10.0, 8.0, 9.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.59375, -10.22705078125, -9.8603515625, -9.49365234375, -9.126953125, -8.76025390625, -8.3935546875, -8.02685546875, -7.66015625, -7.29345703125, -6.9267578125, -6.56005859375, -6.193359375, -5.82666015625, -5.4599609375, -5.09326171875, -4.7265625, -4.35986328125, -3.9931640625, -3.62646484375, -3.259765625, -2.89306640625, -2.5263671875, -2.15966796875, -1.79296875, -1.42626953125, -1.0595703125, -0.69287109375, -0.326171875, 0.04052734375, 0.4072265625, 0.77392578125, 1.140625, 1.50732421875, 1.8740234375, 2.24072265625, 2.607421875, 2.97412109375, 3.3408203125, 3.70751953125, 4.07421875, 4.44091796875, 4.8076171875, 5.17431640625, 5.541015625, 5.90771484375, 6.2744140625, 6.64111328125, 7.0078125, 7.37451171875, 7.7412109375, 8.10791015625, 8.474609375, 8.84130859375, 9.2080078125, 9.57470703125, 9.94140625, 10.30810546875, 10.6748046875, 11.04150390625, 11.408203125, 11.77490234375, 12.1416015625, 12.50830078125, 12.875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 13.0, 9.0, 10.0, 14.0, 17.0, 26.0, 16.0, 24.0, 32.0, 31.0, 38.0, 43.0, 42.0, 60.0, 45.0, 48.0, 52.0, 53.0, 56.0, 54.0, 34.0, 40.0, 36.0, 25.0, 24.0, 28.0, 21.0, 19.0, 17.0, 11.0, 12.0, 8.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.01953125, -6.75213623046875, -6.4847412109375, -6.21734619140625, -5.949951171875, -5.68255615234375, -5.4151611328125, -5.14776611328125, -4.88037109375, -4.61297607421875, -4.3455810546875, -4.07818603515625, -3.810791015625, -3.54339599609375, -3.2760009765625, -3.00860595703125, -2.7412109375, -2.47381591796875, -2.2064208984375, -1.93902587890625, -1.671630859375, -1.40423583984375, -1.1368408203125, -0.86944580078125, -0.60205078125, -0.33465576171875, -0.0672607421875, 0.20013427734375, 0.467529296875, 0.73492431640625, 1.0023193359375, 1.26971435546875, 1.537109375, 1.80450439453125, 2.0718994140625, 2.33929443359375, 2.606689453125, 2.87408447265625, 3.1414794921875, 3.40887451171875, 3.67626953125, 3.94366455078125, 4.2110595703125, 4.47845458984375, 4.745849609375, 5.01324462890625, 5.2806396484375, 5.54803466796875, 5.8154296875, 6.08282470703125, 6.3502197265625, 6.61761474609375, 6.885009765625, 7.15240478515625, 7.4197998046875, 7.68719482421875, 7.95458984375, 8.22198486328125, 8.4893798828125, 8.75677490234375, 9.024169921875, 9.29156494140625, 9.5589599609375, 9.82635498046875, 10.09375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 9.0, 11.0, 56.0, 109.0, 244.0, 364.0, 141.0, 40.0, 16.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.8962707519531, -258.9575500488281, -243.018798828125, -227.080078125, -211.14134216308594, -195.20260620117188, -179.26388549804688, -163.3251495361328, -147.38641357421875, -131.4476776123047, -115.50894927978516, -99.57022094726562, -83.63148498535156, -67.6927490234375, -51.75402069091797, -35.81529235839844, -19.876556396484375, -3.937824249267578, 12.000907897949219, 27.939640045166016, 43.87837219238281, 59.817108154296875, 75.7558364868164, 91.69456481933594, 107.63330078125, 123.57203674316406, 139.51077270507812, 155.44949340820312, 171.3882293701172, 187.32696533203125, 203.26568603515625, 219.2044219970703, 235.14312744140625, 251.0818634033203, 267.0205993652344, 282.9593200683594, 298.8980712890625, 314.8367919921875, 330.7755126953125, 346.7142333984375, 362.6529846191406, 378.5917053222656, 394.53045654296875, 410.46917724609375, 426.40789794921875, 442.3466491699219, 458.2853698730469, 474.22412109375, 490.162841796875, 506.1015625, 522.040283203125, 537.9790649414062, 553.9177856445312, 569.8565063476562, 585.7952270507812, 601.7339477539062, 617.6727294921875, 633.6114501953125, 649.5501708984375, 665.4889526367188, 681.4276733398438, 697.3663940429688, 713.3051147460938, 729.2438354492188, 745.1825561523438]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 11.0, 7.0, 11.0, 14.0, 22.0, 16.0, 29.0, 35.0, 32.0, 40.0, 40.0, 46.0, 77.0, 83.0, 106.0, 78.0, 52.0, 46.0, 38.0, 43.0, 28.0, 27.0, 15.0, 21.0, 16.0, 17.0, 7.0, 13.0, 5.0, 3.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-253.1094207763672, -245.22860717773438, -237.34779357910156, -229.46697998046875, -221.58615112304688, -213.70535278320312, -205.82452392578125, -197.94371032714844, -190.06289672851562, -182.1820831298828, -174.30126953125, -166.4204559326172, -158.53964233398438, -150.6588134765625, -142.7779998779297, -134.89718627929688, -127.01637268066406, -119.13555908203125, -111.25474548339844, -103.3739242553711, -95.49311065673828, -87.61229705810547, -79.73147583007812, -71.85066223144531, -63.9698486328125, -56.08903503417969, -48.20821762084961, -40.32740020751953, -32.44658660888672, -24.565773010253906, -16.684955596923828, -8.80413818359375, -0.923309326171875, 6.95750617980957, 14.838321685791016, 22.71913719177246, 30.599952697753906, 38.48076629638672, 46.3615837097168, 54.242401123046875, 62.12321472167969, 70.0040283203125, 77.88484191894531, 85.76566314697266, 93.64647674560547, 101.52729034423828, 109.40811157226562, 117.28892517089844, 125.16973876953125, 133.05055236816406, 140.93136596679688, 148.8121795654297, 156.6929931640625, 164.57382202148438, 172.4546356201172, 180.33544921875, 188.2162628173828, 196.09707641601562, 203.97789001464844, 211.85870361328125, 219.73953247070312, 227.62033081054688, 235.50115966796875, 243.38197326660156, 251.26278686523438]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 5.0, 9.0, 6.0, 21.0, 36.0, 38.0, 83.0, 106.0, 218.0, 378.0, 705.0, 1204.0, 2327.0, 4780.0, 10474.0, 27586.0, 109752.0, 729316.0, 2619558.0, 559123.0, 85089.0, 24054.0, 9583.0, 4554.0, 2345.0, 1281.0, 646.0, 380.0, 225.0, 138.0, 85.0, 51.0, 48.0, 23.0, 17.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.21875, -16.7587890625, -16.298828125, -15.8388671875, -15.37890625, -14.9189453125, -14.458984375, -13.9990234375, -13.5390625, -13.0791015625, -12.619140625, -12.1591796875, -11.69921875, -11.2392578125, -10.779296875, -10.3193359375, -9.859375, -9.3994140625, -8.939453125, -8.4794921875, -8.01953125, -7.5595703125, -7.099609375, -6.6396484375, -6.1796875, -5.7197265625, -5.259765625, -4.7998046875, -4.33984375, -3.8798828125, -3.419921875, -2.9599609375, -2.5, -2.0400390625, -1.580078125, -1.1201171875, -0.66015625, -0.2001953125, 0.259765625, 0.7197265625, 1.1796875, 1.6396484375, 2.099609375, 2.5595703125, 3.01953125, 3.4794921875, 3.939453125, 4.3994140625, 4.859375, 5.3193359375, 5.779296875, 6.2392578125, 6.69921875, 7.1591796875, 7.619140625, 8.0791015625, 8.5390625, 8.9990234375, 9.458984375, 9.9189453125, 10.37890625, 10.8388671875, 11.298828125, 11.7587890625, 12.21875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 10.0, 17.0, 30.0, 18.0, 20.0, 32.0, 50.0, 47.0, 61.0, 54.0, 60.0, 69.0, 64.0, 59.0, 67.0, 61.0, 62.0, 54.0, 37.0, 30.0, 18.0, 16.0, 11.0, 11.0, 12.0, 6.0, 9.0, 5.0, 1.0, 4.0, 0.0, 3.0], "bins": [-21.5, -21.01318359375, -20.5263671875, -20.03955078125, -19.552734375, -19.06591796875, -18.5791015625, -18.09228515625, -17.60546875, -17.11865234375, -16.6318359375, -16.14501953125, -15.658203125, -15.17138671875, -14.6845703125, -14.19775390625, -13.7109375, -13.22412109375, -12.7373046875, -12.25048828125, -11.763671875, -11.27685546875, -10.7900390625, -10.30322265625, -9.81640625, -9.32958984375, -8.8427734375, -8.35595703125, -7.869140625, -7.38232421875, -6.8955078125, -6.40869140625, -5.921875, -5.43505859375, -4.9482421875, -4.46142578125, -3.974609375, -3.48779296875, -3.0009765625, -2.51416015625, -2.02734375, -1.54052734375, -1.0537109375, -0.56689453125, -0.080078125, 0.40673828125, 0.8935546875, 1.38037109375, 1.8671875, 2.35400390625, 2.8408203125, 3.32763671875, 3.814453125, 4.30126953125, 4.7880859375, 5.27490234375, 5.76171875, 6.24853515625, 6.7353515625, 7.22216796875, 7.708984375, 8.19580078125, 8.6826171875, 9.16943359375, 9.65625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 11.0, 13.0, 14.0, 27.0, 45.0, 54.0, 102.0, 151.0, 291.0, 528.0, 1077.0, 2286.0, 5603.0, 15355.0, 54108.0, 314657.0, 3353999.0, 366507.0, 54521.0, 15285.0, 5368.0, 2201.0, 956.0, 494.0, 266.0, 122.0, 78.0, 57.0, 31.0, 22.0, 12.0, 13.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -23.183837890625, -22.39892578125, -21.614013671875, -20.8291015625, -20.044189453125, -19.25927734375, -18.474365234375, -17.689453125, -16.904541015625, -16.11962890625, -15.334716796875, -14.5498046875, -13.764892578125, -12.97998046875, -12.195068359375, -11.41015625, -10.625244140625, -9.84033203125, -9.055419921875, -8.2705078125, -7.485595703125, -6.70068359375, -5.915771484375, -5.130859375, -4.345947265625, -3.56103515625, -2.776123046875, -1.9912109375, -1.206298828125, -0.42138671875, 0.363525390625, 1.1484375, 1.933349609375, 2.71826171875, 3.503173828125, 4.2880859375, 5.072998046875, 5.85791015625, 6.642822265625, 7.427734375, 8.212646484375, 8.99755859375, 9.782470703125, 10.5673828125, 11.352294921875, 12.13720703125, 12.922119140625, 13.70703125, 14.491943359375, 15.27685546875, 16.061767578125, 16.8466796875, 17.631591796875, 18.41650390625, 19.201416015625, 19.986328125, 20.771240234375, 21.55615234375, 22.341064453125, 23.1259765625, 23.910888671875, 24.69580078125, 25.480712890625, 26.265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 2.0, 4.0, 10.0, 6.0, 14.0, 10.0, 22.0, 21.0, 19.0, 47.0, 49.0, 69.0, 68.0, 125.0, 209.0, 368.0, 684.0, 835.0, 618.0, 338.0, 193.0, 108.0, 64.0, 40.0, 32.0, 30.0, 21.0, 15.0, 13.0, 5.0, 5.0, 7.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-33.4375, -32.518798828125, -31.60009765625, -30.681396484375, -29.7626953125, -28.843994140625, -27.92529296875, -27.006591796875, -26.087890625, -25.169189453125, -24.25048828125, -23.331787109375, -22.4130859375, -21.494384765625, -20.57568359375, -19.656982421875, -18.73828125, -17.819580078125, -16.90087890625, -15.982177734375, -15.0634765625, -14.144775390625, -13.22607421875, -12.307373046875, -11.388671875, -10.469970703125, -9.55126953125, -8.632568359375, -7.7138671875, -6.795166015625, -5.87646484375, -4.957763671875, -4.0390625, -3.120361328125, -2.20166015625, -1.282958984375, -0.3642578125, 0.554443359375, 1.47314453125, 2.391845703125, 3.310546875, 4.229248046875, 5.14794921875, 6.066650390625, 6.9853515625, 7.904052734375, 8.82275390625, 9.741455078125, 10.66015625, 11.578857421875, 12.49755859375, 13.416259765625, 14.3349609375, 15.253662109375, 16.17236328125, 17.091064453125, 18.009765625, 18.928466796875, 19.84716796875, 20.765869140625, 21.6845703125, 22.603271484375, 23.52197265625, 24.440673828125, 25.359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 9.0, 10.0, 33.0, 176.0, 402.0, 288.0, 58.0, 15.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-819.5448608398438, -799.463134765625, -779.38134765625, -759.2996215820312, -739.2178955078125, -719.1361083984375, -699.0543823242188, -678.97265625, -658.890869140625, -638.8091430664062, -618.7273559570312, -598.6456298828125, -578.5639038085938, -558.482177734375, -538.400390625, -518.3186645507812, -498.2369384765625, -478.1551818847656, -458.0734558105469, -437.99169921875, -417.90997314453125, -397.8282165527344, -377.7464599609375, -357.66473388671875, -337.5829772949219, -317.501220703125, -297.41949462890625, -277.3377380371094, -257.2559814453125, -237.17425537109375, -217.09249877929688, -197.01075744628906, -176.92901611328125, -156.84727478027344, -136.76553344726562, -116.68377685546875, -96.60203552246094, -76.52029418945312, -56.43854522705078, -36.35679626464844, -16.275054931640625, 3.806690216064453, 23.88843536376953, 43.97018051147461, 64.05192565917969, 84.1336669921875, 104.21541595458984, 124.29716491699219, 144.37890625, 164.4606475830078, 184.54238891601562, 204.6241455078125, 224.7058868408203, 244.78762817382812, 264.869384765625, 284.95111083984375, 305.0328674316406, 325.1146240234375, 345.19635009765625, 365.2781066894531, 385.35986328125, 405.44158935546875, 425.5233459472656, 445.6051025390625, 465.68682861328125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 1.0, 6.0, 7.0, 9.0, 11.0, 21.0, 14.0, 19.0, 16.0, 25.0, 34.0, 18.0, 29.0, 37.0, 37.0, 49.0, 40.0, 46.0, 47.0, 32.0, 41.0, 45.0, 48.0, 45.0, 38.0, 38.0, 29.0, 32.0, 32.0, 28.0, 23.0, 15.0, 22.0, 19.0, 9.0, 7.0, 11.0, 1.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.44758605957031, -116.98771667480469, -112.52783966064453, -108.06796264648438, -103.60809326171875, -99.14822387695312, -94.68834686279297, -90.22846984863281, -85.76860046386719, -81.30873107910156, -76.8488540649414, -72.38897705078125, -67.92910766601562, -63.469234466552734, -59.009361267089844, -54.54948806762695, -50.08961486816406, -45.62974166870117, -41.16986846923828, -36.70999526977539, -32.2501220703125, -27.79024887084961, -23.33037567138672, -18.870502471923828, -14.410629272460938, -9.950756072998047, -5.490882873535156, -1.0310096740722656, 3.428863525390625, 7.888736724853516, 12.348609924316406, 16.808483123779297, 21.268356323242188, 25.728229522705078, 30.18810272216797, 34.64797592163086, 39.10784912109375, 43.56772232055664, 48.02759552001953, 52.48746871948242, 56.94734191894531, 61.4072151184082, 65.8670883178711, 70.32696533203125, 74.78683471679688, 79.2467041015625, 83.70658111572266, 88.16645812988281, 92.62632751464844, 97.08619689941406, 101.54607391357422, 106.00595092773438, 110.4658203125, 114.92568969726562, 119.38556671142578, 123.84544372558594, 128.30531311035156, 132.7651824951172, 137.22506713867188, 141.6849365234375, 146.14480590820312, 150.60467529296875, 155.06454467773438, 159.52442932128906, 163.9842987060547]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 10.0, 13.0, 14.0, 21.0, 34.0, 52.0, 68.0, 95.0, 163.0, 244.0, 373.0, 634.0, 984.0, 1722.0, 2804.0, 4808.0, 8504.0, 15309.0, 27546.0, 52327.0, 101582.0, 202176.0, 278698.0, 168217.0, 84002.0, 43975.0, 23607.0, 12729.0, 7427.0, 4142.0, 2417.0, 1399.0, 899.0, 567.0, 333.0, 223.0, 145.0, 105.0, 72.0, 39.0, 26.0, 22.0, 13.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6015625, -14.135986328125, -13.67041015625, -13.204833984375, -12.7392578125, -12.273681640625, -11.80810546875, -11.342529296875, -10.876953125, -10.411376953125, -9.94580078125, -9.480224609375, -9.0146484375, -8.549072265625, -8.08349609375, -7.617919921875, -7.15234375, -6.686767578125, -6.22119140625, -5.755615234375, -5.2900390625, -4.824462890625, -4.35888671875, -3.893310546875, -3.427734375, -2.962158203125, -2.49658203125, -2.031005859375, -1.5654296875, -1.099853515625, -0.63427734375, -0.168701171875, 0.296875, 0.762451171875, 1.22802734375, 1.693603515625, 2.1591796875, 2.624755859375, 3.09033203125, 3.555908203125, 4.021484375, 4.487060546875, 4.95263671875, 5.418212890625, 5.8837890625, 6.349365234375, 6.81494140625, 7.280517578125, 7.74609375, 8.211669921875, 8.67724609375, 9.142822265625, 9.6083984375, 10.073974609375, 10.53955078125, 11.005126953125, 11.470703125, 11.936279296875, 12.40185546875, 12.867431640625, 13.3330078125, 13.798583984375, 14.26416015625, 14.729736328125, 15.1953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 4.0, 4.0, 10.0, 7.0, 7.0, 11.0, 19.0, 19.0, 15.0, 26.0, 24.0, 20.0, 25.0, 35.0, 34.0, 46.0, 50.0, 38.0, 49.0, 50.0, 47.0, 38.0, 34.0, 40.0, 47.0, 36.0, 29.0, 41.0, 28.0, 24.0, 29.0, 20.0, 18.0, 14.0, 16.0, 11.0, 7.0, 9.0, 6.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5234375, -9.1856689453125, -8.847900390625, -8.5101318359375, -8.17236328125, -7.8345947265625, -7.496826171875, -7.1590576171875, -6.8212890625, -6.4835205078125, -6.145751953125, -5.8079833984375, -5.47021484375, -5.1324462890625, -4.794677734375, -4.4569091796875, -4.119140625, -3.7813720703125, -3.443603515625, -3.1058349609375, -2.76806640625, -2.4302978515625, -2.092529296875, -1.7547607421875, -1.4169921875, -1.0792236328125, -0.741455078125, -0.4036865234375, -0.06591796875, 0.2718505859375, 0.609619140625, 0.9473876953125, 1.28515625, 1.6229248046875, 1.960693359375, 2.2984619140625, 2.63623046875, 2.9739990234375, 3.311767578125, 3.6495361328125, 3.9873046875, 4.3250732421875, 4.662841796875, 5.0006103515625, 5.33837890625, 5.6761474609375, 6.013916015625, 6.3516845703125, 6.689453125, 7.0272216796875, 7.364990234375, 7.7027587890625, 8.04052734375, 8.3782958984375, 8.716064453125, 9.0538330078125, 9.3916015625, 9.7293701171875, 10.067138671875, 10.4049072265625, 10.74267578125, 11.0804443359375, 11.418212890625, 11.7559814453125, 12.09375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 2.0, 5.0, 5.0, 8.0, 10.0, 11.0, 9.0, 25.0, 41.0, 62.0, 45.0, 97.0, 126.0, 164.0, 258.0, 411.0, 668.0, 1114.0, 2363.0, 6196.0, 26182.0, 163105.0, 702655.0, 115368.0, 19565.0, 5122.0, 2034.0, 1017.0, 607.0, 379.0, 274.0, 165.0, 110.0, 105.0, 61.0, 53.0, 41.0, 24.0, 19.0, 16.0, 9.0, 6.0, 11.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-40.5625, -39.31103515625, -38.0595703125, -36.80810546875, -35.556640625, -34.30517578125, -33.0537109375, -31.80224609375, -30.55078125, -29.29931640625, -28.0478515625, -26.79638671875, -25.544921875, -24.29345703125, -23.0419921875, -21.79052734375, -20.5390625, -19.28759765625, -18.0361328125, -16.78466796875, -15.533203125, -14.28173828125, -13.0302734375, -11.77880859375, -10.52734375, -9.27587890625, -8.0244140625, -6.77294921875, -5.521484375, -4.27001953125, -3.0185546875, -1.76708984375, -0.515625, 0.73583984375, 1.9873046875, 3.23876953125, 4.490234375, 5.74169921875, 6.9931640625, 8.24462890625, 9.49609375, 10.74755859375, 11.9990234375, 13.25048828125, 14.501953125, 15.75341796875, 17.0048828125, 18.25634765625, 19.5078125, 20.75927734375, 22.0107421875, 23.26220703125, 24.513671875, 25.76513671875, 27.0166015625, 28.26806640625, 29.51953125, 30.77099609375, 32.0224609375, 33.27392578125, 34.525390625, 35.77685546875, 37.0283203125, 38.27978515625, 39.53125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 3.0, 4.0, 10.0, 12.0, 20.0, 13.0, 27.0, 25.0, 29.0, 26.0, 34.0, 31.0, 53.0, 50.0, 52.0, 51.0, 54.0, 53.0, 63.0, 45.0, 49.0, 31.0, 49.0, 37.0, 22.0, 23.0, 24.0, 19.0, 28.0, 16.0, 8.0, 12.0, 4.0, 8.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.125, -44.61328125, -43.1015625, -41.58984375, -40.078125, -38.56640625, -37.0546875, -35.54296875, -34.03125, -32.51953125, -31.0078125, -29.49609375, -27.984375, -26.47265625, -24.9609375, -23.44921875, -21.9375, -20.42578125, -18.9140625, -17.40234375, -15.890625, -14.37890625, -12.8671875, -11.35546875, -9.84375, -8.33203125, -6.8203125, -5.30859375, -3.796875, -2.28515625, -0.7734375, 0.73828125, 2.25, 3.76171875, 5.2734375, 6.78515625, 8.296875, 9.80859375, 11.3203125, 12.83203125, 14.34375, 15.85546875, 17.3671875, 18.87890625, 20.390625, 21.90234375, 23.4140625, 24.92578125, 26.4375, 27.94921875, 29.4609375, 30.97265625, 32.484375, 33.99609375, 35.5078125, 37.01953125, 38.53125, 40.04296875, 41.5546875, 43.06640625, 44.578125, 46.08984375, 47.6015625, 49.11328125, 50.625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 12.0, 12.0, 30.0, 35.0, 69.0, 76.0, 133.0, 209.0, 373.0, 767.0, 1644.0, 4698.0, 17413.0, 96548.0, 686744.0, 198096.0, 29947.0, 7276.0, 2295.0, 1001.0, 464.0, 274.0, 154.0, 88.0, 44.0, 41.0, 26.0, 23.0, 18.0, 4.0, 11.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.484375, -11.1531982421875, -10.822021484375, -10.4908447265625, -10.15966796875, -9.8284912109375, -9.497314453125, -9.1661376953125, -8.8349609375, -8.5037841796875, -8.172607421875, -7.8414306640625, -7.51025390625, -7.1790771484375, -6.847900390625, -6.5167236328125, -6.185546875, -5.8543701171875, -5.523193359375, -5.1920166015625, -4.86083984375, -4.5296630859375, -4.198486328125, -3.8673095703125, -3.5361328125, -3.2049560546875, -2.873779296875, -2.5426025390625, -2.21142578125, -1.8802490234375, -1.549072265625, -1.2178955078125, -0.88671875, -0.5555419921875, -0.224365234375, 0.1068115234375, 0.43798828125, 0.7691650390625, 1.100341796875, 1.4315185546875, 1.7626953125, 2.0938720703125, 2.425048828125, 2.7562255859375, 3.08740234375, 3.4185791015625, 3.749755859375, 4.0809326171875, 4.412109375, 4.7432861328125, 5.074462890625, 5.4056396484375, 5.73681640625, 6.0679931640625, 6.399169921875, 6.7303466796875, 7.0615234375, 7.3927001953125, 7.723876953125, 8.0550537109375, 8.38623046875, 8.7174072265625, 9.048583984375, 9.3797607421875, 9.7109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 11.0, 11.0, 6.0, 8.0, 16.0, 16.0, 22.0, 24.0, 27.0, 42.0, 45.0, 54.0, 59.0, 102.0, 96.0, 90.0, 79.0, 50.0, 58.0, 38.0, 26.0, 24.0, 18.0, 19.0, 15.0, 11.0, 12.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00191497802734375, -0.0018402040004730225, -0.001765429973602295, -0.0016906559467315674, -0.0016158819198608398, -0.0015411078929901123, -0.0014663338661193848, -0.0013915598392486572, -0.0013167858123779297, -0.0012420117855072021, -0.0011672377586364746, -0.001092463731765747, -0.0010176897048950195, -0.000942915678024292, -0.0008681416511535645, -0.0007933676242828369, -0.0007185935974121094, -0.0006438195705413818, -0.0005690455436706543, -0.0004942715167999268, -0.0004194974899291992, -0.0003447234630584717, -0.00026994943618774414, -0.0001951754093170166, -0.00012040138244628906, -4.5627355575561523e-05, 2.9146671295166016e-05, 0.00010392069816589355, 0.0001786947250366211, 0.00025346875190734863, 0.00032824277877807617, 0.0004030168056488037, 0.00047779083251953125, 0.0005525648593902588, 0.0006273388862609863, 0.0007021129131317139, 0.0007768869400024414, 0.0008516609668731689, 0.0009264349937438965, 0.001001209020614624, 0.0010759830474853516, 0.001150757074356079, 0.0012255311012268066, 0.0013003051280975342, 0.0013750791549682617, 0.0014498531818389893, 0.0015246272087097168, 0.0015994012355804443, 0.0016741752624511719, 0.0017489492893218994, 0.001823723316192627, 0.0018984973430633545, 0.001973271369934082, 0.0020480453968048096, 0.002122819423675537, 0.0021975934505462646, 0.002272367477416992, 0.0023471415042877197, 0.0024219155311584473, 0.002496689558029175, 0.0025714635848999023, 0.00264623761177063, 0.0027210116386413574, 0.002795785665512085, 0.0028705596923828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 5.0, 4.0, 13.0, 7.0, 28.0, 33.0, 51.0, 65.0, 102.0, 147.0, 252.0, 402.0, 684.0, 1290.0, 2754.0, 7099.0, 26718.0, 164039.0, 681354.0, 129305.0, 22427.0, 6486.0, 2393.0, 1197.0, 648.0, 370.0, 215.0, 128.0, 96.0, 61.0, 41.0, 34.0, 23.0, 20.0, 11.0, 12.0, 6.0, 8.0, 3.0, 6.0, 10.0, 0.0, 2.0, 3.0], "bins": [-11.015625, -10.72906494140625, -10.4425048828125, -10.15594482421875, -9.869384765625, -9.58282470703125, -9.2962646484375, -9.00970458984375, -8.72314453125, -8.43658447265625, -8.1500244140625, -7.86346435546875, -7.576904296875, -7.29034423828125, -7.0037841796875, -6.71722412109375, -6.4306640625, -6.14410400390625, -5.8575439453125, -5.57098388671875, -5.284423828125, -4.99786376953125, -4.7113037109375, -4.42474365234375, -4.13818359375, -3.85162353515625, -3.5650634765625, -3.27850341796875, -2.991943359375, -2.70538330078125, -2.4188232421875, -2.13226318359375, -1.845703125, -1.55914306640625, -1.2725830078125, -0.98602294921875, -0.699462890625, -0.41290283203125, -0.1263427734375, 0.16021728515625, 0.44677734375, 0.73333740234375, 1.0198974609375, 1.30645751953125, 1.593017578125, 1.87957763671875, 2.1661376953125, 2.45269775390625, 2.7392578125, 3.02581787109375, 3.3123779296875, 3.59893798828125, 3.885498046875, 4.17205810546875, 4.4586181640625, 4.74517822265625, 5.03173828125, 5.31829833984375, 5.6048583984375, 5.89141845703125, 6.177978515625, 6.46453857421875, 6.7510986328125, 7.03765869140625, 7.32421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 7.0, 9.0, 9.0, 18.0, 22.0, 21.0, 25.0, 30.0, 37.0, 41.0, 67.0, 69.0, 53.0, 80.0, 59.0, 67.0, 64.0, 46.0, 50.0, 44.0, 43.0, 30.0, 14.0, 21.0, 12.0, 5.0, 10.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1328125, -7.8712158203125, -7.609619140625, -7.3480224609375, -7.08642578125, -6.8248291015625, -6.563232421875, -6.3016357421875, -6.0400390625, -5.7784423828125, -5.516845703125, -5.2552490234375, -4.99365234375, -4.7320556640625, -4.470458984375, -4.2088623046875, -3.947265625, -3.6856689453125, -3.424072265625, -3.1624755859375, -2.90087890625, -2.6392822265625, -2.377685546875, -2.1160888671875, -1.8544921875, -1.5928955078125, -1.331298828125, -1.0697021484375, -0.80810546875, -0.5465087890625, -0.284912109375, -0.0233154296875, 0.23828125, 0.4998779296875, 0.761474609375, 1.0230712890625, 1.28466796875, 1.5462646484375, 1.807861328125, 2.0694580078125, 2.3310546875, 2.5926513671875, 2.854248046875, 3.1158447265625, 3.37744140625, 3.6390380859375, 3.900634765625, 4.1622314453125, 4.423828125, 4.6854248046875, 4.947021484375, 5.2086181640625, 5.47021484375, 5.7318115234375, 5.993408203125, 6.2550048828125, 6.5166015625, 6.7781982421875, 7.039794921875, 7.3013916015625, 7.56298828125, 7.8245849609375, 8.086181640625, 8.3477783203125, 8.609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 11.0, 9.0, 5.0, 19.0, 25.0, 33.0, 63.0, 77.0, 169.0, 207.0, 116.0, 81.0, 67.0, 49.0, 25.0, 13.0, 8.0, 5.0, 3.0, 2.0, 3.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.98703002929688, -200.41229248046875, -193.8375701904297, -187.26283264160156, -180.68809509277344, -174.11337280273438, -167.53863525390625, -160.96389770507812, -154.38916015625, -147.81442260742188, -141.2397003173828, -134.6649627685547, -128.09022521972656, -121.51549530029297, -114.94076538085938, -108.36602783203125, -101.79130554199219, -95.2165756225586, -88.64183807373047, -82.06710815429688, -75.49237060546875, -68.91764068603516, -62.34291076660156, -55.7681770324707, -49.193443298339844, -42.618709564208984, -36.043975830078125, -29.46924591064453, -22.894512176513672, -16.319778442382812, -9.745048522949219, -3.1703147888183594, 3.4044036865234375, 9.97913646697998, 16.553869247436523, 23.12860107421875, 29.70333480834961, 36.27806854248047, 42.85279846191406, 49.42753219604492, 56.00226593017578, 62.57699966430664, 69.1517333984375, 75.7264633178711, 82.30119323730469, 88.87593078613281, 95.4506607055664, 102.025390625, 108.60012817382812, 115.17485809326172, 121.74959564208984, 128.32432556152344, 134.89906311035156, 141.47378540039062, 148.04852294921875, 154.62326049804688, 161.197998046875, 167.77273559570312, 174.3474578857422, 180.9221954345703, 187.49693298339844, 194.0716552734375, 200.64639282226562, 207.22113037109375, 213.7958526611328]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 10.0, 12.0, 11.0, 16.0, 8.0, 12.0, 18.0, 25.0, 19.0, 21.0, 25.0, 26.0, 38.0, 38.0, 32.0, 49.0, 46.0, 64.0, 63.0, 95.0, 43.0, 39.0, 34.0, 39.0, 26.0, 23.0, 26.0, 16.0, 24.0, 13.0, 17.0, 9.0, 16.0, 7.0, 4.0, 10.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-196.14195251464844, -190.37557983398438, -184.6092071533203, -178.84283447265625, -173.07647705078125, -167.3101043701172, -161.54373168945312, -155.77735900878906, -150.010986328125, -144.24461364746094, -138.47824096679688, -132.71188354492188, -126.94551086425781, -121.17913818359375, -115.41276550292969, -109.64639282226562, -103.88003540039062, -98.11366271972656, -92.34729766845703, -86.58092498779297, -80.81455993652344, -75.04818725585938, -69.28181457519531, -63.515445709228516, -57.74907684326172, -51.98270797729492, -46.216339111328125, -40.44996643066406, -34.683597564697266, -28.91722869873047, -23.150856018066406, -17.38448715209961, -11.618133544921875, -5.851763725280762, -0.08539390563964844, 5.680976867675781, 11.447345733642578, 17.213714599609375, 22.980087280273438, 28.746456146240234, 34.51282501220703, 40.27919387817383, 46.045562744140625, 51.81193542480469, 57.578304290771484, 63.34467315673828, 69.11104583740234, 74.87741088867188, 80.64378356933594, 86.41015625, 92.17652130126953, 97.9428939819336, 103.70925903320312, 109.47563171386719, 115.24200439453125, 121.00837707519531, 126.77474212646484, 132.54110717773438, 138.30747985839844, 144.0738525390625, 149.84022521972656, 155.60659790039062, 161.37295532226562, 167.1393280029297, 172.90570068359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 9.0, 16.0, 16.0, 12.0, 25.0, 42.0, 74.0, 97.0, 157.0, 245.0, 498.0, 869.0, 1785.0, 3766.0, 9546.0, 32548.0, 178370.0, 1321177.0, 2232361.0, 342193.0, 48127.0, 12348.0, 4929.0, 2252.0, 1161.0, 632.0, 375.0, 216.0, 146.0, 90.0, 68.0, 40.0, 24.0, 16.0, 16.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.56494140625, -10.1611328125, -9.75732421875, -9.353515625, -8.94970703125, -8.5458984375, -8.14208984375, -7.73828125, -7.33447265625, -6.9306640625, -6.52685546875, -6.123046875, -5.71923828125, -5.3154296875, -4.91162109375, -4.5078125, -4.10400390625, -3.7001953125, -3.29638671875, -2.892578125, -2.48876953125, -2.0849609375, -1.68115234375, -1.27734375, -0.87353515625, -0.4697265625, -0.06591796875, 0.337890625, 0.74169921875, 1.1455078125, 1.54931640625, 1.953125, 2.35693359375, 2.7607421875, 3.16455078125, 3.568359375, 3.97216796875, 4.3759765625, 4.77978515625, 5.18359375, 5.58740234375, 5.9912109375, 6.39501953125, 6.798828125, 7.20263671875, 7.6064453125, 8.01025390625, 8.4140625, 8.81787109375, 9.2216796875, 9.62548828125, 10.029296875, 10.43310546875, 10.8369140625, 11.24072265625, 11.64453125, 12.04833984375, 12.4521484375, 12.85595703125, 13.259765625, 13.66357421875, 14.0673828125, 14.47119140625, 14.875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 10.0, 3.0, 7.0, 7.0, 6.0, 11.0, 16.0, 14.0, 17.0, 28.0, 18.0, 31.0, 19.0, 37.0, 37.0, 38.0, 46.0, 31.0, 36.0, 41.0, 33.0, 39.0, 37.0, 45.0, 39.0, 37.0, 44.0, 28.0, 32.0, 25.0, 26.0, 27.0, 27.0, 19.0, 17.0, 17.0, 11.0, 14.0, 3.0, 7.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.921875, -8.62841796875, -8.3349609375, -8.04150390625, -7.748046875, -7.45458984375, -7.1611328125, -6.86767578125, -6.57421875, -6.28076171875, -5.9873046875, -5.69384765625, -5.400390625, -5.10693359375, -4.8134765625, -4.52001953125, -4.2265625, -3.93310546875, -3.6396484375, -3.34619140625, -3.052734375, -2.75927734375, -2.4658203125, -2.17236328125, -1.87890625, -1.58544921875, -1.2919921875, -0.99853515625, -0.705078125, -0.41162109375, -0.1181640625, 0.17529296875, 0.46875, 0.76220703125, 1.0556640625, 1.34912109375, 1.642578125, 1.93603515625, 2.2294921875, 2.52294921875, 2.81640625, 3.10986328125, 3.4033203125, 3.69677734375, 3.990234375, 4.28369140625, 4.5771484375, 4.87060546875, 5.1640625, 5.45751953125, 5.7509765625, 6.04443359375, 6.337890625, 6.63134765625, 6.9248046875, 7.21826171875, 7.51171875, 7.80517578125, 8.0986328125, 8.39208984375, 8.685546875, 8.97900390625, 9.2724609375, 9.56591796875, 9.859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 12.0, 19.0, 33.0, 56.0, 77.0, 189.0, 376.0, 931.0, 2872.0, 12417.0, 93518.0, 3631890.0, 417207.0, 27015.0, 5151.0, 1423.0, 502.0, 256.0, 117.0, 72.0, 46.0, 38.0, 24.0, 10.0, 6.0, 8.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-35.375, -34.384521484375, -33.39404296875, -32.403564453125, -31.4130859375, -30.422607421875, -29.43212890625, -28.441650390625, -27.451171875, -26.460693359375, -25.47021484375, -24.479736328125, -23.4892578125, -22.498779296875, -21.50830078125, -20.517822265625, -19.52734375, -18.536865234375, -17.54638671875, -16.555908203125, -15.5654296875, -14.574951171875, -13.58447265625, -12.593994140625, -11.603515625, -10.613037109375, -9.62255859375, -8.632080078125, -7.6416015625, -6.651123046875, -5.66064453125, -4.670166015625, -3.6796875, -2.689208984375, -1.69873046875, -0.708251953125, 0.2822265625, 1.272705078125, 2.26318359375, 3.253662109375, 4.244140625, 5.234619140625, 6.22509765625, 7.215576171875, 8.2060546875, 9.196533203125, 10.18701171875, 11.177490234375, 12.16796875, 13.158447265625, 14.14892578125, 15.139404296875, 16.1298828125, 17.120361328125, 18.11083984375, 19.101318359375, 20.091796875, 21.082275390625, 22.07275390625, 23.063232421875, 24.0537109375, 25.044189453125, 26.03466796875, 27.025146484375, 28.015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 8.0, 13.0, 11.0, 24.0, 32.0, 41.0, 77.0, 148.0, 311.0, 641.0, 1048.0, 798.0, 424.0, 207.0, 104.0, 53.0, 34.0, 20.0, 16.0, 12.0, 15.0, 9.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.5, -23.54736328125, -22.5947265625, -21.64208984375, -20.689453125, -19.73681640625, -18.7841796875, -17.83154296875, -16.87890625, -15.92626953125, -14.9736328125, -14.02099609375, -13.068359375, -12.11572265625, -11.1630859375, -10.21044921875, -9.2578125, -8.30517578125, -7.3525390625, -6.39990234375, -5.447265625, -4.49462890625, -3.5419921875, -2.58935546875, -1.63671875, -0.68408203125, 0.2685546875, 1.22119140625, 2.173828125, 3.12646484375, 4.0791015625, 5.03173828125, 5.984375, 6.93701171875, 7.8896484375, 8.84228515625, 9.794921875, 10.74755859375, 11.7001953125, 12.65283203125, 13.60546875, 14.55810546875, 15.5107421875, 16.46337890625, 17.416015625, 18.36865234375, 19.3212890625, 20.27392578125, 21.2265625, 22.17919921875, 23.1318359375, 24.08447265625, 25.037109375, 25.98974609375, 26.9423828125, 27.89501953125, 28.84765625, 29.80029296875, 30.7529296875, 31.70556640625, 32.658203125, 33.61083984375, 34.5634765625, 35.51611328125, 36.46875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 17.0, 35.0, 131.0, 243.0, 316.0, 172.0, 44.0, 21.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-492.08074951171875, -481.1924133300781, -470.3040771484375, -459.4157409667969, -448.52740478515625, -437.6390380859375, -426.7507019042969, -415.86236572265625, -404.9740295410156, -394.085693359375, -383.1973571777344, -372.30902099609375, -361.420654296875, -350.5323181152344, -339.64398193359375, -328.7556457519531, -317.8673095703125, -306.9789733886719, -296.09063720703125, -285.2023010253906, -274.31396484375, -263.42559814453125, -252.53726196289062, -241.64892578125, -230.76058959960938, -219.87225341796875, -208.98391723632812, -198.09556579589844, -187.2072296142578, -176.3188934326172, -165.4305419921875, -154.54220581054688, -143.6538543701172, -132.76551818847656, -121.8771743774414, -110.98883056640625, -100.10049438476562, -89.212158203125, -78.32381439208984, -67.43547058105469, -56.54713439941406, -45.65879440307617, -34.77045440673828, -23.88211441040039, -12.9937744140625, -2.1054344177246094, 8.782905578613281, 19.671249389648438, 30.559585571289062, 41.44792556762695, 52.336265563964844, 63.224605560302734, 74.11294555664062, 85.00128173828125, 95.8896255493164, 106.77796936035156, 117.66630554199219, 128.5546417236328, 139.4429931640625, 150.33132934570312, 161.21966552734375, 172.10800170898438, 182.996337890625, 193.8846893310547, 204.7730255126953]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 11.0, 9.0, 8.0, 11.0, 14.0, 17.0, 12.0, 21.0, 19.0, 19.0, 33.0, 32.0, 34.0, 35.0, 54.0, 34.0, 38.0, 33.0, 38.0, 53.0, 45.0, 42.0, 31.0, 41.0, 31.0, 38.0, 37.0, 33.0, 32.0, 24.0, 13.0, 16.0, 14.0, 14.0, 15.0, 7.0, 5.0, 7.0, 11.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-103.19453430175781, -100.13896942138672, -97.08340454101562, -94.02784729003906, -90.97228240966797, -87.91671752929688, -84.86116027832031, -81.80559539794922, -78.75003051757812, -75.69446563720703, -72.63890075683594, -69.58334350585938, -66.52777862548828, -63.47221374511719, -60.41665267944336, -57.36109161376953, -54.30552673339844, -51.249961853027344, -48.194400787353516, -45.13883972167969, -42.083274841308594, -39.0277099609375, -35.97214889526367, -32.916587829589844, -29.86102294921875, -26.80545997619629, -23.749897003173828, -20.694334030151367, -17.638771057128906, -14.583208084106445, -11.527645111083984, -8.472082138061523, -5.4165191650390625, -2.3609561920166016, 0.6946067810058594, 3.7501697540283203, 6.805732727050781, 9.861295700073242, 12.916858673095703, 15.972421646118164, 19.027984619140625, 22.083547592163086, 25.139110565185547, 28.194673538208008, 31.25023651123047, 34.30580139160156, 37.36136245727539, 40.41692352294922, 43.47248840332031, 46.528053283691406, 49.583614349365234, 52.63917541503906, 55.694740295410156, 58.75030517578125, 61.80586624145508, 64.8614273071289, 67.9169921875, 70.9725570678711, 74.02812194824219, 77.08367919921875, 80.13924407958984, 83.19480895996094, 86.2503662109375, 89.3059310913086, 92.36149597167969]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 9.0, 15.0, 31.0, 31.0, 37.0, 72.0, 119.0, 175.0, 254.0, 407.0, 739.0, 1143.0, 2004.0, 3326.0, 5804.0, 10513.0, 19145.0, 35071.0, 65851.0, 124046.0, 215650.0, 242009.0, 148226.0, 79959.0, 42418.0, 22629.0, 12314.0, 6977.0, 3802.0, 2287.0, 1348.0, 786.0, 515.0, 305.0, 180.0, 120.0, 76.0, 52.0, 38.0, 27.0, 12.0, 9.0, 6.0, 2.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.546875, -10.197021484375, -9.84716796875, -9.497314453125, -9.1474609375, -8.797607421875, -8.44775390625, -8.097900390625, -7.748046875, -7.398193359375, -7.04833984375, -6.698486328125, -6.3486328125, -5.998779296875, -5.64892578125, -5.299072265625, -4.94921875, -4.599365234375, -4.24951171875, -3.899658203125, -3.5498046875, -3.199951171875, -2.85009765625, -2.500244140625, -2.150390625, -1.800537109375, -1.45068359375, -1.100830078125, -0.7509765625, -0.401123046875, -0.05126953125, 0.298583984375, 0.6484375, 0.998291015625, 1.34814453125, 1.697998046875, 2.0478515625, 2.397705078125, 2.74755859375, 3.097412109375, 3.447265625, 3.797119140625, 4.14697265625, 4.496826171875, 4.8466796875, 5.196533203125, 5.54638671875, 5.896240234375, 6.24609375, 6.595947265625, 6.94580078125, 7.295654296875, 7.6455078125, 7.995361328125, 8.34521484375, 8.695068359375, 9.044921875, 9.394775390625, 9.74462890625, 10.094482421875, 10.4443359375, 10.794189453125, 11.14404296875, 11.493896484375, 11.84375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 7.0, 5.0, 15.0, 11.0, 11.0, 14.0, 17.0, 17.0, 22.0, 22.0, 25.0, 35.0, 34.0, 30.0, 39.0, 54.0, 44.0, 44.0, 44.0, 39.0, 34.0, 40.0, 47.0, 36.0, 39.0, 39.0, 31.0, 31.0, 27.0, 23.0, 28.0, 17.0, 11.0, 10.0, 10.0, 8.0, 5.0, 9.0, 3.0, 6.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.859375, -8.5361328125, -8.212890625, -7.8896484375, -7.56640625, -7.2431640625, -6.919921875, -6.5966796875, -6.2734375, -5.9501953125, -5.626953125, -5.3037109375, -4.98046875, -4.6572265625, -4.333984375, -4.0107421875, -3.6875, -3.3642578125, -3.041015625, -2.7177734375, -2.39453125, -2.0712890625, -1.748046875, -1.4248046875, -1.1015625, -0.7783203125, -0.455078125, -0.1318359375, 0.19140625, 0.5146484375, 0.837890625, 1.1611328125, 1.484375, 1.8076171875, 2.130859375, 2.4541015625, 2.77734375, 3.1005859375, 3.423828125, 3.7470703125, 4.0703125, 4.3935546875, 4.716796875, 5.0400390625, 5.36328125, 5.6865234375, 6.009765625, 6.3330078125, 6.65625, 6.9794921875, 7.302734375, 7.6259765625, 7.94921875, 8.2724609375, 8.595703125, 8.9189453125, 9.2421875, 9.5654296875, 9.888671875, 10.2119140625, 10.53515625, 10.8583984375, 11.181640625, 11.5048828125, 11.828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 3.0, 15.0, 7.0, 4.0, 15.0, 16.0, 15.0, 34.0, 51.0, 70.0, 118.0, 198.0, 306.0, 636.0, 1342.0, 3265.0, 10040.0, 38745.0, 189601.0, 637005.0, 126863.0, 27557.0, 7719.0, 2549.0, 1047.0, 553.0, 283.0, 159.0, 110.0, 62.0, 55.0, 34.0, 20.0, 14.0, 16.0, 6.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-31.96875, -31.065185546875, -30.16162109375, -29.258056640625, -28.3544921875, -27.450927734375, -26.54736328125, -25.643798828125, -24.740234375, -23.836669921875, -22.93310546875, -22.029541015625, -21.1259765625, -20.222412109375, -19.31884765625, -18.415283203125, -17.51171875, -16.608154296875, -15.70458984375, -14.801025390625, -13.8974609375, -12.993896484375, -12.09033203125, -11.186767578125, -10.283203125, -9.379638671875, -8.47607421875, -7.572509765625, -6.6689453125, -5.765380859375, -4.86181640625, -3.958251953125, -3.0546875, -2.151123046875, -1.24755859375, -0.343994140625, 0.5595703125, 1.463134765625, 2.36669921875, 3.270263671875, 4.173828125, 5.077392578125, 5.98095703125, 6.884521484375, 7.7880859375, 8.691650390625, 9.59521484375, 10.498779296875, 11.40234375, 12.305908203125, 13.20947265625, 14.113037109375, 15.0166015625, 15.920166015625, 16.82373046875, 17.727294921875, 18.630859375, 19.534423828125, 20.43798828125, 21.341552734375, 22.2451171875, 23.148681640625, 24.05224609375, 24.955810546875, 25.859375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 4.0, 4.0, 5.0, 9.0, 10.0, 12.0, 14.0, 21.0, 22.0, 21.0, 40.0, 33.0, 62.0, 47.0, 57.0, 65.0, 50.0, 58.0, 59.0, 61.0, 69.0, 42.0, 40.0, 30.0, 35.0, 24.0, 18.0, 21.0, 12.0, 12.0, 13.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.59375, -47.03125, -45.46875, -43.90625, -42.34375, -40.78125, -39.21875, -37.65625, -36.09375, -34.53125, -32.96875, -31.40625, -29.84375, -28.28125, -26.71875, -25.15625, -23.59375, -22.03125, -20.46875, -18.90625, -17.34375, -15.78125, -14.21875, -12.65625, -11.09375, -9.53125, -7.96875, -6.40625, -4.84375, -3.28125, -1.71875, -0.15625, 1.40625, 2.96875, 4.53125, 6.09375, 7.65625, 9.21875, 10.78125, 12.34375, 13.90625, 15.46875, 17.03125, 18.59375, 20.15625, 21.71875, 23.28125, 24.84375, 26.40625, 27.96875, 29.53125, 31.09375, 32.65625, 34.21875, 35.78125, 37.34375, 38.90625, 40.46875, 42.03125, 43.59375, 45.15625, 46.71875, 48.28125, 49.84375, 51.40625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 7.0, 17.0, 14.0, 26.0, 32.0, 41.0, 69.0, 134.0, 212.0, 377.0, 764.0, 1547.0, 3341.0, 8336.0, 23227.0, 74854.0, 253071.0, 516445.0, 112841.0, 33380.0, 11257.0, 4510.0, 1890.0, 934.0, 494.0, 268.0, 163.0, 92.0, 69.0, 41.0, 30.0, 13.0, 10.0, 7.0, 6.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-6.6640625, -6.47454833984375, -6.2850341796875, -6.09552001953125, -5.906005859375, -5.71649169921875, -5.5269775390625, -5.33746337890625, -5.14794921875, -4.95843505859375, -4.7689208984375, -4.57940673828125, -4.389892578125, -4.20037841796875, -4.0108642578125, -3.82135009765625, -3.6318359375, -3.44232177734375, -3.2528076171875, -3.06329345703125, -2.873779296875, -2.68426513671875, -2.4947509765625, -2.30523681640625, -2.11572265625, -1.92620849609375, -1.7366943359375, -1.54718017578125, -1.357666015625, -1.16815185546875, -0.9786376953125, -0.78912353515625, -0.599609375, -0.41009521484375, -0.2205810546875, -0.03106689453125, 0.158447265625, 0.34796142578125, 0.5374755859375, 0.72698974609375, 0.91650390625, 1.10601806640625, 1.2955322265625, 1.48504638671875, 1.674560546875, 1.86407470703125, 2.0535888671875, 2.24310302734375, 2.4326171875, 2.62213134765625, 2.8116455078125, 3.00115966796875, 3.190673828125, 3.38018798828125, 3.5697021484375, 3.75921630859375, 3.94873046875, 4.13824462890625, 4.3277587890625, 4.51727294921875, 4.706787109375, 4.89630126953125, 5.0858154296875, 5.27532958984375, 5.46484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 5.0, 10.0, 15.0, 32.0, 29.0, 64.0, 72.0, 92.0, 154.0, 141.0, 135.0, 76.0, 57.0, 36.0, 25.0, 17.0, 7.0, 7.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0041351318359375, -0.004006326198577881, -0.0038775205612182617, -0.0037487149238586426, -0.0036199092864990234, -0.0034911036491394043, -0.003362298011779785, -0.003233492374420166, -0.003104686737060547, -0.0029758810997009277, -0.0028470754623413086, -0.0027182698249816895, -0.0025894641876220703, -0.002460658550262451, -0.002331852912902832, -0.002203047275543213, -0.0020742416381835938, -0.0019454360008239746, -0.0018166303634643555, -0.0016878247261047363, -0.0015590190887451172, -0.001430213451385498, -0.001301407814025879, -0.0011726021766662598, -0.0010437965393066406, -0.0009149909019470215, -0.0007861852645874023, -0.0006573796272277832, -0.0005285739898681641, -0.0003997683525085449, -0.0002709627151489258, -0.00014215707778930664, -1.33514404296875e-05, 0.00011545419692993164, 0.0002442598342895508, 0.0003730654716491699, 0.0005018711090087891, 0.0006306767463684082, 0.0007594823837280273, 0.0008882880210876465, 0.0010170936584472656, 0.0011458992958068848, 0.001274704933166504, 0.001403510570526123, 0.0015323162078857422, 0.0016611218452453613, 0.0017899274826049805, 0.0019187331199645996, 0.0020475387573242188, 0.002176344394683838, 0.002305150032043457, 0.002433955669403076, 0.0025627613067626953, 0.0026915669441223145, 0.0028203725814819336, 0.0029491782188415527, 0.003077983856201172, 0.003206789493560791, 0.00333559513092041, 0.0034644007682800293, 0.0035932064056396484, 0.0037220120429992676, 0.0038508176803588867, 0.003979623317718506, 0.004108428955078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 10.0, 14.0, 25.0, 57.0, 120.0, 323.0, 1345.0, 10185.0, 220968.0, 782419.0, 29598.0, 2669.0, 531.0, 178.0, 65.0, 31.0, 6.0, 10.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.421875, -22.879638671875, -22.33740234375, -21.795166015625, -21.2529296875, -20.710693359375, -20.16845703125, -19.626220703125, -19.083984375, -18.541748046875, -17.99951171875, -17.457275390625, -16.9150390625, -16.372802734375, -15.83056640625, -15.288330078125, -14.74609375, -14.203857421875, -13.66162109375, -13.119384765625, -12.5771484375, -12.034912109375, -11.49267578125, -10.950439453125, -10.408203125, -9.865966796875, -9.32373046875, -8.781494140625, -8.2392578125, -7.697021484375, -7.15478515625, -6.612548828125, -6.0703125, -5.528076171875, -4.98583984375, -4.443603515625, -3.9013671875, -3.359130859375, -2.81689453125, -2.274658203125, -1.732421875, -1.190185546875, -0.64794921875, -0.105712890625, 0.4365234375, 0.978759765625, 1.52099609375, 2.063232421875, 2.60546875, 3.147705078125, 3.68994140625, 4.232177734375, 4.7744140625, 5.316650390625, 5.85888671875, 6.401123046875, 6.943359375, 7.485595703125, 8.02783203125, 8.570068359375, 9.1123046875, 9.654541015625, 10.19677734375, 10.739013671875, 11.28125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 8.0, 8.0, 17.0, 12.0, 22.0, 23.0, 28.0, 36.0, 56.0, 59.0, 82.0, 92.0, 99.0, 89.0, 50.0, 69.0, 49.0, 57.0, 35.0, 25.0, 22.0, 14.0, 13.0, 5.0, 7.0, 6.0, 6.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.625, -9.291259765625, -8.95751953125, -8.623779296875, -8.2900390625, -7.956298828125, -7.62255859375, -7.288818359375, -6.955078125, -6.621337890625, -6.28759765625, -5.953857421875, -5.6201171875, -5.286376953125, -4.95263671875, -4.618896484375, -4.28515625, -3.951416015625, -3.61767578125, -3.283935546875, -2.9501953125, -2.616455078125, -2.28271484375, -1.948974609375, -1.615234375, -1.281494140625, -0.94775390625, -0.614013671875, -0.2802734375, 0.053466796875, 0.38720703125, 0.720947265625, 1.0546875, 1.388427734375, 1.72216796875, 2.055908203125, 2.3896484375, 2.723388671875, 3.05712890625, 3.390869140625, 3.724609375, 4.058349609375, 4.39208984375, 4.725830078125, 5.0595703125, 5.393310546875, 5.72705078125, 6.060791015625, 6.39453125, 6.728271484375, 7.06201171875, 7.395751953125, 7.7294921875, 8.063232421875, 8.39697265625, 8.730712890625, 9.064453125, 9.398193359375, 9.73193359375, 10.065673828125, 10.3994140625, 10.733154296875, 11.06689453125, 11.400634765625, 11.734375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 18.0, 40.0, 66.0, 179.0, 340.0, 167.0, 85.0, 48.0, 16.0, 8.0, 6.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-317.2515869140625, -308.0432434082031, -298.83489990234375, -289.6265869140625, -280.4182434082031, -271.20989990234375, -262.0015869140625, -252.79324340820312, -243.58489990234375, -234.37655639648438, -225.16822814941406, -215.95989990234375, -206.75155639648438, -197.543212890625, -188.3348846435547, -179.12655639648438, -169.918212890625, -160.70986938476562, -151.5015411376953, -142.293212890625, -133.08486938476562, -123.87653350830078, -114.66819763183594, -105.4598617553711, -96.25152587890625, -87.0431900024414, -77.83485412597656, -68.62651824951172, -59.418182373046875, -50.20984649658203, -41.00151062011719, -31.793174743652344, -22.5848388671875, -13.376502990722656, -4.1681671142578125, 5.040168762207031, 14.248504638671875, 23.45684051513672, 32.66517639160156, 41.873512268066406, 51.08184814453125, 60.290184020996094, 69.49851989746094, 78.70685577392578, 87.91519165039062, 97.12352752685547, 106.33186340332031, 115.54019927978516, 124.74853515625, 133.95687866210938, 143.1652069091797, 152.37353515625, 161.58187866210938, 170.79022216796875, 179.99855041503906, 189.20687866210938, 198.41522216796875, 207.62356567382812, 216.83189392089844, 226.04022216796875, 235.24856567382812, 244.4569091796875, 253.6652374267578, 262.8735656738281, 272.0819091796875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 11.0, 3.0, 8.0, 12.0, 11.0, 10.0, 15.0, 20.0, 15.0, 21.0, 26.0, 18.0, 30.0, 33.0, 31.0, 39.0, 41.0, 76.0, 93.0, 78.0, 49.0, 40.0, 33.0, 37.0, 29.0, 26.0, 29.0, 32.0, 21.0, 26.0, 9.0, 17.0, 17.0, 10.0, 7.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.8644561767578, -154.66317749023438, -149.46188354492188, -144.26060485839844, -139.059326171875, -133.85804748535156, -128.65676879882812, -123.45547485351562, -118.25419616699219, -113.05291748046875, -107.85163116455078, -102.65034484863281, -97.44906616210938, -92.24778747558594, -87.04650115966797, -81.84521484375, -76.64393615722656, -71.44265747070312, -66.24137115478516, -61.04008865356445, -55.83880615234375, -50.63752365112305, -45.436241149902344, -40.23495864868164, -35.03367614746094, -29.832393646240234, -24.63111114501953, -19.429828643798828, -14.228546142578125, -9.027263641357422, -3.8259811401367188, 1.3753013610839844, 6.576568603515625, 11.777851104736328, 16.97913360595703, 22.180416107177734, 27.381698608398438, 32.58298110961914, 37.784263610839844, 42.98554611206055, 48.18682861328125, 53.38811111450195, 58.589393615722656, 63.79067611694336, 68.99195861816406, 74.1932373046875, 79.39452362060547, 84.59580993652344, 89.79708862304688, 94.99836730957031, 100.19965362548828, 105.40093994140625, 110.60221862792969, 115.80349731445312, 121.0047836303711, 126.20606994628906, 131.4073486328125, 136.60862731933594, 141.80990600585938, 147.01119995117188, 152.2124786376953, 157.41375732421875, 162.61505126953125, 167.8163299560547, 173.01760864257812]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 5.0, 17.0, 16.0, 34.0, 42.0, 80.0, 104.0, 184.0, 312.0, 455.0, 805.0, 1295.0, 2513.0, 5324.0, 12711.0, 35323.0, 118160.0, 416128.0, 1368073.0, 1548904.0, 488988.0, 132822.0, 38364.0, 12314.0, 5114.0, 2510.0, 1385.0, 799.0, 518.0, 339.0, 226.0, 148.0, 96.0, 53.0, 50.0, 28.0, 21.0, 7.0, 4.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.1822509765625, -7.927001953125, -7.6717529296875, -7.41650390625, -7.1612548828125, -6.906005859375, -6.6507568359375, -6.3955078125, -6.1402587890625, -5.885009765625, -5.6297607421875, -5.37451171875, -5.1192626953125, -4.864013671875, -4.6087646484375, -4.353515625, -4.0982666015625, -3.843017578125, -3.5877685546875, -3.33251953125, -3.0772705078125, -2.822021484375, -2.5667724609375, -2.3115234375, -2.0562744140625, -1.801025390625, -1.5457763671875, -1.29052734375, -1.0352783203125, -0.780029296875, -0.5247802734375, -0.26953125, -0.0142822265625, 0.240966796875, 0.4962158203125, 0.75146484375, 1.0067138671875, 1.261962890625, 1.5172119140625, 1.7724609375, 2.0277099609375, 2.282958984375, 2.5382080078125, 2.79345703125, 3.0487060546875, 3.303955078125, 3.5592041015625, 3.814453125, 4.0697021484375, 4.324951171875, 4.5802001953125, 4.83544921875, 5.0906982421875, 5.345947265625, 5.6011962890625, 5.8564453125, 6.1116943359375, 6.366943359375, 6.6221923828125, 6.87744140625, 7.1326904296875, 7.387939453125, 7.6431884765625, 7.8984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 9.0, 3.0, 13.0, 10.0, 13.0, 12.0, 30.0, 20.0, 28.0, 27.0, 31.0, 31.0, 41.0, 39.0, 38.0, 43.0, 31.0, 48.0, 43.0, 46.0, 58.0, 43.0, 36.0, 36.0, 27.0, 28.0, 24.0, 36.0, 19.0, 18.0, 24.0, 16.0, 9.0, 15.0, 13.0, 9.0, 8.0, 1.0, 8.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0546875, -8.736083984375, -8.41748046875, -8.098876953125, -7.7802734375, -7.461669921875, -7.14306640625, -6.824462890625, -6.505859375, -6.187255859375, -5.86865234375, -5.550048828125, -5.2314453125, -4.912841796875, -4.59423828125, -4.275634765625, -3.95703125, -3.638427734375, -3.31982421875, -3.001220703125, -2.6826171875, -2.364013671875, -2.04541015625, -1.726806640625, -1.408203125, -1.089599609375, -0.77099609375, -0.452392578125, -0.1337890625, 0.184814453125, 0.50341796875, 0.822021484375, 1.140625, 1.459228515625, 1.77783203125, 2.096435546875, 2.4150390625, 2.733642578125, 3.05224609375, 3.370849609375, 3.689453125, 4.008056640625, 4.32666015625, 4.645263671875, 4.9638671875, 5.282470703125, 5.60107421875, 5.919677734375, 6.23828125, 6.556884765625, 6.87548828125, 7.194091796875, 7.5126953125, 7.831298828125, 8.14990234375, 8.468505859375, 8.787109375, 9.105712890625, 9.42431640625, 9.742919921875, 10.0615234375, 10.380126953125, 10.69873046875, 11.017333984375, 11.3359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 6.0, 7.0, 11.0, 19.0, 30.0, 63.0, 101.0, 236.0, 521.0, 1451.0, 5585.0, 47261.0, 3462076.0, 652643.0, 19251.0, 3343.0, 965.0, 355.0, 122.0, 75.0, 53.0, 34.0, 19.0, 9.0, 12.0, 7.0, 3.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.125, -33.052734375, -31.98046875, -30.908203125, -29.8359375, -28.763671875, -27.69140625, -26.619140625, -25.546875, -24.474609375, -23.40234375, -22.330078125, -21.2578125, -20.185546875, -19.11328125, -18.041015625, -16.96875, -15.896484375, -14.82421875, -13.751953125, -12.6796875, -11.607421875, -10.53515625, -9.462890625, -8.390625, -7.318359375, -6.24609375, -5.173828125, -4.1015625, -3.029296875, -1.95703125, -0.884765625, 0.1875, 1.259765625, 2.33203125, 3.404296875, 4.4765625, 5.548828125, 6.62109375, 7.693359375, 8.765625, 9.837890625, 10.91015625, 11.982421875, 13.0546875, 14.126953125, 15.19921875, 16.271484375, 17.34375, 18.416015625, 19.48828125, 20.560546875, 21.6328125, 22.705078125, 23.77734375, 24.849609375, 25.921875, 26.994140625, 28.06640625, 29.138671875, 30.2109375, 31.283203125, 32.35546875, 33.427734375, 34.5]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 13.0, 28.0, 38.0, 39.0, 62.0, 129.0, 237.0, 394.0, 719.0, 884.0, 643.0, 351.0, 203.0, 114.0, 54.0, 38.0, 28.0, 29.0, 8.0, 9.0, 11.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.984375, -26.220458984375, -25.45654296875, -24.692626953125, -23.9287109375, -23.164794921875, -22.40087890625, -21.636962890625, -20.873046875, -20.109130859375, -19.34521484375, -18.581298828125, -17.8173828125, -17.053466796875, -16.28955078125, -15.525634765625, -14.76171875, -13.997802734375, -13.23388671875, -12.469970703125, -11.7060546875, -10.942138671875, -10.17822265625, -9.414306640625, -8.650390625, -7.886474609375, -7.12255859375, -6.358642578125, -5.5947265625, -4.830810546875, -4.06689453125, -3.302978515625, -2.5390625, -1.775146484375, -1.01123046875, -0.247314453125, 0.5166015625, 1.280517578125, 2.04443359375, 2.808349609375, 3.572265625, 4.336181640625, 5.10009765625, 5.864013671875, 6.6279296875, 7.391845703125, 8.15576171875, 8.919677734375, 9.68359375, 10.447509765625, 11.21142578125, 11.975341796875, 12.7392578125, 13.503173828125, 14.26708984375, 15.031005859375, 15.794921875, 16.558837890625, 17.32275390625, 18.086669921875, 18.8505859375, 19.614501953125, 20.37841796875, 21.142333984375, 21.90625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 12.0, 7.0, 21.0, 31.0, 60.0, 78.0, 137.0, 173.0, 159.0, 119.0, 70.0, 47.0, 35.0, 16.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.80923461914062, -167.7176513671875, -162.62608337402344, -157.5345001220703, -152.44293212890625, -147.35134887695312, -142.25978088378906, -137.16819763183594, -132.07662963867188, -126.98505401611328, -121.89347839355469, -116.8019027709961, -111.7103271484375, -106.61874389648438, -101.52716827392578, -96.43559265136719, -91.34400939941406, -86.25243377685547, -81.16085815429688, -76.06928253173828, -70.97770690917969, -65.88612365722656, -60.79454803466797, -55.702972412109375, -50.61139678955078, -45.51982116699219, -40.428245544433594, -35.336666107177734, -30.24509048461914, -25.153514862060547, -20.06193733215332, -14.970359802246094, -9.878799438476562, -4.787222862243652, 0.3043537139892578, 5.395930290222168, 10.487506866455078, 15.579082489013672, 20.6706600189209, 25.762237548828125, 30.85381317138672, 35.94538879394531, 41.036964416503906, 46.128543853759766, 51.22011947631836, 56.31169509887695, 61.40327453613281, 66.4948501586914, 71.58642578125, 76.6780014038086, 81.76957702636719, 86.86115264892578, 91.95272827148438, 97.0443115234375, 102.1358871459961, 107.22746276855469, 112.31903839111328, 117.41061401367188, 122.50218963623047, 127.59376525878906, 132.6853485107422, 137.77691650390625, 142.86849975585938, 147.9600830078125, 153.05165100097656]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 13.0, 11.0, 15.0, 14.0, 13.0, 24.0, 20.0, 29.0, 26.0, 44.0, 41.0, 40.0, 53.0, 40.0, 60.0, 46.0, 44.0, 56.0, 51.0, 51.0, 29.0, 36.0, 37.0, 34.0, 17.0, 25.0, 23.0, 13.0, 18.0, 13.0, 10.0, 9.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-95.15423583984375, -91.95326232910156, -88.75228118896484, -85.55130004882812, -82.35032653808594, -79.14935302734375, -75.94837188720703, -72.74739074707031, -69.54641723632812, -66.34544372558594, -63.14446258544922, -59.943485260009766, -56.74250793457031, -53.54153060913086, -50.340553283691406, -47.13957595825195, -43.9385986328125, -40.73762130737305, -37.536643981933594, -34.33566665649414, -31.134689331054688, -27.933712005615234, -24.73273468017578, -21.531757354736328, -18.330780029296875, -15.129802703857422, -11.928825378417969, -8.727848052978516, -5.5268707275390625, -2.3258934020996094, 0.8750839233398438, 4.076061248779297, 7.27703857421875, 10.478015899658203, 13.678993225097656, 16.87997055053711, 20.080947875976562, 23.281925201416016, 26.48290252685547, 29.683879852294922, 32.884857177734375, 36.08583450317383, 39.28681182861328, 42.487789154052734, 45.68876647949219, 48.88974380493164, 52.090721130371094, 55.29169845581055, 58.49267578125, 61.69365310668945, 64.8946304321289, 68.09561157226562, 71.29658508300781, 74.49755859375, 77.69853973388672, 80.89952087402344, 84.10049438476562, 87.30146789550781, 90.50244903564453, 93.70343017578125, 96.90440368652344, 100.10537719726562, 103.30635833740234, 106.50733947753906, 109.70831298828125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 13.0, 18.0, 27.0, 25.0, 53.0, 70.0, 111.0, 180.0, 247.0, 384.0, 601.0, 949.0, 1464.0, 2340.0, 3931.0, 6687.0, 11754.0, 20933.0, 38684.0, 74060.0, 142609.0, 253529.0, 227047.0, 122119.0, 63592.0, 33553.0, 17964.0, 10357.0, 5921.0, 3542.0, 2124.0, 1270.0, 850.0, 529.0, 349.0, 237.0, 153.0, 91.0, 72.0, 34.0, 29.0, 17.0, 13.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.484375, -10.155517578125, -9.82666015625, -9.497802734375, -9.1689453125, -8.840087890625, -8.51123046875, -8.182373046875, -7.853515625, -7.524658203125, -7.19580078125, -6.866943359375, -6.5380859375, -6.209228515625, -5.88037109375, -5.551513671875, -5.22265625, -4.893798828125, -4.56494140625, -4.236083984375, -3.9072265625, -3.578369140625, -3.24951171875, -2.920654296875, -2.591796875, -2.262939453125, -1.93408203125, -1.605224609375, -1.2763671875, -0.947509765625, -0.61865234375, -0.289794921875, 0.0390625, 0.367919921875, 0.69677734375, 1.025634765625, 1.3544921875, 1.683349609375, 2.01220703125, 2.341064453125, 2.669921875, 2.998779296875, 3.32763671875, 3.656494140625, 3.9853515625, 4.314208984375, 4.64306640625, 4.971923828125, 5.30078125, 5.629638671875, 5.95849609375, 6.287353515625, 6.6162109375, 6.945068359375, 7.27392578125, 7.602783203125, 7.931640625, 8.260498046875, 8.58935546875, 8.918212890625, 9.2470703125, 9.575927734375, 9.90478515625, 10.233642578125, 10.5625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 5.0, 3.0, 7.0, 3.0, 10.0, 13.0, 15.0, 15.0, 24.0, 23.0, 26.0, 34.0, 37.0, 33.0, 34.0, 41.0, 52.0, 44.0, 53.0, 40.0, 48.0, 42.0, 41.0, 41.0, 41.0, 38.0, 36.0, 32.0, 31.0, 26.0, 19.0, 18.0, 14.0, 7.0, 14.0, 6.0, 9.0, 0.0, 7.0, 6.0, 8.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.375, -10.03759765625, -9.7001953125, -9.36279296875, -9.025390625, -8.68798828125, -8.3505859375, -8.01318359375, -7.67578125, -7.33837890625, -7.0009765625, -6.66357421875, -6.326171875, -5.98876953125, -5.6513671875, -5.31396484375, -4.9765625, -4.63916015625, -4.3017578125, -3.96435546875, -3.626953125, -3.28955078125, -2.9521484375, -2.61474609375, -2.27734375, -1.93994140625, -1.6025390625, -1.26513671875, -0.927734375, -0.59033203125, -0.2529296875, 0.08447265625, 0.421875, 0.75927734375, 1.0966796875, 1.43408203125, 1.771484375, 2.10888671875, 2.4462890625, 2.78369140625, 3.12109375, 3.45849609375, 3.7958984375, 4.13330078125, 4.470703125, 4.80810546875, 5.1455078125, 5.48291015625, 5.8203125, 6.15771484375, 6.4951171875, 6.83251953125, 7.169921875, 7.50732421875, 7.8447265625, 8.18212890625, 8.51953125, 8.85693359375, 9.1943359375, 9.53173828125, 9.869140625, 10.20654296875, 10.5439453125, 10.88134765625, 11.21875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 8.0, 6.0, 7.0, 8.0, 19.0, 14.0, 17.0, 29.0, 42.0, 44.0, 49.0, 80.0, 154.0, 174.0, 317.0, 500.0, 936.0, 2047.0, 4886.0, 16295.0, 76843.0, 681233.0, 214195.0, 35303.0, 8844.0, 3151.0, 1327.0, 713.0, 393.0, 248.0, 181.0, 134.0, 97.0, 65.0, 45.0, 42.0, 28.0, 21.0, 17.0, 9.0, 8.0, 5.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.796875, -29.85693359375, -28.9169921875, -27.97705078125, -27.037109375, -26.09716796875, -25.1572265625, -24.21728515625, -23.27734375, -22.33740234375, -21.3974609375, -20.45751953125, -19.517578125, -18.57763671875, -17.6376953125, -16.69775390625, -15.7578125, -14.81787109375, -13.8779296875, -12.93798828125, -11.998046875, -11.05810546875, -10.1181640625, -9.17822265625, -8.23828125, -7.29833984375, -6.3583984375, -5.41845703125, -4.478515625, -3.53857421875, -2.5986328125, -1.65869140625, -0.71875, 0.22119140625, 1.1611328125, 2.10107421875, 3.041015625, 3.98095703125, 4.9208984375, 5.86083984375, 6.80078125, 7.74072265625, 8.6806640625, 9.62060546875, 10.560546875, 11.50048828125, 12.4404296875, 13.38037109375, 14.3203125, 15.26025390625, 16.2001953125, 17.14013671875, 18.080078125, 19.02001953125, 19.9599609375, 20.89990234375, 21.83984375, 22.77978515625, 23.7197265625, 24.65966796875, 25.599609375, 26.53955078125, 27.4794921875, 28.41943359375, 29.359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 3.0, 0.0, 12.0, 16.0, 18.0, 14.0, 25.0, 23.0, 31.0, 43.0, 35.0, 48.0, 44.0, 55.0, 57.0, 53.0, 70.0, 67.0, 57.0, 47.0, 50.0, 32.0, 32.0, 25.0, 21.0, 14.0, 15.0, 17.0, 13.0, 9.0, 9.0, 5.0, 8.0, 6.0, 1.0, 0.0, 5.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.65625, -41.26806640625, -39.8798828125, -38.49169921875, -37.103515625, -35.71533203125, -34.3271484375, -32.93896484375, -31.55078125, -30.16259765625, -28.7744140625, -27.38623046875, -25.998046875, -24.60986328125, -23.2216796875, -21.83349609375, -20.4453125, -19.05712890625, -17.6689453125, -16.28076171875, -14.892578125, -13.50439453125, -12.1162109375, -10.72802734375, -9.33984375, -7.95166015625, -6.5634765625, -5.17529296875, -3.787109375, -2.39892578125, -1.0107421875, 0.37744140625, 1.765625, 3.15380859375, 4.5419921875, 5.93017578125, 7.318359375, 8.70654296875, 10.0947265625, 11.48291015625, 12.87109375, 14.25927734375, 15.6474609375, 17.03564453125, 18.423828125, 19.81201171875, 21.2001953125, 22.58837890625, 23.9765625, 25.36474609375, 26.7529296875, 28.14111328125, 29.529296875, 30.91748046875, 32.3056640625, 33.69384765625, 35.08203125, 36.47021484375, 37.8583984375, 39.24658203125, 40.634765625, 42.02294921875, 43.4111328125, 44.79931640625, 46.1875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 3.0, 6.0, 7.0, 7.0, 6.0, 10.0, 14.0, 38.0, 51.0, 83.0, 205.0, 366.0, 822.0, 2189.0, 7326.0, 37496.0, 605498.0, 350684.0, 33487.0, 6727.0, 2000.0, 710.0, 370.0, 182.0, 92.0, 40.0, 38.0, 20.0, 20.0, 11.0, 13.0, 14.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6015625, -10.20849609375, -9.8154296875, -9.42236328125, -9.029296875, -8.63623046875, -8.2431640625, -7.85009765625, -7.45703125, -7.06396484375, -6.6708984375, -6.27783203125, -5.884765625, -5.49169921875, -5.0986328125, -4.70556640625, -4.3125, -3.91943359375, -3.5263671875, -3.13330078125, -2.740234375, -2.34716796875, -1.9541015625, -1.56103515625, -1.16796875, -0.77490234375, -0.3818359375, 0.01123046875, 0.404296875, 0.79736328125, 1.1904296875, 1.58349609375, 1.9765625, 2.36962890625, 2.7626953125, 3.15576171875, 3.548828125, 3.94189453125, 4.3349609375, 4.72802734375, 5.12109375, 5.51416015625, 5.9072265625, 6.30029296875, 6.693359375, 7.08642578125, 7.4794921875, 7.87255859375, 8.265625, 8.65869140625, 9.0517578125, 9.44482421875, 9.837890625, 10.23095703125, 10.6240234375, 11.01708984375, 11.41015625, 11.80322265625, 12.1962890625, 12.58935546875, 12.982421875, 13.37548828125, 13.7685546875, 14.16162109375, 14.5546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 9.0, 1.0, 3.0, 6.0, 8.0, 11.0, 13.0, 11.0, 18.0, 20.0, 32.0, 42.0, 45.0, 51.0, 75.0, 97.0, 113.0, 100.0, 66.0, 44.0, 50.0, 37.0, 30.0, 22.0, 19.0, 11.0, 12.0, 9.0, 10.0, 5.0, 6.0, 3.0, 1.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0020294189453125, -0.0019556283950805664, -0.0018818378448486328, -0.0018080472946166992, -0.0017342567443847656, -0.001660466194152832, -0.0015866756439208984, -0.0015128850936889648, -0.0014390945434570312, -0.0013653039932250977, -0.001291513442993164, -0.0012177228927612305, -0.0011439323425292969, -0.0010701417922973633, -0.0009963512420654297, -0.0009225606918334961, -0.0008487701416015625, -0.0007749795913696289, -0.0007011890411376953, -0.0006273984909057617, -0.0005536079406738281, -0.00047981739044189453, -0.00040602684020996094, -0.00033223628997802734, -0.00025844573974609375, -0.00018465518951416016, -0.00011086463928222656, -3.707408905029297e-05, 3.6716461181640625e-05, 0.00011050701141357422, 0.0001842975616455078, 0.0002580881118774414, 0.000331878662109375, 0.0004056692123413086, 0.0004794597625732422, 0.0005532503128051758, 0.0006270408630371094, 0.000700831413269043, 0.0007746219635009766, 0.0008484125137329102, 0.0009222030639648438, 0.0009959936141967773, 0.001069784164428711, 0.0011435747146606445, 0.0012173652648925781, 0.0012911558151245117, 0.0013649463653564453, 0.001438736915588379, 0.0015125274658203125, 0.001586318016052246, 0.0016601085662841797, 0.0017338991165161133, 0.0018076896667480469, 0.0018814802169799805, 0.001955270767211914, 0.0020290613174438477, 0.0021028518676757812, 0.002176642417907715, 0.0022504329681396484, 0.002324223518371582, 0.0023980140686035156, 0.0024718046188354492, 0.002545595169067383, 0.0026193857192993164, 0.00269317626953125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 5.0, 17.0, 10.0, 28.0, 43.0, 51.0, 117.0, 274.0, 573.0, 1691.0, 5443.0, 28923.0, 642965.0, 336851.0, 24257.0, 4739.0, 1400.0, 607.0, 245.0, 120.0, 58.0, 45.0, 14.0, 14.0, 13.0, 5.0, 4.0, 7.0, 4.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.671875, -13.2440185546875, -12.816162109375, -12.3883056640625, -11.96044921875, -11.5325927734375, -11.104736328125, -10.6768798828125, -10.2490234375, -9.8211669921875, -9.393310546875, -8.9654541015625, -8.53759765625, -8.1097412109375, -7.681884765625, -7.2540283203125, -6.826171875, -6.3983154296875, -5.970458984375, -5.5426025390625, -5.11474609375, -4.6868896484375, -4.259033203125, -3.8311767578125, -3.4033203125, -2.9754638671875, -2.547607421875, -2.1197509765625, -1.69189453125, -1.2640380859375, -0.836181640625, -0.4083251953125, 0.01953125, 0.4473876953125, 0.875244140625, 1.3031005859375, 1.73095703125, 2.1588134765625, 2.586669921875, 3.0145263671875, 3.4423828125, 3.8702392578125, 4.298095703125, 4.7259521484375, 5.15380859375, 5.5816650390625, 6.009521484375, 6.4373779296875, 6.865234375, 7.2930908203125, 7.720947265625, 8.1488037109375, 8.57666015625, 9.0045166015625, 9.432373046875, 9.8602294921875, 10.2880859375, 10.7159423828125, 11.143798828125, 11.5716552734375, 11.99951171875, 12.4273681640625, 12.855224609375, 13.2830810546875, 13.7109375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 7.0, 9.0, 9.0, 22.0, 24.0, 36.0, 73.0, 89.0, 156.0, 145.0, 118.0, 106.0, 66.0, 43.0, 28.0, 18.0, 18.0, 9.0, 4.0, 7.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.7578125, -14.330322265625, -13.90283203125, -13.475341796875, -13.0478515625, -12.620361328125, -12.19287109375, -11.765380859375, -11.337890625, -10.910400390625, -10.48291015625, -10.055419921875, -9.6279296875, -9.200439453125, -8.77294921875, -8.345458984375, -7.91796875, -7.490478515625, -7.06298828125, -6.635498046875, -6.2080078125, -5.780517578125, -5.35302734375, -4.925537109375, -4.498046875, -4.070556640625, -3.64306640625, -3.215576171875, -2.7880859375, -2.360595703125, -1.93310546875, -1.505615234375, -1.078125, -0.650634765625, -0.22314453125, 0.204345703125, 0.6318359375, 1.059326171875, 1.48681640625, 1.914306640625, 2.341796875, 2.769287109375, 3.19677734375, 3.624267578125, 4.0517578125, 4.479248046875, 4.90673828125, 5.334228515625, 5.76171875, 6.189208984375, 6.61669921875, 7.044189453125, 7.4716796875, 7.899169921875, 8.32666015625, 8.754150390625, 9.181640625, 9.609130859375, 10.03662109375, 10.464111328125, 10.8916015625, 11.319091796875, 11.74658203125, 12.174072265625, 12.6015625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 19.0, 65.0, 109.0, 296.0, 204.0, 117.0, 83.0, 39.0, 21.0, 11.0, 8.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.73393249511719, -88.57861328125, -80.42330169677734, -72.26799011230469, -64.1126708984375, -55.95735549926758, -47.802040100097656, -39.646724700927734, -31.491409301757812, -23.33609390258789, -15.180778503417969, -7.025463104248047, 1.129852294921875, 9.285167694091797, 17.44048309326172, 25.59579849243164, 33.75111389160156, 41.906429290771484, 50.061744689941406, 58.21706008911133, 66.37237548828125, 74.52769470214844, 82.6830062866211, 90.83831787109375, 98.99363708496094, 107.14895629882812, 115.30426788330078, 123.45957946777344, 131.61489868164062, 139.7702178955078, 147.925537109375, 156.08084106445312, 164.23614501953125, 172.39146423339844, 180.54678344726562, 188.70208740234375, 196.85740661621094, 205.01272583007812, 213.16802978515625, 221.32334899902344, 229.47866821289062, 237.6339874267578, 245.789306640625, 253.94461059570312, 262.09991455078125, 270.2552490234375, 278.4105529785156, 286.5658874511719, 294.72119140625, 302.8764953613281, 311.0318298339844, 319.1871337890625, 327.34246826171875, 335.4977722167969, 343.653076171875, 351.80841064453125, 359.9637145996094, 368.1190185546875, 376.27435302734375, 384.4296569824219, 392.5849609375, 400.74029541015625, 408.8955993652344, 417.0509338378906, 425.20623779296875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 8.0, 7.0, 5.0, 13.0, 17.0, 20.0, 11.0, 17.0, 35.0, 20.0, 30.0, 33.0, 41.0, 39.0, 63.0, 108.0, 135.0, 73.0, 40.0, 42.0, 35.0, 38.0, 31.0, 26.0, 18.0, 21.0, 19.0, 9.0, 12.0, 12.0, 2.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.61378479003906, -164.01463317871094, -158.4154815673828, -152.81631469726562, -147.2171630859375, -141.61801147460938, -136.01885986328125, -130.41970825195312, -124.82054901123047, -119.22139739990234, -113.62223815917969, -108.02308654785156, -102.42393493652344, -96.82477569580078, -91.22562408447266, -85.62646484375, -80.02731323242188, -74.42816162109375, -68.8290023803711, -63.22985076904297, -57.63069534301758, -52.03153991699219, -46.43238830566406, -40.83323287963867, -35.23407745361328, -29.63492202758789, -24.035768508911133, -18.436614990234375, -12.837459564208984, -7.238304138183594, -1.6391525268554688, 3.960002899169922, 9.559173583984375, 15.15832805633545, 20.757482528686523, 26.35663604736328, 31.955791473388672, 37.55494689941406, 43.15409851074219, 48.75325393676758, 54.35240936279297, 59.95156478881836, 65.55072021484375, 71.14987182617188, 76.7490234375, 82.34818267822266, 87.94733428955078, 93.54649353027344, 99.14564514160156, 104.74479675292969, 110.34395599365234, 115.94310760498047, 121.54226684570312, 127.14141845703125, 132.74057006835938, 138.3397216796875, 143.93887329101562, 149.53802490234375, 155.13717651367188, 160.736328125, 166.3354949951172, 171.9346466064453, 177.53379821777344, 183.13294982910156, 188.73211669921875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 6.0, 8.0, 9.0, 12.0, 26.0, 31.0, 26.0, 42.0, 68.0, 90.0, 158.0, 232.0, 313.0, 516.0, 777.0, 1242.0, 2089.0, 3663.0, 6584.0, 14013.0, 33963.0, 93146.0, 298237.0, 910834.0, 1633055.0, 803492.0, 254210.0, 80255.0, 29587.0, 12496.0, 6267.0, 3366.0, 1934.0, 1237.0, 781.0, 464.0, 338.0, 203.0, 145.0, 105.0, 88.0, 50.0, 37.0, 25.0, 18.0, 16.0, 12.0, 7.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4140625, -8.16241455078125, -7.9107666015625, -7.65911865234375, -7.407470703125, -7.15582275390625, -6.9041748046875, -6.65252685546875, -6.40087890625, -6.14923095703125, -5.8975830078125, -5.64593505859375, -5.394287109375, -5.14263916015625, -4.8909912109375, -4.63934326171875, -4.3876953125, -4.13604736328125, -3.8843994140625, -3.63275146484375, -3.381103515625, -3.12945556640625, -2.8778076171875, -2.62615966796875, -2.37451171875, -2.12286376953125, -1.8712158203125, -1.61956787109375, -1.367919921875, -1.11627197265625, -0.8646240234375, -0.61297607421875, -0.361328125, -0.10968017578125, 0.1419677734375, 0.39361572265625, 0.645263671875, 0.89691162109375, 1.1485595703125, 1.40020751953125, 1.65185546875, 1.90350341796875, 2.1551513671875, 2.40679931640625, 2.658447265625, 2.91009521484375, 3.1617431640625, 3.41339111328125, 3.6650390625, 3.91668701171875, 4.1683349609375, 4.41998291015625, 4.671630859375, 4.92327880859375, 5.1749267578125, 5.42657470703125, 5.67822265625, 5.92987060546875, 6.1815185546875, 6.43316650390625, 6.684814453125, 6.93646240234375, 7.1881103515625, 7.43975830078125, 7.69140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 5.0, 8.0, 12.0, 9.0, 17.0, 29.0, 19.0, 20.0, 26.0, 35.0, 43.0, 43.0, 51.0, 39.0, 44.0, 35.0, 55.0, 48.0, 34.0, 43.0, 46.0, 50.0, 36.0, 37.0, 30.0, 30.0, 32.0, 26.0, 21.0, 10.0, 16.0, 12.0, 4.0, 5.0, 3.0, 5.0, 0.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.53125, -11.191650390625, -10.85205078125, -10.512451171875, -10.1728515625, -9.833251953125, -9.49365234375, -9.154052734375, -8.814453125, -8.474853515625, -8.13525390625, -7.795654296875, -7.4560546875, -7.116455078125, -6.77685546875, -6.437255859375, -6.09765625, -5.758056640625, -5.41845703125, -5.078857421875, -4.7392578125, -4.399658203125, -4.06005859375, -3.720458984375, -3.380859375, -3.041259765625, -2.70166015625, -2.362060546875, -2.0224609375, -1.682861328125, -1.34326171875, -1.003662109375, -0.6640625, -0.324462890625, 0.01513671875, 0.354736328125, 0.6943359375, 1.033935546875, 1.37353515625, 1.713134765625, 2.052734375, 2.392333984375, 2.73193359375, 3.071533203125, 3.4111328125, 3.750732421875, 4.09033203125, 4.429931640625, 4.76953125, 5.109130859375, 5.44873046875, 5.788330078125, 6.1279296875, 6.467529296875, 6.80712890625, 7.146728515625, 7.486328125, 7.825927734375, 8.16552734375, 8.505126953125, 8.8447265625, 9.184326171875, 9.52392578125, 9.863525390625, 10.203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 8.0, 11.0, 15.0, 25.0, 30.0, 45.0, 89.0, 153.0, 321.0, 849.0, 3026.0, 19501.0, 696808.0, 3424332.0, 42365.0, 4748.0, 1124.0, 393.0, 169.0, 106.0, 60.0, 28.0, 21.0, 11.0, 11.0, 11.0, 7.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.52099609375, -38.2919921875, -37.06298828125, -35.833984375, -34.60498046875, -33.3759765625, -32.14697265625, -30.91796875, -29.68896484375, -28.4599609375, -27.23095703125, -26.001953125, -24.77294921875, -23.5439453125, -22.31494140625, -21.0859375, -19.85693359375, -18.6279296875, -17.39892578125, -16.169921875, -14.94091796875, -13.7119140625, -12.48291015625, -11.25390625, -10.02490234375, -8.7958984375, -7.56689453125, -6.337890625, -5.10888671875, -3.8798828125, -2.65087890625, -1.421875, -0.19287109375, 1.0361328125, 2.26513671875, 3.494140625, 4.72314453125, 5.9521484375, 7.18115234375, 8.41015625, 9.63916015625, 10.8681640625, 12.09716796875, 13.326171875, 14.55517578125, 15.7841796875, 17.01318359375, 18.2421875, 19.47119140625, 20.7001953125, 21.92919921875, 23.158203125, 24.38720703125, 25.6162109375, 26.84521484375, 28.07421875, 29.30322265625, 30.5322265625, 31.76123046875, 32.990234375, 34.21923828125, 35.4482421875, 36.67724609375, 37.90625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 4.0, 5.0, 16.0, 18.0, 16.0, 40.0, 47.0, 87.0, 118.0, 140.0, 265.0, 551.0, 785.0, 776.0, 490.0, 283.0, 150.0, 101.0, 42.0, 40.0, 22.0, 9.0, 14.0, 17.0, 11.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.59375, -26.757080078125, -25.92041015625, -25.083740234375, -24.2470703125, -23.410400390625, -22.57373046875, -21.737060546875, -20.900390625, -20.063720703125, -19.22705078125, -18.390380859375, -17.5537109375, -16.717041015625, -15.88037109375, -15.043701171875, -14.20703125, -13.370361328125, -12.53369140625, -11.697021484375, -10.8603515625, -10.023681640625, -9.18701171875, -8.350341796875, -7.513671875, -6.677001953125, -5.84033203125, -5.003662109375, -4.1669921875, -3.330322265625, -2.49365234375, -1.656982421875, -0.8203125, 0.016357421875, 0.85302734375, 1.689697265625, 2.5263671875, 3.363037109375, 4.19970703125, 5.036376953125, 5.873046875, 6.709716796875, 7.54638671875, 8.383056640625, 9.2197265625, 10.056396484375, 10.89306640625, 11.729736328125, 12.56640625, 13.403076171875, 14.23974609375, 15.076416015625, 15.9130859375, 16.749755859375, 17.58642578125, 18.423095703125, 19.259765625, 20.096435546875, 20.93310546875, 21.769775390625, 22.6064453125, 23.443115234375, 24.27978515625, 25.116455078125, 25.953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 11.0, 18.0, 24.0, 59.0, 161.0, 335.0, 251.0, 93.0, 30.0, 10.0, 7.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-622.8569946289062, -610.606201171875, -598.3554077148438, -586.1046142578125, -573.8538818359375, -561.6030883789062, -549.352294921875, -537.1015014648438, -524.8507080078125, -512.5999145507812, -500.3491516113281, -488.0983581542969, -475.8475646972656, -463.5967712402344, -451.34600830078125, -439.09521484375, -426.84442138671875, -414.5936279296875, -402.3428649902344, -390.0920715332031, -377.8412780761719, -365.5904846191406, -353.3397216796875, -341.08892822265625, -328.8381652832031, -316.5873718261719, -304.33660888671875, -292.0858154296875, -279.83502197265625, -267.584228515625, -255.33346557617188, -243.08267211914062, -230.83187866210938, -218.5811004638672, -206.33030700683594, -194.07952880859375, -181.8287353515625, -169.5779571533203, -157.32717895507812, -145.07638549804688, -132.82559204101562, -120.5748062133789, -108.32402038574219, -96.0732421875, -83.82244873046875, -71.57167053222656, -59.320884704589844, -47.070098876953125, -34.81932067871094, -22.56853485107422, -10.317750930786133, 1.9330329895019531, 14.183818817138672, 26.43460464477539, 38.685386657714844, 50.93617248535156, 63.18695831298828, 75.437744140625, 87.68852996826172, 99.93931579589844, 112.19009399414062, 124.44088745117188, 136.69166564941406, 148.94244384765625, 161.1932373046875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 7.0, 10.0, 15.0, 14.0, 23.0, 22.0, 38.0, 23.0, 32.0, 31.0, 35.0, 31.0, 31.0, 43.0, 31.0, 32.0, 42.0, 28.0, 39.0, 38.0, 42.0, 40.0, 34.0, 42.0, 27.0, 28.0, 34.0, 24.0, 19.0, 21.0, 23.0, 15.0, 16.0, 7.0, 12.0, 6.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0], "bins": [-118.93392944335938, -115.521240234375, -112.10855865478516, -108.69586944580078, -105.2831802368164, -101.87049865722656, -98.45780944824219, -95.04512023925781, -91.63243103027344, -88.21974182128906, -84.80706024169922, -81.39437103271484, -77.98168182373047, -74.56900024414062, -71.15631103515625, -67.74362182617188, -64.33094024658203, -60.91825485229492, -57.50556564331055, -54.09288024902344, -50.68019104003906, -47.26750564575195, -43.854820251464844, -40.44213104248047, -37.02944564819336, -33.61676025390625, -30.204071044921875, -26.791385650634766, -23.378698348999023, -19.96601104736328, -16.553325653076172, -13.14063835144043, -9.727951049804688, -6.3152642250061035, -2.9025774002075195, 0.5101089477539062, 3.9227962493896484, 7.335483551025391, 10.7481689453125, 14.160856246948242, 17.573543548583984, 20.986230850219727, 24.39891815185547, 27.811603546142578, 31.22429084777832, 34.63697814941406, 38.04966354370117, 41.46234893798828, 44.875038146972656, 48.287723541259766, 51.70041275024414, 55.11309814453125, 58.525787353515625, 61.938472747802734, 65.35115814208984, 68.76384735107422, 72.17652893066406, 75.58921813964844, 79.00189971923828, 82.41458892822266, 85.82727813720703, 89.23995971679688, 92.65264892578125, 96.06533813476562, 99.47802734375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 9.0, 16.0, 20.0, 24.0, 30.0, 63.0, 101.0, 122.0, 213.0, 341.0, 466.0, 860.0, 1341.0, 2370.0, 4134.0, 7781.0, 15640.0, 34214.0, 82019.0, 217106.0, 378406.0, 176944.0, 67951.0, 28970.0, 13509.0, 6775.0, 3705.0, 2107.0, 1269.0, 730.0, 433.0, 288.0, 187.0, 117.0, 73.0, 65.0, 31.0, 28.0, 29.0, 15.0, 9.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.3359375, -14.8314208984375, -14.326904296875, -13.8223876953125, -13.31787109375, -12.8133544921875, -12.308837890625, -11.8043212890625, -11.2998046875, -10.7952880859375, -10.290771484375, -9.7862548828125, -9.28173828125, -8.7772216796875, -8.272705078125, -7.7681884765625, -7.263671875, -6.7591552734375, -6.254638671875, -5.7501220703125, -5.24560546875, -4.7410888671875, -4.236572265625, -3.7320556640625, -3.2275390625, -2.7230224609375, -2.218505859375, -1.7139892578125, -1.20947265625, -0.7049560546875, -0.200439453125, 0.3040771484375, 0.80859375, 1.3131103515625, 1.817626953125, 2.3221435546875, 2.82666015625, 3.3311767578125, 3.835693359375, 4.3402099609375, 4.8447265625, 5.3492431640625, 5.853759765625, 6.3582763671875, 6.86279296875, 7.3673095703125, 7.871826171875, 8.3763427734375, 8.880859375, 9.3853759765625, 9.889892578125, 10.3944091796875, 10.89892578125, 11.4034423828125, 11.907958984375, 12.4124755859375, 12.9169921875, 13.4215087890625, 13.926025390625, 14.4305419921875, 14.93505859375, 15.4395751953125, 15.944091796875, 16.4486083984375, 16.953125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 6.0, 4.0, 3.0, 9.0, 9.0, 7.0, 17.0, 18.0, 19.0, 25.0, 16.0, 23.0, 32.0, 37.0, 35.0, 48.0, 44.0, 43.0, 35.0, 41.0, 41.0, 43.0, 40.0, 40.0, 39.0, 54.0, 33.0, 42.0, 31.0, 24.0, 21.0, 22.0, 13.0, 22.0, 12.0, 9.0, 7.0, 8.0, 9.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.7244873046875, -9.394287109375, -9.0640869140625, -8.73388671875, -8.4036865234375, -8.073486328125, -7.7432861328125, -7.4130859375, -7.0828857421875, -6.752685546875, -6.4224853515625, -6.09228515625, -5.7620849609375, -5.431884765625, -5.1016845703125, -4.771484375, -4.4412841796875, -4.111083984375, -3.7808837890625, -3.45068359375, -3.1204833984375, -2.790283203125, -2.4600830078125, -2.1298828125, -1.7996826171875, -1.469482421875, -1.1392822265625, -0.80908203125, -0.4788818359375, -0.148681640625, 0.1815185546875, 0.51171875, 0.8419189453125, 1.172119140625, 1.5023193359375, 1.83251953125, 2.1627197265625, 2.492919921875, 2.8231201171875, 3.1533203125, 3.4835205078125, 3.813720703125, 4.1439208984375, 4.47412109375, 4.8043212890625, 5.134521484375, 5.4647216796875, 5.794921875, 6.1251220703125, 6.455322265625, 6.7855224609375, 7.11572265625, 7.4459228515625, 7.776123046875, 8.1063232421875, 8.4365234375, 8.7667236328125, 9.096923828125, 9.4271240234375, 9.75732421875, 10.0875244140625, 10.417724609375, 10.7479248046875, 11.078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 2.0, 3.0, 8.0, 9.0, 15.0, 10.0, 25.0, 29.0, 44.0, 59.0, 62.0, 98.0, 161.0, 213.0, 342.0, 545.0, 1020.0, 2074.0, 5647.0, 25555.0, 272875.0, 691043.0, 36257.0, 7021.0, 2424.0, 1167.0, 639.0, 395.0, 239.0, 142.0, 122.0, 77.0, 63.0, 52.0, 32.0, 21.0, 20.0, 9.0, 11.0, 2.0, 5.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-34.6875, -33.53466796875, -32.3818359375, -31.22900390625, -30.076171875, -28.92333984375, -27.7705078125, -26.61767578125, -25.46484375, -24.31201171875, -23.1591796875, -22.00634765625, -20.853515625, -19.70068359375, -18.5478515625, -17.39501953125, -16.2421875, -15.08935546875, -13.9365234375, -12.78369140625, -11.630859375, -10.47802734375, -9.3251953125, -8.17236328125, -7.01953125, -5.86669921875, -4.7138671875, -3.56103515625, -2.408203125, -1.25537109375, -0.1025390625, 1.05029296875, 2.203125, 3.35595703125, 4.5087890625, 5.66162109375, 6.814453125, 7.96728515625, 9.1201171875, 10.27294921875, 11.42578125, 12.57861328125, 13.7314453125, 14.88427734375, 16.037109375, 17.18994140625, 18.3427734375, 19.49560546875, 20.6484375, 21.80126953125, 22.9541015625, 24.10693359375, 25.259765625, 26.41259765625, 27.5654296875, 28.71826171875, 29.87109375, 31.02392578125, 32.1767578125, 33.32958984375, 34.482421875, 35.63525390625, 36.7880859375, 37.94091796875, 39.09375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 8.0, 16.0, 17.0, 23.0, 37.0, 30.0, 45.0, 49.0, 67.0, 49.0, 79.0, 61.0, 55.0, 73.0, 62.0, 52.0, 52.0, 36.0, 29.0, 32.0, 23.0, 16.0, 21.0, 15.0, 5.0, 7.0, 5.0, 5.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.3125, -44.76025390625, -43.2080078125, -41.65576171875, -40.103515625, -38.55126953125, -36.9990234375, -35.44677734375, -33.89453125, -32.34228515625, -30.7900390625, -29.23779296875, -27.685546875, -26.13330078125, -24.5810546875, -23.02880859375, -21.4765625, -19.92431640625, -18.3720703125, -16.81982421875, -15.267578125, -13.71533203125, -12.1630859375, -10.61083984375, -9.05859375, -7.50634765625, -5.9541015625, -4.40185546875, -2.849609375, -1.29736328125, 0.2548828125, 1.80712890625, 3.359375, 4.91162109375, 6.4638671875, 8.01611328125, 9.568359375, 11.12060546875, 12.6728515625, 14.22509765625, 15.77734375, 17.32958984375, 18.8818359375, 20.43408203125, 21.986328125, 23.53857421875, 25.0908203125, 26.64306640625, 28.1953125, 29.74755859375, 31.2998046875, 32.85205078125, 34.404296875, 35.95654296875, 37.5087890625, 39.06103515625, 40.61328125, 42.16552734375, 43.7177734375, 45.27001953125, 46.822265625, 48.37451171875, 49.9267578125, 51.47900390625, 53.03125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 5.0, 4.0, 6.0, 8.0, 4.0, 6.0, 11.0, 17.0, 18.0, 35.0, 30.0, 46.0, 75.0, 104.0, 167.0, 314.0, 511.0, 1093.0, 2575.0, 7479.0, 28768.0, 160814.0, 733403.0, 86519.0, 17684.0, 4980.0, 1854.0, 861.0, 454.0, 241.0, 139.0, 91.0, 71.0, 53.0, 31.0, 26.0, 16.0, 10.0, 11.0, 3.0, 9.0, 1.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4765625, -7.23797607421875, -6.9993896484375, -6.76080322265625, -6.522216796875, -6.28363037109375, -6.0450439453125, -5.80645751953125, -5.56787109375, -5.32928466796875, -5.0906982421875, -4.85211181640625, -4.613525390625, -4.37493896484375, -4.1363525390625, -3.89776611328125, -3.6591796875, -3.42059326171875, -3.1820068359375, -2.94342041015625, -2.704833984375, -2.46624755859375, -2.2276611328125, -1.98907470703125, -1.75048828125, -1.51190185546875, -1.2733154296875, -1.03472900390625, -0.796142578125, -0.55755615234375, -0.3189697265625, -0.08038330078125, 0.158203125, 0.39678955078125, 0.6353759765625, 0.87396240234375, 1.112548828125, 1.35113525390625, 1.5897216796875, 1.82830810546875, 2.06689453125, 2.30548095703125, 2.5440673828125, 2.78265380859375, 3.021240234375, 3.25982666015625, 3.4984130859375, 3.73699951171875, 3.9755859375, 4.21417236328125, 4.4527587890625, 4.69134521484375, 4.929931640625, 5.16851806640625, 5.4071044921875, 5.64569091796875, 5.88427734375, 6.12286376953125, 6.3614501953125, 6.60003662109375, 6.838623046875, 7.07720947265625, 7.3157958984375, 7.55438232421875, 7.79296875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 5.0, 10.0, 12.0, 10.0, 17.0, 34.0, 54.0, 70.0, 95.0, 140.0, 170.0, 121.0, 85.0, 51.0, 35.0, 23.0, 23.0, 15.0, 7.0, 7.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00484466552734375, -0.00472104549407959, -0.00459742546081543, -0.0044738054275512695, -0.004350185394287109, -0.004226565361022949, -0.004102945327758789, -0.003979325294494629, -0.0038557052612304688, -0.0037320852279663086, -0.0036084651947021484, -0.0034848451614379883, -0.003361225128173828, -0.003237605094909668, -0.003113985061645508, -0.0029903650283813477, -0.0028667449951171875, -0.0027431249618530273, -0.002619504928588867, -0.002495884895324707, -0.002372264862060547, -0.0022486448287963867, -0.0021250247955322266, -0.0020014047622680664, -0.0018777847290039062, -0.001754164695739746, -0.001630544662475586, -0.0015069246292114258, -0.0013833045959472656, -0.0012596845626831055, -0.0011360645294189453, -0.0010124444961547852, -0.000888824462890625, -0.0007652044296264648, -0.0006415843963623047, -0.0005179643630981445, -0.0003943443298339844, -0.0002707242965698242, -0.00014710426330566406, -2.3484230041503906e-05, 0.00010013580322265625, 0.0002237558364868164, 0.00034737586975097656, 0.0004709959030151367, 0.0005946159362792969, 0.000718235969543457, 0.0008418560028076172, 0.0009654760360717773, 0.0010890960693359375, 0.0012127161026000977, 0.0013363361358642578, 0.001459956169128418, 0.0015835762023925781, 0.0017071962356567383, 0.0018308162689208984, 0.0019544363021850586, 0.0020780563354492188, 0.002201676368713379, 0.002325296401977539, 0.0024489164352416992, 0.0025725364685058594, 0.0026961565017700195, 0.0028197765350341797, 0.00294339656829834, 0.0030670166015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 11.0, 4.0, 8.0, 27.0, 39.0, 54.0, 80.0, 125.0, 193.0, 382.0, 801.0, 2026.0, 7241.0, 45644.0, 723454.0, 236569.0, 24150.0, 4827.0, 1525.0, 609.0, 303.0, 193.0, 90.0, 72.0, 49.0, 29.0, 15.0, 14.0, 10.0, 5.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.454345703125, -9.16650390625, -8.878662109375, -8.5908203125, -8.302978515625, -8.01513671875, -7.727294921875, -7.439453125, -7.151611328125, -6.86376953125, -6.575927734375, -6.2880859375, -6.000244140625, -5.71240234375, -5.424560546875, -5.13671875, -4.848876953125, -4.56103515625, -4.273193359375, -3.9853515625, -3.697509765625, -3.40966796875, -3.121826171875, -2.833984375, -2.546142578125, -2.25830078125, -1.970458984375, -1.6826171875, -1.394775390625, -1.10693359375, -0.819091796875, -0.53125, -0.243408203125, 0.04443359375, 0.332275390625, 0.6201171875, 0.907958984375, 1.19580078125, 1.483642578125, 1.771484375, 2.059326171875, 2.34716796875, 2.635009765625, 2.9228515625, 3.210693359375, 3.49853515625, 3.786376953125, 4.07421875, 4.362060546875, 4.64990234375, 4.937744140625, 5.2255859375, 5.513427734375, 5.80126953125, 6.089111328125, 6.376953125, 6.664794921875, 6.95263671875, 7.240478515625, 7.5283203125, 7.816162109375, 8.10400390625, 8.391845703125, 8.6796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 12.0, 16.0, 13.0, 25.0, 18.0, 33.0, 40.0, 53.0, 66.0, 89.0, 100.0, 78.0, 96.0, 84.0, 55.0, 42.0, 28.0, 27.0, 24.0, 16.0, 14.0, 13.0, 8.0, 8.0, 6.0, 5.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.87890625, -6.63433837890625, -6.3897705078125, -6.14520263671875, -5.900634765625, -5.65606689453125, -5.4114990234375, -5.16693115234375, -4.92236328125, -4.67779541015625, -4.4332275390625, -4.18865966796875, -3.944091796875, -3.69952392578125, -3.4549560546875, -3.21038818359375, -2.9658203125, -2.72125244140625, -2.4766845703125, -2.23211669921875, -1.987548828125, -1.74298095703125, -1.4984130859375, -1.25384521484375, -1.00927734375, -0.76470947265625, -0.5201416015625, -0.27557373046875, -0.031005859375, 0.21356201171875, 0.4581298828125, 0.70269775390625, 0.947265625, 1.19183349609375, 1.4364013671875, 1.68096923828125, 1.925537109375, 2.17010498046875, 2.4146728515625, 2.65924072265625, 2.90380859375, 3.14837646484375, 3.3929443359375, 3.63751220703125, 3.882080078125, 4.12664794921875, 4.3712158203125, 4.61578369140625, 4.8603515625, 5.10491943359375, 5.3494873046875, 5.59405517578125, 5.838623046875, 6.08319091796875, 6.3277587890625, 6.57232666015625, 6.81689453125, 7.06146240234375, 7.3060302734375, 7.55059814453125, 7.795166015625, 8.03973388671875, 8.2843017578125, 8.52886962890625, 8.7734375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 18.0, 41.0, 144.0, 523.0, 160.0, 75.0, 22.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-471.956787109375, -458.6495666503906, -445.3423767089844, -432.03515625, -418.7279357910156, -405.42071533203125, -392.113525390625, -378.8063049316406, -365.49908447265625, -352.1918640136719, -338.8846740722656, -325.57745361328125, -312.2702331542969, -298.9630126953125, -285.65582275390625, -272.3486022949219, -259.0414123535156, -245.7342071533203, -232.42698669433594, -219.11978149414062, -205.81256103515625, -192.50535583496094, -179.19815063476562, -165.89093017578125, -152.58372497558594, -139.27651977539062, -125.96929931640625, -112.66209411621094, -99.3548812866211, -86.04766845703125, -72.74046325683594, -59.433250427246094, -46.126007080078125, -32.81879425048828, -19.511585235595703, -6.204376220703125, 7.102836608886719, 20.410049438476562, 33.717254638671875, 47.02446746826172, 60.33168029785156, 73.6388931274414, 86.94610595703125, 100.25331115722656, 113.5605239868164, 126.86773681640625, 140.17494201660156, 153.48214721679688, 166.78936767578125, 180.09657287597656, 193.40379333496094, 206.71099853515625, 220.01821899414062, 233.32542419433594, 246.63262939453125, 259.9398498535156, 273.2470703125, 286.5542907714844, 299.8614807128906, 313.168701171875, 326.4759216308594, 339.78314208984375, 353.09033203125, 366.3975524902344, 379.7047424316406]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 7.0, 10.0, 10.0, 8.0, 15.0, 16.0, 33.0, 22.0, 23.0, 20.0, 34.0, 40.0, 40.0, 72.0, 160.0, 136.0, 57.0, 43.0, 22.0, 42.0, 34.0, 28.0, 18.0, 17.0, 20.0, 8.0, 13.0, 13.0, 3.0, 4.0, 2.0, 4.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.516357421875, -138.53173828125, -133.547119140625, -128.5625, -123.577880859375, -118.59326171875, -113.608642578125, -108.6240234375, -103.639404296875, -98.65478515625, -93.670166015625, -88.685546875, -83.700927734375, -78.71630859375, -73.731689453125, -68.7470703125, -63.762451171875, -58.77783203125, -53.793212890625, -48.80859375, -43.823974609375, -38.83935546875, -33.854736328125, -28.8701171875, -23.885498046875, -18.90087890625, -13.916259765625, -8.931640625, -3.947021484375, 1.03759765625, 6.022216796875, 11.0068359375, 15.991439819335938, 20.976058959960938, 25.960678100585938, 30.945297241210938, 35.92991638183594, 40.91453552246094, 45.89915466308594, 50.88377380371094, 55.86839294433594, 60.85301208496094, 65.83763122558594, 70.82225036621094, 75.80686950683594, 80.79148864746094, 85.77610778808594, 90.76072692871094, 95.74534606933594, 100.72996520996094, 105.71458435058594, 110.69920349121094, 115.68382263183594, 120.66844177246094, 125.65306091308594, 130.63768005371094, 135.62229919433594, 140.60691833496094, 145.59153747558594, 150.57615661621094, 155.56077575683594, 160.54539489746094, 165.53001403808594, 170.51463317871094, 175.49925231933594]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 2.0, 8.0, 5.0, 9.0, 11.0, 11.0, 15.0, 13.0, 25.0, 32.0, 56.0, 79.0, 138.0, 210.0, 289.0, 504.0, 898.0, 1630.0, 2902.0, 5868.0, 13871.0, 43106.0, 174561.0, 723258.0, 1806043.0, 1050878.0, 273178.0, 62708.0, 18345.0, 7485.0, 3528.0, 1889.0, 1053.0, 606.0, 352.0, 211.0, 155.0, 105.0, 52.0, 50.0, 53.0, 18.0, 16.0, 22.0, 9.0, 7.0, 7.0, 6.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.25732421875, -10.8349609375, -10.41259765625, -9.990234375, -9.56787109375, -9.1455078125, -8.72314453125, -8.30078125, -7.87841796875, -7.4560546875, -7.03369140625, -6.611328125, -6.18896484375, -5.7666015625, -5.34423828125, -4.921875, -4.49951171875, -4.0771484375, -3.65478515625, -3.232421875, -2.81005859375, -2.3876953125, -1.96533203125, -1.54296875, -1.12060546875, -0.6982421875, -0.27587890625, 0.146484375, 0.56884765625, 0.9912109375, 1.41357421875, 1.8359375, 2.25830078125, 2.6806640625, 3.10302734375, 3.525390625, 3.94775390625, 4.3701171875, 4.79248046875, 5.21484375, 5.63720703125, 6.0595703125, 6.48193359375, 6.904296875, 7.32666015625, 7.7490234375, 8.17138671875, 8.59375, 9.01611328125, 9.4384765625, 9.86083984375, 10.283203125, 10.70556640625, 11.1279296875, 11.55029296875, 11.97265625, 12.39501953125, 12.8173828125, 13.23974609375, 13.662109375, 14.08447265625, 14.5068359375, 14.92919921875, 15.3515625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 4.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 5.0, 12.0, 13.0, 11.0, 23.0, 15.0, 18.0, 23.0, 34.0, 41.0, 36.0, 26.0, 39.0, 31.0, 36.0, 37.0, 37.0, 39.0, 31.0, 42.0, 43.0, 32.0, 37.0, 38.0, 33.0, 26.0, 31.0, 31.0, 21.0, 25.0, 24.0, 16.0, 14.0, 9.0, 10.0, 11.0, 6.0, 5.0, 6.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.9453125, -8.65771484375, -8.3701171875, -8.08251953125, -7.794921875, -7.50732421875, -7.2197265625, -6.93212890625, -6.64453125, -6.35693359375, -6.0693359375, -5.78173828125, -5.494140625, -5.20654296875, -4.9189453125, -4.63134765625, -4.34375, -4.05615234375, -3.7685546875, -3.48095703125, -3.193359375, -2.90576171875, -2.6181640625, -2.33056640625, -2.04296875, -1.75537109375, -1.4677734375, -1.18017578125, -0.892578125, -0.60498046875, -0.3173828125, -0.02978515625, 0.2578125, 0.54541015625, 0.8330078125, 1.12060546875, 1.408203125, 1.69580078125, 1.9833984375, 2.27099609375, 2.55859375, 2.84619140625, 3.1337890625, 3.42138671875, 3.708984375, 3.99658203125, 4.2841796875, 4.57177734375, 4.859375, 5.14697265625, 5.4345703125, 5.72216796875, 6.009765625, 6.29736328125, 6.5849609375, 6.87255859375, 7.16015625, 7.44775390625, 7.7353515625, 8.02294921875, 8.310546875, 8.59814453125, 8.8857421875, 9.17333984375, 9.4609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 9.0, 17.0, 10.0, 36.0, 41.0, 83.0, 167.0, 273.0, 631.0, 1751.0, 9736.0, 2717849.0, 1452270.0, 8533.0, 1577.0, 652.0, 291.0, 153.0, 78.0, 46.0, 39.0, 15.0, 14.0, 9.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.5625, -76.10546875, -73.6484375, -71.19140625, -68.734375, -66.27734375, -63.8203125, -61.36328125, -58.90625, -56.44921875, -53.9921875, -51.53515625, -49.078125, -46.62109375, -44.1640625, -41.70703125, -39.25, -36.79296875, -34.3359375, -31.87890625, -29.421875, -26.96484375, -24.5078125, -22.05078125, -19.59375, -17.13671875, -14.6796875, -12.22265625, -9.765625, -7.30859375, -4.8515625, -2.39453125, 0.0625, 2.51953125, 4.9765625, 7.43359375, 9.890625, 12.34765625, 14.8046875, 17.26171875, 19.71875, 22.17578125, 24.6328125, 27.08984375, 29.546875, 32.00390625, 34.4609375, 36.91796875, 39.375, 41.83203125, 44.2890625, 46.74609375, 49.203125, 51.66015625, 54.1171875, 56.57421875, 59.03125, 61.48828125, 63.9453125, 66.40234375, 68.859375, 71.31640625, 73.7734375, 76.23046875, 78.6875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 14.0, 13.0, 14.0, 31.0, 63.0, 76.0, 116.0, 200.0, 360.0, 711.0, 938.0, 633.0, 354.0, 196.0, 129.0, 74.0, 59.0, 39.0, 13.0, 16.0, 8.0, 7.0, 7.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.625, -36.19677734375, -34.7685546875, -33.34033203125, -31.912109375, -30.48388671875, -29.0556640625, -27.62744140625, -26.19921875, -24.77099609375, -23.3427734375, -21.91455078125, -20.486328125, -19.05810546875, -17.6298828125, -16.20166015625, -14.7734375, -13.34521484375, -11.9169921875, -10.48876953125, -9.060546875, -7.63232421875, -6.2041015625, -4.77587890625, -3.34765625, -1.91943359375, -0.4912109375, 0.93701171875, 2.365234375, 3.79345703125, 5.2216796875, 6.64990234375, 8.078125, 9.50634765625, 10.9345703125, 12.36279296875, 13.791015625, 15.21923828125, 16.6474609375, 18.07568359375, 19.50390625, 20.93212890625, 22.3603515625, 23.78857421875, 25.216796875, 26.64501953125, 28.0732421875, 29.50146484375, 30.9296875, 32.35791015625, 33.7861328125, 35.21435546875, 36.642578125, 38.07080078125, 39.4990234375, 40.92724609375, 42.35546875, 43.78369140625, 45.2119140625, 46.64013671875, 48.068359375, 49.49658203125, 50.9248046875, 52.35302734375, 53.78125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 9.0, 42.0, 151.0, 372.0, 272.0, 91.0, 31.0, 11.0, 11.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-376.2508544921875, -350.451171875, -324.6514892578125, -298.8518371582031, -273.0521545410156, -247.25247192382812, -221.4528045654297, -195.65313720703125, -169.85345458984375, -144.05377197265625, -118.25410461425781, -92.45442962646484, -66.65475463867188, -40.855072021484375, -15.055404663085938, 10.7442626953125, 36.5439453125, 62.34362030029297, 88.14329528808594, 113.9429702758789, 139.74264526367188, 165.54232788085938, 191.3419952392578, 217.14166259765625, 242.94134521484375, 268.74102783203125, 294.54071044921875, 320.3403625488281, 346.1400451660156, 371.9397277832031, 397.7393798828125, 423.5390625, 449.3387451171875, 475.138427734375, 500.9381103515625, 526.73779296875, 552.5374755859375, 578.337158203125, 604.1367797851562, 629.9364624023438, 655.7361450195312, 681.5358276367188, 707.3355102539062, 733.1351928710938, 758.934814453125, 784.7344970703125, 810.5341796875, 836.3338623046875, 862.133544921875, 887.9332275390625, 913.73291015625, 939.5325927734375, 965.332275390625, 991.1319580078125, 1016.9315795898438, 1042.731201171875, 1068.531005859375, 1094.3306884765625, 1120.13037109375, 1145.9300537109375, 1171.729736328125, 1197.5294189453125, 1223.3291015625, 1249.128662109375, 1274.9283447265625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 3.0, 6.0, 5.0, 7.0, 11.0, 5.0, 25.0, 18.0, 19.0, 32.0, 31.0, 46.0, 39.0, 42.0, 54.0, 48.0, 53.0, 67.0, 65.0, 80.0, 66.0, 47.0, 56.0, 38.0, 38.0, 22.0, 24.0, 16.0, 18.0, 6.0, 4.0, 8.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-238.57244873046875, -231.09690856933594, -223.62136840820312, -216.1458282470703, -208.6702880859375, -201.1947479248047, -193.71920776367188, -186.24366760253906, -178.76812744140625, -171.29258728027344, -163.81704711914062, -156.3415069580078, -148.865966796875, -141.3904266357422, -133.91488647460938, -126.43934631347656, -118.96380615234375, -111.48826599121094, -104.01272583007812, -96.53718566894531, -89.0616455078125, -81.58610534667969, -74.11056518554688, -66.63502502441406, -59.15948486328125, -51.68394470214844, -44.208404541015625, -36.73286437988281, -29.25732421875, -21.781784057617188, -14.306243896484375, -6.8307037353515625, 0.64483642578125, 8.120376586914062, 15.595916748046875, 23.071456909179688, 30.5469970703125, 38.02253723144531, 45.498077392578125, 52.97361755371094, 60.44915771484375, 67.92469787597656, 75.40023803710938, 82.87577819824219, 90.351318359375, 97.82685852050781, 105.30239868164062, 112.77793884277344, 120.25347900390625, 127.72901916503906, 135.20455932617188, 142.6800994873047, 150.1556396484375, 157.6311798095703, 165.10671997070312, 172.58226013183594, 180.05780029296875, 187.53334045410156, 195.00888061523438, 202.4844207763672, 209.9599609375, 217.4355010986328, 224.91104125976562, 232.38658142089844, 239.86212158203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 12.0, 11.0, 25.0, 31.0, 57.0, 85.0, 182.0, 309.0, 684.0, 1351.0, 3375.0, 8797.0, 28118.0, 142457.0, 728633.0, 99677.0, 22073.0, 7310.0, 2886.0, 1198.0, 610.0, 296.0, 147.0, 98.0, 52.0, 28.0, 20.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.640625, -28.72607421875, -27.8115234375, -26.89697265625, -25.982421875, -25.06787109375, -24.1533203125, -23.23876953125, -22.32421875, -21.40966796875, -20.4951171875, -19.58056640625, -18.666015625, -17.75146484375, -16.8369140625, -15.92236328125, -15.0078125, -14.09326171875, -13.1787109375, -12.26416015625, -11.349609375, -10.43505859375, -9.5205078125, -8.60595703125, -7.69140625, -6.77685546875, -5.8623046875, -4.94775390625, -4.033203125, -3.11865234375, -2.2041015625, -1.28955078125, -0.375, 0.53955078125, 1.4541015625, 2.36865234375, 3.283203125, 4.19775390625, 5.1123046875, 6.02685546875, 6.94140625, 7.85595703125, 8.7705078125, 9.68505859375, 10.599609375, 11.51416015625, 12.4287109375, 13.34326171875, 14.2578125, 15.17236328125, 16.0869140625, 17.00146484375, 17.916015625, 18.83056640625, 19.7451171875, 20.65966796875, 21.57421875, 22.48876953125, 23.4033203125, 24.31787109375, 25.232421875, 26.14697265625, 27.0615234375, 27.97607421875, 28.890625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 6.0, 10.0, 21.0, 20.0, 29.0, 29.0, 27.0, 32.0, 50.0, 50.0, 57.0, 64.0, 63.0, 59.0, 62.0, 73.0, 56.0, 55.0, 48.0, 49.0, 30.0, 22.0, 28.0, 14.0, 14.0, 7.0, 7.0, 6.0, 3.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.9814453125, -19.447265625, -18.9130859375, -18.37890625, -17.8447265625, -17.310546875, -16.7763671875, -16.2421875, -15.7080078125, -15.173828125, -14.6396484375, -14.10546875, -13.5712890625, -13.037109375, -12.5029296875, -11.96875, -11.4345703125, -10.900390625, -10.3662109375, -9.83203125, -9.2978515625, -8.763671875, -8.2294921875, -7.6953125, -7.1611328125, -6.626953125, -6.0927734375, -5.55859375, -5.0244140625, -4.490234375, -3.9560546875, -3.421875, -2.8876953125, -2.353515625, -1.8193359375, -1.28515625, -0.7509765625, -0.216796875, 0.3173828125, 0.8515625, 1.3857421875, 1.919921875, 2.4541015625, 2.98828125, 3.5224609375, 4.056640625, 4.5908203125, 5.125, 5.6591796875, 6.193359375, 6.7275390625, 7.26171875, 7.7958984375, 8.330078125, 8.8642578125, 9.3984375, 9.9326171875, 10.466796875, 11.0009765625, 11.53515625, 12.0693359375, 12.603515625, 13.1376953125, 13.671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 11.0, 11.0, 11.0, 14.0, 27.0, 43.0, 47.0, 67.0, 107.0, 143.0, 220.0, 385.0, 796.0, 1817.0, 5534.0, 27298.0, 861756.0, 129288.0, 14463.0, 3542.0, 1358.0, 605.0, 345.0, 196.0, 137.0, 79.0, 62.0, 38.0, 38.0, 28.0, 16.0, 14.0, 13.0, 10.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-35.5, -34.450439453125, -33.40087890625, -32.351318359375, -31.3017578125, -30.252197265625, -29.20263671875, -28.153076171875, -27.103515625, -26.053955078125, -25.00439453125, -23.954833984375, -22.9052734375, -21.855712890625, -20.80615234375, -19.756591796875, -18.70703125, -17.657470703125, -16.60791015625, -15.558349609375, -14.5087890625, -13.459228515625, -12.40966796875, -11.360107421875, -10.310546875, -9.260986328125, -8.21142578125, -7.161865234375, -6.1123046875, -5.062744140625, -4.01318359375, -2.963623046875, -1.9140625, -0.864501953125, 0.18505859375, 1.234619140625, 2.2841796875, 3.333740234375, 4.38330078125, 5.432861328125, 6.482421875, 7.531982421875, 8.58154296875, 9.631103515625, 10.6806640625, 11.730224609375, 12.77978515625, 13.829345703125, 14.87890625, 15.928466796875, 16.97802734375, 18.027587890625, 19.0771484375, 20.126708984375, 21.17626953125, 22.225830078125, 23.275390625, 24.324951171875, 25.37451171875, 26.424072265625, 27.4736328125, 28.523193359375, 29.57275390625, 30.622314453125, 31.671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 1.0, 6.0, 12.0, 8.0, 12.0, 13.0, 16.0, 15.0, 25.0, 28.0, 37.0, 42.0, 54.0, 65.0, 85.0, 99.0, 93.0, 92.0, 60.0, 36.0, 31.0, 27.0, 27.0, 19.0, 14.0, 18.0, 14.0, 15.0, 8.0, 8.0, 7.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.875, -48.9736328125, -47.072265625, -45.1708984375, -43.26953125, -41.3681640625, -39.466796875, -37.5654296875, -35.6640625, -33.7626953125, -31.861328125, -29.9599609375, -28.05859375, -26.1572265625, -24.255859375, -22.3544921875, -20.453125, -18.5517578125, -16.650390625, -14.7490234375, -12.84765625, -10.9462890625, -9.044921875, -7.1435546875, -5.2421875, -3.3408203125, -1.439453125, 0.4619140625, 2.36328125, 4.2646484375, 6.166015625, 8.0673828125, 9.96875, 11.8701171875, 13.771484375, 15.6728515625, 17.57421875, 19.4755859375, 21.376953125, 23.2783203125, 25.1796875, 27.0810546875, 28.982421875, 30.8837890625, 32.78515625, 34.6865234375, 36.587890625, 38.4892578125, 40.390625, 42.2919921875, 44.193359375, 46.0947265625, 47.99609375, 49.8974609375, 51.798828125, 53.7001953125, 55.6015625, 57.5029296875, 59.404296875, 61.3056640625, 63.20703125, 65.1083984375, 67.009765625, 68.9111328125, 70.8125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 5.0, 15.0, 14.0, 28.0, 37.0, 72.0, 123.0, 288.0, 661.0, 2326.0, 14489.0, 904470.0, 116291.0, 7214.0, 1507.0, 502.0, 222.0, 123.0, 48.0, 36.0, 22.0, 15.0, 10.0, 5.0, 5.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.8984375, -13.5211181640625, -13.143798828125, -12.7664794921875, -12.38916015625, -12.0118408203125, -11.634521484375, -11.2572021484375, -10.8798828125, -10.5025634765625, -10.125244140625, -9.7479248046875, -9.37060546875, -8.9932861328125, -8.615966796875, -8.2386474609375, -7.861328125, -7.4840087890625, -7.106689453125, -6.7293701171875, -6.35205078125, -5.9747314453125, -5.597412109375, -5.2200927734375, -4.8427734375, -4.4654541015625, -4.088134765625, -3.7108154296875, -3.33349609375, -2.9561767578125, -2.578857421875, -2.2015380859375, -1.82421875, -1.4468994140625, -1.069580078125, -0.6922607421875, -0.31494140625, 0.0623779296875, 0.439697265625, 0.8170166015625, 1.1943359375, 1.5716552734375, 1.948974609375, 2.3262939453125, 2.70361328125, 3.0809326171875, 3.458251953125, 3.8355712890625, 4.212890625, 4.5902099609375, 4.967529296875, 5.3448486328125, 5.72216796875, 6.0994873046875, 6.476806640625, 6.8541259765625, 7.2314453125, 7.6087646484375, 7.986083984375, 8.3634033203125, 8.74072265625, 9.1180419921875, 9.495361328125, 9.8726806640625, 10.25]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 12.0, 20.0, 20.0, 39.0, 69.0, 172.0, 278.0, 178.0, 79.0, 42.0, 26.0, 11.0, 16.0, 6.0, 7.0, 6.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034427642822265625, -0.003290146589279175, -0.003137528896331787, -0.0029849112033843994, -0.0028322935104370117, -0.002679675817489624, -0.0025270581245422363, -0.0023744404315948486, -0.002221822738647461, -0.0020692050457000732, -0.0019165873527526855, -0.0017639696598052979, -0.0016113519668579102, -0.0014587342739105225, -0.0013061165809631348, -0.001153498888015747, -0.0010008811950683594, -0.0008482635021209717, -0.000695645809173584, -0.0005430281162261963, -0.0003904104232788086, -0.0002377927303314209, -8.51750373840332e-05, 6.744265556335449e-05, 0.0002200603485107422, 0.0003726780414581299, 0.0005252957344055176, 0.0006779134273529053, 0.000830531120300293, 0.0009831488132476807, 0.0011357665061950684, 0.001288384199142456, 0.0014410018920898438, 0.0015936195850372314, 0.0017462372779846191, 0.0018988549709320068, 0.0020514726638793945, 0.0022040903568267822, 0.00235670804977417, 0.0025093257427215576, 0.0026619434356689453, 0.002814561128616333, 0.0029671788215637207, 0.0031197965145111084, 0.003272414207458496, 0.003425031900405884, 0.0035776495933532715, 0.003730267286300659, 0.003882884979248047, 0.004035502672195435, 0.004188120365142822, 0.00434073805809021, 0.004493355751037598, 0.004645973443984985, 0.004798591136932373, 0.004951208829879761, 0.0051038265228271484, 0.005256444215774536, 0.005409061908721924, 0.0055616796016693115, 0.005714297294616699, 0.005866914987564087, 0.006019532680511475, 0.006172150373458862, 0.00632476806640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 13.0, 17.0, 21.0, 30.0, 55.0, 94.0, 206.0, 436.0, 1072.0, 3553.0, 15336.0, 168904.0, 828488.0, 23229.0, 4741.0, 1367.0, 508.0, 210.0, 116.0, 59.0, 29.0, 21.0, 18.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.890625, -5.6463623046875, -5.402099609375, -5.1578369140625, -4.91357421875, -4.6693115234375, -4.425048828125, -4.1807861328125, -3.9365234375, -3.6922607421875, -3.447998046875, -3.2037353515625, -2.95947265625, -2.7152099609375, -2.470947265625, -2.2266845703125, -1.982421875, -1.7381591796875, -1.493896484375, -1.2496337890625, -1.00537109375, -0.7611083984375, -0.516845703125, -0.2725830078125, -0.0283203125, 0.2159423828125, 0.460205078125, 0.7044677734375, 0.94873046875, 1.1929931640625, 1.437255859375, 1.6815185546875, 1.92578125, 2.1700439453125, 2.414306640625, 2.6585693359375, 2.90283203125, 3.1470947265625, 3.391357421875, 3.6356201171875, 3.8798828125, 4.1241455078125, 4.368408203125, 4.6126708984375, 4.85693359375, 5.1011962890625, 5.345458984375, 5.5897216796875, 5.833984375, 6.0782470703125, 6.322509765625, 6.5667724609375, 6.81103515625, 7.0552978515625, 7.299560546875, 7.5438232421875, 7.7880859375, 8.0323486328125, 8.276611328125, 8.5208740234375, 8.76513671875, 9.0093994140625, 9.253662109375, 9.4979248046875, 9.7421875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 7.0, 7.0, 9.0, 20.0, 19.0, 47.0, 73.0, 83.0, 156.0, 160.0, 141.0, 87.0, 77.0, 32.0, 27.0, 9.0, 13.0, 9.0, 6.0, 2.0, 4.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.21942138671875, -6.9349365234375, -6.65045166015625, -6.365966796875, -6.08148193359375, -5.7969970703125, -5.51251220703125, -5.22802734375, -4.94354248046875, -4.6590576171875, -4.37457275390625, -4.090087890625, -3.80560302734375, -3.5211181640625, -3.23663330078125, -2.9521484375, -2.66766357421875, -2.3831787109375, -2.09869384765625, -1.814208984375, -1.52972412109375, -1.2452392578125, -0.96075439453125, -0.67626953125, -0.39178466796875, -0.1072998046875, 0.17718505859375, 0.461669921875, 0.74615478515625, 1.0306396484375, 1.31512451171875, 1.599609375, 1.88409423828125, 2.1685791015625, 2.45306396484375, 2.737548828125, 3.02203369140625, 3.3065185546875, 3.59100341796875, 3.87548828125, 4.15997314453125, 4.4444580078125, 4.72894287109375, 5.013427734375, 5.29791259765625, 5.5823974609375, 5.86688232421875, 6.1513671875, 6.43585205078125, 6.7203369140625, 7.00482177734375, 7.289306640625, 7.57379150390625, 7.8582763671875, 8.14276123046875, 8.42724609375, 8.71173095703125, 8.9962158203125, 9.28070068359375, 9.565185546875, 9.84967041015625, 10.1341552734375, 10.41864013671875, 10.703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 9.0, 9.0, 20.0, 40.0, 72.0, 109.0, 518.0, 96.0, 56.0, 31.0, 15.0, 11.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-342.2680969238281, -334.751220703125, -327.23431396484375, -319.7174377441406, -312.2005310058594, -304.68365478515625, -297.166748046875, -289.6498718261719, -282.13299560546875, -274.6161193847656, -267.0992126464844, -259.58233642578125, -252.0654296875, -244.54855346679688, -237.0316619873047, -229.5147705078125, -221.99786376953125, -214.48097229003906, -206.96408081054688, -199.4471893310547, -191.9302978515625, -184.41342163085938, -176.8965301513672, -169.379638671875, -161.8627471923828, -154.34585571289062, -146.82896423339844, -139.31207275390625, -131.79519653320312, -124.2782974243164, -116.76141357421875, -109.24452209472656, -101.72763061523438, -94.21073913574219, -86.69384765625, -79.17696380615234, -71.66007232666016, -64.14318084716797, -56.62629318237305, -49.109405517578125, -41.59251403808594, -34.07562255859375, -26.558734893798828, -19.041845321655273, -11.524955749511719, -4.008064270019531, 3.5088233947753906, 11.025711059570312, 18.5426025390625, 26.059492111206055, 33.57638168334961, 41.09326934814453, 48.61016082763672, 56.127052307128906, 63.64393997192383, 71.16082763671875, 78.67771911621094, 86.19461059570312, 93.71150207519531, 101.22838592529297, 108.74527740478516, 116.26216888427734, 123.779052734375, 131.2959442138672, 138.81283569335938]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 11.0, 11.0, 6.0, 11.0, 8.0, 14.0, 13.0, 19.0, 17.0, 16.0, 23.0, 18.0, 25.0, 28.0, 33.0, 148.0, 268.0, 86.0, 26.0, 24.0, 22.0, 21.0, 24.0, 15.0, 13.0, 13.0, 9.0, 13.0, 9.0, 9.0, 5.0, 3.0, 7.0, 7.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-133.6512451171875, -129.50686645507812, -125.36248016357422, -121.21809387207031, -117.07371520996094, -112.92932891845703, -108.78494262695312, -104.64056396484375, -100.49617767333984, -96.35179138183594, -92.20741271972656, -88.06302642822266, -83.91864013671875, -79.77426147460938, -75.62987518310547, -71.48548889160156, -67.34111022949219, -63.19672775268555, -59.052345275878906, -54.907958984375, -50.76357650756836, -46.61919403076172, -42.47480773925781, -38.33042526245117, -34.18604278564453, -30.04166030883789, -25.897275924682617, -21.752891540527344, -17.608509063720703, -13.464126586914062, -9.319742202758789, -5.175357818603516, -1.030975341796875, 3.113408088684082, 7.257791519165039, 11.402174949645996, 15.546558380126953, 19.690940856933594, 23.835325241088867, 27.97970962524414, 32.12409210205078, 36.26847457885742, 40.41285705566406, 44.55724334716797, 48.70162582397461, 52.84600830078125, 56.990394592285156, 61.1347770690918, 65.27915954589844, 69.42354583740234, 73.56792449951172, 77.71231079101562, 81.856689453125, 86.0010757446289, 90.14546203613281, 94.28984069824219, 98.4342269897461, 102.57861328125, 106.72299194335938, 110.86737823486328, 115.01176452636719, 119.15614318847656, 123.30052947998047, 127.44491577148438, 131.58929443359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 6.0, 9.0, 3.0, 8.0, 9.0, 9.0, 19.0, 12.0, 24.0, 19.0, 20.0, 34.0, 31.0, 31.0, 53.0, 206.0, 148.0, 59.0, 35.0, 42.0, 36.0, 31.0, 24.0, 24.0, 13.0, 14.0, 13.0, 16.0, 9.0, 9.0, 8.0, 4.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5390625, -11.1663818359375, -10.793701171875, -10.4210205078125, -10.04833984375, -9.6756591796875, -9.302978515625, -8.9302978515625, -8.5576171875, -8.1849365234375, -7.812255859375, -7.4395751953125, -7.06689453125, -6.6942138671875, -6.321533203125, -5.9488525390625, -5.576171875, -5.2034912109375, -4.830810546875, -4.4581298828125, -4.08544921875, -3.7127685546875, -3.340087890625, -2.9674072265625, -2.5947265625, -2.2220458984375, -1.849365234375, -1.4766845703125, -1.10400390625, -0.7313232421875, -0.358642578125, 0.0140380859375, 0.38671875, 0.7593994140625, 1.132080078125, 1.5047607421875, 1.87744140625, 2.2501220703125, 2.622802734375, 2.9954833984375, 3.3681640625, 3.7408447265625, 4.113525390625, 4.4862060546875, 4.85888671875, 5.2315673828125, 5.604248046875, 5.9769287109375, 6.349609375, 6.7222900390625, 7.094970703125, 7.4676513671875, 7.84033203125, 8.2130126953125, 8.585693359375, 8.9583740234375, 9.3310546875, 9.7037353515625, 10.076416015625, 10.4490966796875, 10.82177734375, 11.1944580078125, 11.567138671875, 11.9398193359375, 12.3125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 17.0, 12.0, 16.0, 19.0, 25.0, 32.0, 54.0, 113.0, 202.0, 503.0, 1439.0, 6230.0, 8268120.0, 105079.0, 4657.0, 1167.0, 396.0, 191.0, 104.0, 52.0, 24.0, 19.0, 13.0, 30.0, 12.0, 10.0, 7.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-113.7357406616211, -109.80189514160156, -105.86804962158203, -101.9342041015625, -98.0003662109375, -94.06652069091797, -90.13267517089844, -86.1988296508789, -82.26498413085938, -78.33113861083984, -74.39729309082031, -70.46345520019531, -66.52960968017578, -62.59576416015625, -58.66191864013672, -54.72807312011719, -50.79423522949219, -46.860389709472656, -42.92654800415039, -38.99270248413086, -35.058860778808594, -31.125015258789062, -27.19116973876953, -23.257326126098633, -19.323482513427734, -15.389638900756836, -11.455794334411621, -7.521949768066406, -3.588106155395508, 0.3457374572753906, 4.279582977294922, 8.21342658996582, 12.147262573242188, 16.081106185913086, 20.014949798583984, 23.948795318603516, 27.882638931274414, 31.816482543945312, 35.750328063964844, 39.684173583984375, 43.61801528930664, 47.55186080932617, 51.48570251464844, 55.41954803466797, 59.3533935546875, 63.287235260009766, 67.22108459472656, 71.15492248535156, 75.0887680053711, 79.02261352539062, 82.95645904541016, 86.89030456542969, 90.82414245605469, 94.75798797607422, 98.69183349609375, 102.62567901611328, 106.55952453613281, 110.49337005615234, 114.42721557617188, 118.36105346679688, 122.2948989868164, 126.22874450683594, 130.16259765625, 134.096435546875, 138.0302734375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 7.0, 5.0, 5.0, 5.0, 5.0, 4.0, 5.0, 3.0, 7.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.32476043701172, -70.30366516113281, -67.28257751464844, -64.26148223876953, -61.24039077758789, -58.21929931640625, -55.198204040527344, -52.1771125793457, -49.15602111816406, -46.13492965698242, -43.113834381103516, -40.092742919921875, -37.071651458740234, -34.050559997558594, -31.029464721679688, -28.008373260498047, -24.98727798461914, -21.966184616088867, -18.945093154907227, -15.923999786376953, -12.902907371520996, -9.881814956665039, -6.860721588134766, -3.839630126953125, -0.8185367584228516, 2.2025558948516846, 5.223648548126221, 8.244741439819336, 11.265833854675293, 14.28692626953125, 17.308019638061523, 20.329111099243164, 23.350204467773438, 26.37129783630371, 29.39238929748535, 32.413482666015625, 35.434574127197266, 38.455665588378906, 41.47676086425781, 44.49785232543945, 47.518943786621094, 50.540035247802734, 53.56113052368164, 56.58222198486328, 59.60331344604492, 62.62440490722656, 65.64550018310547, 68.66659545898438, 71.68768310546875, 74.70877838134766, 77.72986602783203, 80.75096130371094, 83.77205657958984, 86.79314422607422, 89.81423950195312, 92.8353271484375, 95.85643005371094, 98.87752532958984, 101.89861297607422, 104.91970825195312, 107.94080352783203, 110.9618911743164, 113.98298645019531, 117.00407409667969, 120.0251693725586]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 4.0, 5.0, 15.0, 20.0, 32.0, 44.0, 53.0, 118.0, 184.0, 327.0, 645.0, 1374.0, 3321.0, 9150.0, 29376.0, 109557.0, 241145.0, 91649.0, 24283.0, 7782.0, 2773.0, 1140.0, 542.0, 276.0, 144.0, 105.0, 59.0, 46.0, 30.0, 25.0, 8.0, 10.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-97.1875, -93.994140625, -90.80078125, -87.607421875, -84.4140625, -81.220703125, -78.02734375, -74.833984375, -71.640625, -68.447265625, -65.25390625, -62.060546875, -58.8671875, -55.673828125, -52.48046875, -49.287109375, -46.09375, -42.900390625, -39.70703125, -36.513671875, -33.3203125, -30.126953125, -26.93359375, -23.740234375, -20.546875, -17.353515625, -14.16015625, -10.966796875, -7.7734375, -4.580078125, -1.38671875, 1.806640625, 5.0, 8.193359375, 11.38671875, 14.580078125, 17.7734375, 20.966796875, 24.16015625, 27.353515625, 30.546875, 33.740234375, 36.93359375, 40.126953125, 43.3203125, 46.513671875, 49.70703125, 52.900390625, 56.09375, 59.287109375, 62.48046875, 65.673828125, 68.8671875, 72.060546875, 75.25390625, 78.447265625, 81.640625, 84.833984375, 88.02734375, 91.220703125, 94.4140625, 97.607421875, 100.80078125, 103.994140625, 107.1875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 7.0, 4.0, 8.0, 17.0, 18.0, 13.0, 30.0, 39.0, 56.0, 68.0, 76.0, 73.0, 82.0, 82.0, 76.0, 61.0, 72.0, 42.0, 38.0, 32.0, 27.0, 26.0, 11.0, 11.0, 9.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-21.921875, -21.378173828125, -20.83447265625, -20.290771484375, -19.7470703125, -19.203369140625, -18.65966796875, -18.115966796875, -17.572265625, -17.028564453125, -16.48486328125, -15.941162109375, -15.3974609375, -14.853759765625, -14.31005859375, -13.766357421875, -13.22265625, -12.678955078125, -12.13525390625, -11.591552734375, -11.0478515625, -10.504150390625, -9.96044921875, -9.416748046875, -8.873046875, -8.329345703125, -7.78564453125, -7.241943359375, -6.6982421875, -6.154541015625, -5.61083984375, -5.067138671875, -4.5234375, -3.979736328125, -3.43603515625, -2.892333984375, -2.3486328125, -1.804931640625, -1.26123046875, -0.717529296875, -0.173828125, 0.369873046875, 0.91357421875, 1.457275390625, 2.0009765625, 2.544677734375, 3.08837890625, 3.632080078125, 4.17578125, 4.719482421875, 5.26318359375, 5.806884765625, 6.3505859375, 6.894287109375, 7.43798828125, 7.981689453125, 8.525390625, 9.069091796875, 9.61279296875, 10.156494140625, 10.7001953125, 11.243896484375, 11.78759765625, 12.331298828125, 12.875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 12.0, 10.0, 29.0, 45.0, 60.0, 71.0, 55.0, 54.0, 33.0, 26.0, 18.0, 7.0, 7.0, 7.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-70.97396850585938, -68.40577697753906, -65.83759307861328, -63.26940155029297, -60.70121383666992, -58.133026123046875, -55.56483459472656, -52.996646881103516, -50.42845916748047, -47.86027145385742, -45.29207992553711, -42.72389221191406, -40.155704498291016, -37.58751678466797, -35.019325256347656, -32.45113754272461, -29.882946014404297, -27.314756393432617, -24.74656867980957, -22.17837905883789, -19.610191345214844, -17.042001724243164, -14.473812103271484, -11.905624389648438, -9.337434768676758, -6.7692461013793945, -4.201056957244873, -1.6328678131103516, 0.9353208541870117, 3.503509521484375, 6.071699142456055, 8.639886856079102, 11.208076477050781, 13.776265144348145, 16.344453811645508, 18.912643432617188, 21.480831146240234, 24.049020767211914, 26.617210388183594, 29.18539810180664, 31.75358772277832, 34.32177734375, 36.88996505737305, 39.458152770996094, 42.026344299316406, 44.59453201293945, 47.1627197265625, 49.73091125488281, 52.29909896850586, 54.867286682128906, 57.43547821044922, 60.003665924072266, 62.57185363769531, 65.14004516601562, 67.70823669433594, 70.27642059326172, 72.84461212158203, 75.41280364990234, 77.98098754882812, 80.54917907714844, 83.11737060546875, 85.68555450439453, 88.25374603271484, 90.82192993164062, 93.39012145996094]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 10.0, 19.0, 25.0, 35.0, 81.0, 74.0, 69.0, 48.0, 21.0, 20.0, 9.0, 6.0, 6.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-57.83226776123047, -55.78666305541992, -53.741058349609375, -51.69545364379883, -49.64984893798828, -47.604244232177734, -45.55863952636719, -43.513038635253906, -41.467430114746094, -39.42182540893555, -37.376220703125, -35.33061599731445, -33.285011291503906, -31.23940658569336, -29.193803787231445, -27.1481990814209, -25.102596282958984, -23.056991577148438, -21.01138687133789, -18.965782165527344, -16.920177459716797, -14.874573707580566, -12.828969955444336, -10.783365249633789, -8.737760543823242, -6.692155838012695, -4.646551609039307, -2.600947380065918, -0.5553426742553711, 1.4902620315551758, 3.5358657836914062, 5.581470489501953, 7.6270751953125, 9.672679901123047, 11.718284606933594, 13.763888359069824, 15.809493064880371, 17.855098724365234, 19.90070152282715, 21.946306228637695, 23.991910934448242, 26.03751564025879, 28.083120346069336, 30.12872314453125, 32.1743278503418, 34.219932556152344, 36.26553726196289, 38.31114196777344, 40.356746673583984, 42.40235137939453, 44.44795608520508, 46.493560791015625, 48.53916549682617, 50.58477020263672, 52.63037109375, 54.67597961425781, 56.721580505371094, 58.76718521118164, 60.81278991699219, 62.858394622802734, 64.90399932861328, 66.94960021972656, 68.99520874023438, 71.04080963134766, 73.08641815185547]}, "eval/loss": 6.984083652496338, "eval/wer": 0.9473381352064607, "eval/runtime": 433.6165, "eval/samples_per_second": 6.093, "eval/steps_per_second": 1.524} \ No newline at end of file